Hex Tiled Q-Learning SAR example

The challenge in this example is implementing a Q-learning search algorithm for a search-and-rescue (SAR) agent in a hexagonally tiled environment.

[1]:
# Setup
import sys, os
from loguru import logger

# Put the sibling ``src`` directory first on the import path. The path is
# built from the current working directory, so it only resolves when the
# notebook is started from inside the examples folder.
sys.path.insert(0, os.path.join(os.getcwd(), "../src")) # run from within examples folder

# When the CI environment variable is set to any non-empty value, remove the
# handlers registered so far and log to stderr at INFO level instead.
if os.environ.get("CI", False):
    logger.remove()
    logger.add(sys.stderr, level="INFO")

# A DEBUG-level log file is always written, at a fixed path under /tmp.
logger.add("/tmp/ql.log", level='DEBUG')

# Size of the experiment, chosen through the BUILD environment variable.
BUILD: str = os.environ.get("BUILD", "")
num_trials: int
steps: int
# (num_trials, steps) for each tox environment:
#   "doctest" -> tox env specific to doctests
#   "html"    -> tox env specific to building docs
# Any other value (including unset) is normal operation.
num_trials, steps = {
    "doctest": (1, 5),
    "html": (30000, 20),
}.get(BUILD, (500000, 20))
[2]:
import numpy as np
import matplotlib.pyplot as plt
import matplotlib as mpl
from copy import copy
import itertools
[3]:
from jsim.Environment import HexEnvironment, HexDirections
from jsim.Agent import Agent
from jsim.Simulation import Simulation
from jsim.Environment.HexEnvironment.HexCoords import OffsetCoord
from jsim.Meta import State
[4]:
class QHexEnv(HexEnvironment):
    """
    Hexagonal environment carrying a random probability distribution map (PDM).

    The PDM is a sum of random gaussians and is kept in two forms: the raw
    float map ``pdm`` (read back as the reward) and a binned integer map
    ``digitized_pdm`` (used to build the discrete state handed to the agent).
    The outermost ring of cells is set to ``-1`` in both maps as a penalty.
    """

    def __init__(self, **kwargs):
        """
        Build the PDM, its digitized form and the lookup table of states.

        :param kwargs: Forwarded unchanged to ``HexEnvironment.__init__``
        """
        super().__init__(**kwargs)

        self.pdm = self._generate_pdm()
        self.n_bins = 4
        self.digitized_pdm = self._encode_pdm(n=self.n_bins)

        # The penalty ring must be written *before* the snapshot is taken.
        # Otherwise reset() restores a digitized map without the -1 border,
        # and possibly with bin values that are missing from possible_states.
        self._encode_penalty()
        self._digitized_pdm_store = np.copy(self.digitized_pdm)

        self._generate_states()

    def _generate_pdm(self, N:int=5):
        """
        Create the raw PDM as the sum of ``N`` random axis-aligned gaussians.

        Side effect: ``self._shape`` grows by two in each dimension, so calling
        this more than once keeps enlarging the grid.

        :param N: Number of gaussians to sum
        :type N: int
        :return: Array of shape ``self.shape`` holding the summed gaussians
        """
        # One extra cell on every side; _encode_penalty() later overwrites
        # that outer ring with the penalty value.
        # NOTE(review): relies on self.shape reflecting self._shape - confirm
        # against HexEnvironment.
        self._shape = (self._shape[0]+2, self._shape[1]+2)

        n_rows, n_cols = self.shape[0], self.shape[1]

        # With the default 'xy' indexing meshgrid returns arrays of shape
        # (len(second), len(first)). Passing columns first therefore gives
        # (n_rows, n_cols), matching ``pdm`` for non-square grids as well.
        x, y = np.meshgrid(np.arange(n_cols), np.arange(n_rows))

        pdm = np.zeros(self.shape)

        for _ in range(N): # Generate N gaussians
            A = max(np.random.rand()*2,1)       # amplitude, at least 1
            a = np.random.rand()*0.03           # spread along x (columns)
            b = 0                               # no x/y cross term
            c = np.random.rand()*0.03           # spread along y (rows)
            x0 = np.random.uniform(0,n_cols)    # Centre of gaussian
            y0 = np.random.uniform(0,n_rows)

            pdm += A*np.exp(-(a*(x-x0)**2+2*b*(x-x0)*(y-y0)+c*(y-y0)**2))

        return pdm

    def _encode_penalty(self):
        """
        Overwrite the outermost ring of both maps with the penalty value -1.
        """
        penalty = -1
        for grid in (self.pdm, self.digitized_pdm):
            grid[0,:] = penalty
            grid[-1,:] = penalty
            grid[:,0] = penalty
            grid[:,-1] = penalty

    def _encode_pdm(self, n: int) -> np.ndarray:
        """
        Bin the raw PDM into ``n`` equal-width levels between 0 and its maximum.

        :param n: Number of bins
        :type n: int
        :return: Integer array of the same shape as ``self.pdm`` holding the
            bin index of every cell as returned by ``np.digitize``
        :rtype: np.ndarray
        """
        peak = np.max(self.pdm)
        # linspace always yields exactly n edges; arange with a float step can
        # produce one edge too many because of rounding.
        bins = np.linspace(0, peak, n, endpoint=False)
        return np.digitize(self.pdm, bins)

    def _generate_states(self) -> None:
        """
        Enumerate every combination of digitized values over six neighbours.

        Fills ``self.possible_states``, a dict mapping a 6-tuple of digitized
        values (one per direction) to a consecutive integer index.
        """
        # Every value a neighbour can show, from the -1 penalty up to the
        # highest bin index present in the digitized map.
        levels = np.arange(-1,1+np.max(self.digitized_pdm))
        combos = np.array([g.flatten() for g in np.meshgrid(*([levels]*6))])
        pstates = np.unique(combos,axis=1)

        # NOTE: the original author measured a per-state ``np.where`` lookup
        # at about 7s for this table, against about 0.2s for this version.
        self.possible_states = {
            tuple(combo): idx for idx, combo in enumerate(pstates.transpose())
        }

    def _state_from_list(self, l):
        """
        Translate a list of neighbour values into its state index.

        :param l: Digitized values, one per member of ``HexDirections``
        :return: Index stored for that combination in ``self.possible_states``
        :raises KeyError: If the combination is not in ``self.possible_states``
        """
        assert len(l) == len(HexDirections)
        return self.possible_states[tuple(l)]

    def _evaluate_digi_position(self, pos: OffsetCoord) -> int:
        """Return the digitized PDM value at ``pos``."""
        return self.digitized_pdm[pos.row, pos.col]

    def _evaluate_position(self, pos: OffsetCoord) -> float:
        """Return the raw PDM value at ``pos``."""
        return self.pdm[pos.row, pos.col]

    def _vicinity_state(self, pos: OffsetCoord) -> int:
        """Return the state index for the digitized values around ``pos``."""
        digits = [self._evaluate_digi_position(n) for n in self.neighbors_coord(pos)]
        return self._state_from_list(digits)

    def reset(self, agent_p: OffsetCoord) -> int:
        """
        Restore the digitized map and report the state around the agent.

        The return value is a state index of the same kind that ``step``
        returns, because callers use it to index the Q-table. Returning the
        raw digitized value of the agent's own cell would not be a state.

        :param agent_p: Position the agent starts from
        :type agent_p: OffsetCoord
        :return: State index of the neighbourhood around ``agent_p``
        :rtype: int
        """
        self.digitized_pdm = np.copy(self._digitized_pdm_store)
        return self._vicinity_state(agent_p)

    def step(self, agent_s: OffsetCoord) -> tuple[int, float]:
        """
        Evaluate the agent's position and mark it as visited.

        :param agent_s: Current position of the agent
        :type agent_s: OffsetCoord
        :return: State index of the neighbourhood and the raw PDM value at
            ``agent_s`` (the reward)
        :rtype: tuple[int, float]
        """
        reward = self._evaluate_position(agent_s)
        values_at_neighbors = self._vicinity_state(agent_s)

        # A visited cell shows up as -1 in the digitized map from now on; the
        # raw map (and therefore the reward) is left untouched.
        self.digitized_pdm[agent_s.row, agent_s.col] = -1

        return values_at_neighbors, reward
[5]:
class QAgent(Agent):
    """
    Tabular Q-learning agent moving over a hexagonal grid.

    The Q-table has one row per entry of ``penv.possible_states`` and one
    column per direction (six).
    """

    def __init__(self, penv: QHexEnv = None) -> None:
        """
        :param penv: Environment whose ``possible_states`` sizes the Q-table.
            Although it defaults to ``None``, a real environment is required.
        :type penv: QHexEnv
        """
        self.state = OffsetCoord(col=0,row=0)
        self.states = []
        self.penv = penv

        self.epsilon = 1
        self.qtable = np.zeros((len(self.penv.possible_states),6))

    def policy(self, pnext_s: int) -> HexDirections:
        """
        Pick a direction epsilon-greedily for the given state.

        :param pnext_s: State index used to look up the Q-table row
        :type pnext_s: int
        :return: A random direction with probability ``epsilon``, otherwise the
            direction with the highest Q-value
        :rtype: HexDirections
        """
        # NOTE(review): reset() decays self.epsilon, but this fixed local rate
        # is what actually drives exploration - confirm which one is intended.
        epsilon = 0.2

        if np.random.uniform(0,1) < epsilon:
            idx = np.random.randint(0,6)
        else:
            idx = np.argmax(self.qtable[pnext_s])
        return HexDirections(idx)

    def step(self, pnext_s: int) -> HexDirections:
        """Return the action chosen by :meth:`policy` for state ``pnext_s``."""
        return self.policy(pnext_s)

    def learn(self, reward: float, state: int, next_state: int,  action: HexDirections) -> None:
        """
        Maximize the reward through a Q-Learning Step

        :param reward: Reward based on the probability seen from the previous action by the agent
        :type reward: float
        :param state: The state of the digitized PDM around the agent when the previous action was decided
        :type state: int
        :param next_state: The new state that the agent is in
        :type next_state: int
        :param action: The action by the agent
        :type action: HexDirections
        """
        alpha = 0.01  # learning rate
        gamma = 0.99  # discount factor

        # The reward is used as given. The policy takes the argmax of the
        # Q-table, so negating the reward here would steer the agent towards
        # the penalty cells and away from high-probability cells.
        target = reward + gamma*np.max(self.qtable[next_state])
        self.qtable[state,action] = (1 - alpha)*self.qtable[state,action] + alpha*target

    def update(self, pa: HexDirections) -> OffsetCoord:
        """
        Move the agent one cell in direction ``pa``.

        :param pa: Direction to move in
        :type pa: HexDirections
        :return: A copy of the new position
        :rtype: OffsetCoord
        :raises RuntimeError: If the agent has no ``state`` attribute
        """
        if not hasattr(self,'state'):
            logger.error(f"Reset has not been called as {hasattr(self,'state')=}")
            raise RuntimeError("QAgent.update() called before the agent state was initialised")

        self.state = QHexEnv.neighbor_coord(self.state, pa)

        return copy(self.state)

    def reset(self, ps: OffsetCoord, vicinity: int) -> tuple[HexDirections, OffsetCoord]:
        """
        Place the agent at ``ps`` and choose its first action.

        :param ps: Starting position; a copy is stored
        :type ps: OffsetCoord
        :param vicinity: State index handed to :meth:`policy` for the first action
        :type vicinity: int
        :return: The first action and the stored starting position
        :rtype: tuple[HexDirections, OffsetCoord]
        """
        # Decay by 1% per reset, never dropping below 0.01.
        self.epsilon = max(0.01, self.epsilon*0.99)
        self.state = copy(ps)
        return self.policy(vicinity), self.state
[6]:
class QSim(Simulation):
    """
    Simulation that repeatedly runs a :class:`QAgent` inside a :class:`QHexEnv`.

    Per-step data of the running trial lives in ``data_store``; a trimmed copy
    of it is kept per trial in ``long_term_ds``.
    """
    agent: QAgent
    env: QHexEnv

    def __init__(self, initial_pos=OffsetCoord(col=5,row=5)) -> None:
        """
        :param initial_pos: Position every trial starts from
        :type initial_pos: OffsetCoord
        """
        self.env = QHexEnv(psim=self)
        self.agent = QAgent(penv=self.env)

        self.initial_agent_s = initial_pos

        self.data_store = self._empty_data_store()
        self.long_term_ds = {}
        super().__init__()

    @staticmethod
    def _empty_data_store() -> dict:
        """Return a fresh per-trial store with one empty list per series."""
        return {'env_s':[],'agent_s':[],'agent_a':[],'reward':[]}

    def reset(self) -> None:
        """
        Reset environment and agent to the initial position and clear the
        per-trial data store.
        """
        self.vicinity_pdm = self.env.reset(self.initial_agent_s)
        self.agent_a, self.agent_s = self.agent.reset(copy(self.initial_agent_s),self.vicinity_pdm)
        self.data_store = self._empty_data_store()

    def trials(self, num_trials: int, max_num_steps: int):
        """
        Run ``num_trials`` trials of at most ``max_num_steps`` steps each.

        A trial ends early when an ``IndexError`` is raised (the agent left the
        grid). After every trial the total reward and the visited positions
        are stored in ``long_term_ds`` under the trial number.

        :param num_trials: Number of trials to run
        :type num_trials: int
        :param max_num_steps: Upper bound on the number of steps per trial
        :type max_num_steps: int
        """
        for i in range(num_trials):
            try:
                self.steps(max_num_steps)
                logger.debug(f"Trial = {i}/{num_trials} | Max number of steps ({max_num_steps}) reached ")
            except IndexError:
                logger.debug(f"Trial = {i}/{num_trials} | Agent went out of bounds, resetting")
            finally:
                self.data_store['total_reward'] = np.sum(self.data_store['reward'])
                logger.debug(f"Trial = {i}/{num_trials} | Total reward = {self.data_store['total_reward']:.2f}")

                # trim the data a bit to save memory
                for key in ("agent_a", "env_s", "reward"):
                    self.data_store.pop(key,None)

                self.long_term_ds[i] = copy(self.data_store)

    def steps(self, num_steps: int) -> None:
        """
        Run a single trial of up to ``num_steps`` steps.

        :param num_steps: Maximum number of steps to take
        :type num_steps: int
        :raises IndexError: When the agent moves outside the environment
        """
        self.reset()

        n_rows, n_cols = self.env.shape[0], self.env.shape[1]
        for _ in range(num_steps):
            vicinity_pdm, reward = self.env.step(self.agent_s)

            self.collect_data(vicinity_pdm, self.agent_a, self.agent_s, reward)

            agent_a = self.agent.step(vicinity_pdm)
            agent_s = self.agent.update(agent_a)

            # Valid indices run from 0 to size-1, so an index equal to the
            # size is already outside the grid.
            if agent_s.row < 0 or agent_s.col < 0:
                raise IndexError(f"Out of bounds with {agent_s} < 0")
            if agent_s.row >= n_rows or agent_s.col >= n_cols:
                raise IndexError(f"Out of bounds with {agent_s} >= {self.env.shape}")

            # ``reward`` was earned by taking the *previous* action
            # (self.agent_a) in the *previous* state (self.vicinity_pdm), so
            # that is the Q-table entry to update - not the entry of the
            # action that has only just been chosen for the new state.
            self.agent.learn(reward, self.vicinity_pdm, vicinity_pdm, self.agent_a)

            self.agent_s = agent_s
            self.agent_a = agent_a
            self.vicinity_pdm = vicinity_pdm

    def collect_data(self, env_s: int, agent_a: HexDirections, agent_s: OffsetCoord, reward: float) -> None:
        """
        Append copies of one step's values to the per-trial data store.

        :param env_s: State index reported by the environment
        :type env_s: int
        :param agent_a: Action that was current when the step was evaluated
        :type agent_a: HexDirections
        :param agent_s: Position of the agent
        :type agent_s: OffsetCoord
        :param reward: Reward reported by the environment
        :type reward: float
        """
        self.data_store['env_s'].append(copy(env_s))
        self.data_store['agent_a'].append(copy(agent_a))
        self.data_store['agent_s'].append(copy(agent_s))
        self.data_store['reward'].append(copy(reward))

[7]:
def plot(sim: QSim):
    """
    Plot the total reward per trial and the path of the best trial.

    The left axis shows ``total_reward`` against the trial number. The right
    axis draws the environment's hexagons and, on top, the positions visited
    in the trial with the highest total reward.

    :param sim: Simulation whose ``long_term_ds`` has been filled by ``trials``
    :type sim: QSim
    :raises ValueError: If ``sim.long_term_ds`` is empty
    """
    import operator

    fig, (ax1, ax2) = plt.subplots(1,2,figsize=(8, 6), dpi=80)

    # Reward over time
    epochs = list(sim.long_term_ds)
    ax1.plot(epochs, [sim.long_term_ds[ds]['total_reward'] for ds in epochs])
    ax1.set_ylabel('Total reward')
    ax1.set_xlabel('Epoch')

    # Show pdm and path
    best_ds = max(sim.long_term_ds.values(), key=operator.itemgetter('total_reward'))
    xy = [HexEnvironment.offset_to_pixel(f) for f in best_ds['agent_s']]
    x = [f.x for f in xy]
    y = [f.y for f in xy]

    # plt.get_cmap is used because matplotlib.cm.get_cmap was deprecated in
    # Matplotlib 3.7 and removed in 3.9.
    for p in sim.env.as_mpl_polygons(cmap=plt.get_cmap('gray')):
        ax2.add_patch(p)

    ax2.plot(x,y)
    ax2.scatter(x[0],y[0],label='Start')
    ax2.scatter(x[-1],y[-1],label='End')
    ax2.set_ylabel('y')
    ax2.set_xlabel('x')
    ax2.legend()
    ax2.set_aspect('equal')
    fig.tight_layout()

    # These report the module-level run configuration, not values read from ``sim``.
    logger.info(f"Number of steps: {steps}")
    logger.info(f"Number of trials: {num_trials}")
    plt.show()
[8]:
# Learn
# Build the simulation (it creates its own environment and agent), run the
# configured number of trials with the configured step limit, then plot the
# reward history and the path of the best trial.
sim = QSim()

sim.trials(num_trials,steps)

plot(sim)
2022-01-26 14:16:23.594 | DEBUG    | __main__:trials:24 - Trial = 0/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.595 | DEBUG    | __main__:trials:29 - Trial = 0/30000 | Total reward = 61.71
2022-01-26 14:16:23.598 | DEBUG    | __main__:trials:24 - Trial = 1/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.599 | DEBUG    | __main__:trials:29 - Trial = 1/30000 | Total reward = 63.20
2022-01-26 14:16:23.602 | DEBUG    | __main__:trials:24 - Trial = 2/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.603 | DEBUG    | __main__:trials:29 - Trial = 2/30000 | Total reward = 53.96
2022-01-26 14:16:23.607 | DEBUG    | __main__:trials:26 - Trial = 3/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:23.608 | DEBUG    | __main__:trials:29 - Trial = 3/30000 | Total reward = 49.04
2022-01-26 14:16:23.611 | DEBUG    | __main__:trials:24 - Trial = 4/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.611 | DEBUG    | __main__:trials:29 - Trial = 4/30000 | Total reward = 53.81
2022-01-26 14:16:23.614 | DEBUG    | __main__:trials:24 - Trial = 5/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.615 | DEBUG    | __main__:trials:29 - Trial = 5/30000 | Total reward = 47.19
2022-01-26 14:16:23.618 | DEBUG    | __main__:trials:24 - Trial = 6/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.619 | DEBUG    | __main__:trials:29 - Trial = 6/30000 | Total reward = 63.92
2022-01-26 14:16:23.622 | DEBUG    | __main__:trials:24 - Trial = 7/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.623 | DEBUG    | __main__:trials:29 - Trial = 7/30000 | Total reward = 61.05
2022-01-26 14:16:23.626 | DEBUG    | __main__:trials:24 - Trial = 8/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.628 | DEBUG    | __main__:trials:29 - Trial = 8/30000 | Total reward = 45.83
2022-01-26 14:16:23.631 | DEBUG    | __main__:trials:24 - Trial = 9/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.632 | DEBUG    | __main__:trials:29 - Trial = 9/30000 | Total reward = 62.45
2022-01-26 14:16:23.635 | DEBUG    | __main__:trials:24 - Trial = 10/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.636 | DEBUG    | __main__:trials:29 - Trial = 10/30000 | Total reward = 44.54
2022-01-26 14:16:23.639 | DEBUG    | __main__:trials:24 - Trial = 11/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.640 | DEBUG    | __main__:trials:29 - Trial = 11/30000 | Total reward = 58.01
2022-01-26 14:16:23.643 | DEBUG    | __main__:trials:24 - Trial = 12/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.644 | DEBUG    | __main__:trials:29 - Trial = 12/30000 | Total reward = 54.68
2022-01-26 14:16:23.647 | DEBUG    | __main__:trials:24 - Trial = 13/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.648 | DEBUG    | __main__:trials:29 - Trial = 13/30000 | Total reward = 47.66
2022-01-26 14:16:23.651 | DEBUG    | __main__:trials:24 - Trial = 14/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.651 | DEBUG    | __main__:trials:29 - Trial = 14/30000 | Total reward = 50.77
2022-01-26 14:16:23.655 | DEBUG    | __main__:trials:24 - Trial = 15/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.655 | DEBUG    | __main__:trials:29 - Trial = 15/30000 | Total reward = 52.84
2022-01-26 14:16:23.658 | DEBUG    | __main__:trials:24 - Trial = 16/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.659 | DEBUG    | __main__:trials:29 - Trial = 16/30000 | Total reward = 32.50
2022-01-26 14:16:23.663 | DEBUG    | __main__:trials:24 - Trial = 17/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.663 | DEBUG    | __main__:trials:29 - Trial = 17/30000 | Total reward = 36.03
2022-01-26 14:16:23.667 | DEBUG    | __main__:trials:24 - Trial = 18/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.667 | DEBUG    | __main__:trials:29 - Trial = 18/30000 | Total reward = 45.18
2022-01-26 14:16:23.670 | DEBUG    | __main__:trials:24 - Trial = 19/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.671 | DEBUG    | __main__:trials:29 - Trial = 19/30000 | Total reward = 42.02
2022-01-26 14:16:23.674 | DEBUG    | __main__:trials:24 - Trial = 20/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.675 | DEBUG    | __main__:trials:29 - Trial = 20/30000 | Total reward = 61.56
2022-01-26 14:16:23.678 | DEBUG    | __main__:trials:24 - Trial = 21/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.679 | DEBUG    | __main__:trials:29 - Trial = 21/30000 | Total reward = 61.74
2022-01-26 14:16:23.682 | DEBUG    | __main__:trials:24 - Trial = 22/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.683 | DEBUG    | __main__:trials:29 - Trial = 22/30000 | Total reward = 46.93
2022-01-26 14:16:23.686 | DEBUG    | __main__:trials:24 - Trial = 23/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.687 | DEBUG    | __main__:trials:29 - Trial = 23/30000 | Total reward = 63.66
2022-01-26 14:16:23.690 | DEBUG    | __main__:trials:24 - Trial = 24/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.691 | DEBUG    | __main__:trials:29 - Trial = 24/30000 | Total reward = 49.61
2022-01-26 14:16:23.694 | DEBUG    | __main__:trials:24 - Trial = 25/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.695 | DEBUG    | __main__:trials:29 - Trial = 25/30000 | Total reward = 36.00
2022-01-26 14:16:23.698 | DEBUG    | __main__:trials:24 - Trial = 26/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.698 | DEBUG    | __main__:trials:29 - Trial = 26/30000 | Total reward = 38.26
2022-01-26 14:16:23.701 | DEBUG    | __main__:trials:26 - Trial = 27/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:23.702 | DEBUG    | __main__:trials:29 - Trial = 27/30000 | Total reward = 24.48
2022-01-26 14:16:23.705 | DEBUG    | __main__:trials:24 - Trial = 28/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.706 | DEBUG    | __main__:trials:29 - Trial = 28/30000 | Total reward = 42.88
2022-01-26 14:16:23.709 | DEBUG    | __main__:trials:24 - Trial = 29/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.710 | DEBUG    | __main__:trials:29 - Trial = 29/30000 | Total reward = 47.22
2022-01-26 14:16:23.713 | DEBUG    | __main__:trials:24 - Trial = 30/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.714 | DEBUG    | __main__:trials:29 - Trial = 30/30000 | Total reward = 51.58
2022-01-26 14:16:23.717 | DEBUG    | __main__:trials:24 - Trial = 31/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.718 | DEBUG    | __main__:trials:29 - Trial = 31/30000 | Total reward = 65.62
2022-01-26 14:16:23.722 | DEBUG    | __main__:trials:24 - Trial = 32/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.723 | DEBUG    | __main__:trials:29 - Trial = 32/30000 | Total reward = 39.86
2022-01-26 14:16:23.726 | DEBUG    | __main__:trials:24 - Trial = 33/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.726 | DEBUG    | __main__:trials:29 - Trial = 33/30000 | Total reward = 43.49
2022-01-26 14:16:23.729 | DEBUG    | __main__:trials:24 - Trial = 34/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.731 | DEBUG    | __main__:trials:29 - Trial = 34/30000 | Total reward = 42.08
2022-01-26 14:16:23.735 | DEBUG    | __main__:trials:24 - Trial = 35/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.736 | DEBUG    | __main__:trials:29 - Trial = 35/30000 | Total reward = 42.55
2022-01-26 14:16:23.739 | DEBUG    | __main__:trials:24 - Trial = 36/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.741 | DEBUG    | __main__:trials:29 - Trial = 36/30000 | Total reward = 54.85
2022-01-26 14:16:23.744 | DEBUG    | __main__:trials:24 - Trial = 37/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.746 | DEBUG    | __main__:trials:29 - Trial = 37/30000 | Total reward = 36.54
2022-01-26 14:16:23.749 | DEBUG    | __main__:trials:24 - Trial = 38/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.750 | DEBUG    | __main__:trials:29 - Trial = 38/30000 | Total reward = 60.86
2022-01-26 14:16:23.753 | DEBUG    | __main__:trials:24 - Trial = 39/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.755 | DEBUG    | __main__:trials:29 - Trial = 39/30000 | Total reward = 45.69
2022-01-26 14:16:23.759 | DEBUG    | __main__:trials:24 - Trial = 40/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.759 | DEBUG    | __main__:trials:29 - Trial = 40/30000 | Total reward = 41.58
2022-01-26 14:16:23.764 | DEBUG    | __main__:trials:24 - Trial = 41/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.764 | DEBUG    | __main__:trials:29 - Trial = 41/30000 | Total reward = 51.64
2022-01-26 14:16:23.768 | DEBUG    | __main__:trials:24 - Trial = 42/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.770 | DEBUG    | __main__:trials:29 - Trial = 42/30000 | Total reward = 46.74
2022-01-26 14:16:23.773 | DEBUG    | __main__:trials:24 - Trial = 43/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.774 | DEBUG    | __main__:trials:29 - Trial = 43/30000 | Total reward = 27.31
2022-01-26 14:16:23.777 | DEBUG    | __main__:trials:24 - Trial = 44/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.778 | DEBUG    | __main__:trials:29 - Trial = 44/30000 | Total reward = 56.63
2022-01-26 14:16:23.781 | DEBUG    | __main__:trials:24 - Trial = 45/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.782 | DEBUG    | __main__:trials:29 - Trial = 45/30000 | Total reward = 53.98
2022-01-26 14:16:23.785 | DEBUG    | __main__:trials:24 - Trial = 46/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.787 | DEBUG    | __main__:trials:29 - Trial = 46/30000 | Total reward = 37.99
2022-01-26 14:16:23.790 | DEBUG    | __main__:trials:24 - Trial = 47/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.792 | DEBUG    | __main__:trials:29 - Trial = 47/30000 | Total reward = 54.69
2022-01-26 14:16:23.796 | DEBUG    | __main__:trials:24 - Trial = 48/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.797 | DEBUG    | __main__:trials:29 - Trial = 48/30000 | Total reward = 35.74
2022-01-26 14:16:23.800 | DEBUG    | __main__:trials:24 - Trial = 49/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.802 | DEBUG    | __main__:trials:29 - Trial = 49/30000 | Total reward = 37.08
2022-01-26 14:16:23.806 | DEBUG    | __main__:trials:24 - Trial = 50/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.807 | DEBUG    | __main__:trials:29 - Trial = 50/30000 | Total reward = 49.14
2022-01-26 14:16:23.810 | DEBUG    | __main__:trials:24 - Trial = 51/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.813 | DEBUG    | __main__:trials:29 - Trial = 51/30000 | Total reward = 44.78
2022-01-26 14:16:23.815 | DEBUG    | __main__:trials:24 - Trial = 52/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.818 | DEBUG    | __main__:trials:29 - Trial = 52/30000 | Total reward = 45.88
2022-01-26 14:16:23.821 | DEBUG    | __main__:trials:24 - Trial = 53/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.822 | DEBUG    | __main__:trials:29 - Trial = 53/30000 | Total reward = 51.78
2022-01-26 14:16:23.825 | DEBUG    | __main__:trials:24 - Trial = 54/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.827 | DEBUG    | __main__:trials:29 - Trial = 54/30000 | Total reward = 44.84
2022-01-26 14:16:23.831 | DEBUG    | __main__:trials:24 - Trial = 55/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.832 | DEBUG    | __main__:trials:29 - Trial = 55/30000 | Total reward = 39.92
2022-01-26 14:16:23.836 | DEBUG    | __main__:trials:24 - Trial = 56/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.837 | DEBUG    | __main__:trials:29 - Trial = 56/30000 | Total reward = 29.65
2022-01-26 14:16:23.840 | DEBUG    | __main__:trials:24 - Trial = 57/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.842 | DEBUG    | __main__:trials:29 - Trial = 57/30000 | Total reward = 61.55
2022-01-26 14:16:23.846 | DEBUG    | __main__:trials:24 - Trial = 58/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.847 | DEBUG    | __main__:trials:29 - Trial = 58/30000 | Total reward = 29.64
2022-01-26 14:16:23.851 | DEBUG    | __main__:trials:24 - Trial = 59/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.852 | DEBUG    | __main__:trials:29 - Trial = 59/30000 | Total reward = 38.50
2022-01-26 14:16:23.855 | DEBUG    | __main__:trials:24 - Trial = 60/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.856 | DEBUG    | __main__:trials:29 - Trial = 60/30000 | Total reward = 29.47
2022-01-26 14:16:23.860 | DEBUG    | __main__:trials:24 - Trial = 61/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.861 | DEBUG    | __main__:trials:29 - Trial = 61/30000 | Total reward = 34.24
2022-01-26 14:16:23.864 | DEBUG    | __main__:trials:24 - Trial = 62/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.865 | DEBUG    | __main__:trials:29 - Trial = 62/30000 | Total reward = 33.34
2022-01-26 14:16:23.870 | DEBUG    | __main__:trials:24 - Trial = 63/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.871 | DEBUG    | __main__:trials:29 - Trial = 63/30000 | Total reward = 54.19
2022-01-26 14:16:23.874 | DEBUG    | __main__:trials:24 - Trial = 64/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.876 | DEBUG    | __main__:trials:29 - Trial = 64/30000 | Total reward = 42.15
2022-01-26 14:16:23.879 | DEBUG    | __main__:trials:24 - Trial = 65/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.881 | DEBUG    | __main__:trials:29 - Trial = 65/30000 | Total reward = 29.30
2022-01-26 14:16:23.884 | DEBUG    | __main__:trials:24 - Trial = 66/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.885 | DEBUG    | __main__:trials:29 - Trial = 66/30000 | Total reward = 57.91
2022-01-26 14:16:23.889 | DEBUG    | __main__:trials:24 - Trial = 67/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.889 | DEBUG    | __main__:trials:29 - Trial = 67/30000 | Total reward = 31.04
2022-01-26 14:16:23.893 | DEBUG    | __main__:trials:24 - Trial = 68/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.894 | DEBUG    | __main__:trials:29 - Trial = 68/30000 | Total reward = 28.78
2022-01-26 14:16:23.898 | DEBUG    | __main__:trials:24 - Trial = 69/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.899 | DEBUG    | __main__:trials:29 - Trial = 69/30000 | Total reward = 57.54
2022-01-26 14:16:23.902 | DEBUG    | __main__:trials:24 - Trial = 70/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.904 | DEBUG    | __main__:trials:29 - Trial = 70/30000 | Total reward = 33.98
2022-01-26 14:16:23.907 | DEBUG    | __main__:trials:24 - Trial = 71/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.909 | DEBUG    | __main__:trials:29 - Trial = 71/30000 | Total reward = 28.97
2022-01-26 14:16:23.912 | DEBUG    | __main__:trials:24 - Trial = 72/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.913 | DEBUG    | __main__:trials:29 - Trial = 72/30000 | Total reward = 26.97
2022-01-26 14:16:23.917 | DEBUG    | __main__:trials:24 - Trial = 73/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.918 | DEBUG    | __main__:trials:29 - Trial = 73/30000 | Total reward = 32.62
2022-01-26 14:16:23.921 | DEBUG    | __main__:trials:24 - Trial = 74/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.923 | DEBUG    | __main__:trials:29 - Trial = 74/30000 | Total reward = 57.45
2022-01-26 14:16:23.926 | DEBUG    | __main__:trials:24 - Trial = 75/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.927 | DEBUG    | __main__:trials:29 - Trial = 75/30000 | Total reward = 53.92
2022-01-26 14:16:23.930 | DEBUG    | __main__:trials:24 - Trial = 76/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.932 | DEBUG    | __main__:trials:29 - Trial = 76/30000 | Total reward = 42.07
2022-01-26 14:16:23.935 | DEBUG    | __main__:trials:24 - Trial = 77/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.936 | DEBUG    | __main__:trials:29 - Trial = 77/30000 | Total reward = 30.12
2022-01-26 14:16:23.939 | DEBUG    | __main__:trials:24 - Trial = 78/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.941 | DEBUG    | __main__:trials:29 - Trial = 78/30000 | Total reward = 49.72
2022-01-26 14:16:23.944 | DEBUG    | __main__:trials:24 - Trial = 79/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.945 | DEBUG    | __main__:trials:29 - Trial = 79/30000 | Total reward = 26.11
2022-01-26 14:16:23.948 | DEBUG    | __main__:trials:24 - Trial = 80/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.950 | DEBUG    | __main__:trials:29 - Trial = 80/30000 | Total reward = 53.48
2022-01-26 14:16:23.954 | DEBUG    | __main__:trials:24 - Trial = 81/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.954 | DEBUG    | __main__:trials:29 - Trial = 81/30000 | Total reward = 54.29
2022-01-26 14:16:23.958 | DEBUG    | __main__:trials:24 - Trial = 82/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.960 | DEBUG    | __main__:trials:29 - Trial = 82/30000 | Total reward = 26.48
2022-01-26 14:16:23.963 | DEBUG    | __main__:trials:24 - Trial = 83/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.965 | DEBUG    | __main__:trials:29 - Trial = 83/30000 | Total reward = 37.88
2022-01-26 14:16:23.968 | DEBUG    | __main__:trials:24 - Trial = 84/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.970 | DEBUG    | __main__:trials:29 - Trial = 84/30000 | Total reward = 41.83
2022-01-26 14:16:23.973 | DEBUG    | __main__:trials:24 - Trial = 85/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.974 | DEBUG    | __main__:trials:29 - Trial = 85/30000 | Total reward = 55.97
2022-01-26 14:16:23.978 | DEBUG    | __main__:trials:24 - Trial = 86/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.979 | DEBUG    | __main__:trials:29 - Trial = 86/30000 | Total reward = 50.93
2022-01-26 14:16:23.983 | DEBUG    | __main__:trials:24 - Trial = 87/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.985 | DEBUG    | __main__:trials:29 - Trial = 87/30000 | Total reward = 41.76
2022-01-26 14:16:23.988 | DEBUG    | __main__:trials:24 - Trial = 88/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.989 | DEBUG    | __main__:trials:29 - Trial = 88/30000 | Total reward = 46.91
2022-01-26 14:16:23.992 | DEBUG    | __main__:trials:24 - Trial = 89/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.994 | DEBUG    | __main__:trials:29 - Trial = 89/30000 | Total reward = 54.23
2022-01-26 14:16:23.997 | DEBUG    | __main__:trials:24 - Trial = 90/30000 | Max number of steps (20) reached
2022-01-26 14:16:23.998 | DEBUG    | __main__:trials:29 - Trial = 90/30000 | Total reward = 46.07
2022-01-26 14:16:24.001 | DEBUG    | __main__:trials:24 - Trial = 91/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.003 | DEBUG    | __main__:trials:29 - Trial = 91/30000 | Total reward = 23.45
2022-01-26 14:16:24.007 | DEBUG    | __main__:trials:24 - Trial = 92/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.009 | DEBUG    | __main__:trials:29 - Trial = 92/30000 | Total reward = 41.07
2022-01-26 14:16:24.012 | DEBUG    | __main__:trials:26 - Trial = 93/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.014 | DEBUG    | __main__:trials:29 - Trial = 93/30000 | Total reward = 29.33
2022-01-26 14:16:24.017 | DEBUG    | __main__:trials:24 - Trial = 94/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.018 | DEBUG    | __main__:trials:29 - Trial = 94/30000 | Total reward = 29.65
2022-01-26 14:16:24.022 | DEBUG    | __main__:trials:24 - Trial = 95/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.023 | DEBUG    | __main__:trials:29 - Trial = 95/30000 | Total reward = 30.39
2022-01-26 14:16:24.026 | DEBUG    | __main__:trials:24 - Trial = 96/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.028 | DEBUG    | __main__:trials:29 - Trial = 96/30000 | Total reward = 47.06
2022-01-26 14:16:24.031 | DEBUG    | __main__:trials:24 - Trial = 97/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.032 | DEBUG    | __main__:trials:29 - Trial = 97/30000 | Total reward = 50.49
2022-01-26 14:16:24.035 | DEBUG    | __main__:trials:24 - Trial = 98/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.037 | DEBUG    | __main__:trials:29 - Trial = 98/30000 | Total reward = 47.20
2022-01-26 14:16:24.040 | DEBUG    | __main__:trials:24 - Trial = 99/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.041 | DEBUG    | __main__:trials:29 - Trial = 99/30000 | Total reward = 61.07
2022-01-26 14:16:24.045 | DEBUG    | __main__:trials:24 - Trial = 100/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.046 | DEBUG    | __main__:trials:29 - Trial = 100/30000 | Total reward = 37.38
2022-01-26 14:16:24.049 | DEBUG    | __main__:trials:24 - Trial = 101/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.051 | DEBUG    | __main__:trials:29 - Trial = 101/30000 | Total reward = 41.69
2022-01-26 14:16:24.054 | DEBUG    | __main__:trials:24 - Trial = 102/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.055 | DEBUG    | __main__:trials:29 - Trial = 102/30000 | Total reward = 44.75
2022-01-26 14:16:24.058 | DEBUG    | __main__:trials:24 - Trial = 103/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.060 | DEBUG    | __main__:trials:29 - Trial = 103/30000 | Total reward = 47.02
2022-01-26 14:16:24.063 | DEBUG    | __main__:trials:24 - Trial = 104/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.064 | DEBUG    | __main__:trials:29 - Trial = 104/30000 | Total reward = 58.26
2022-01-26 14:16:24.067 | DEBUG    | __main__:trials:24 - Trial = 105/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.069 | DEBUG    | __main__:trials:29 - Trial = 105/30000 | Total reward = 30.98
2022-01-26 14:16:24.072 | DEBUG    | __main__:trials:24 - Trial = 106/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.073 | DEBUG    | __main__:trials:29 - Trial = 106/30000 | Total reward = 48.29
2022-01-26 14:16:24.077 | DEBUG    | __main__:trials:24 - Trial = 107/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.078 | DEBUG    | __main__:trials:29 - Trial = 107/30000 | Total reward = 45.33
2022-01-26 14:16:24.081 | DEBUG    | __main__:trials:24 - Trial = 108/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.083 | DEBUG    | __main__:trials:29 - Trial = 108/30000 | Total reward = 38.97
2022-01-26 14:16:24.086 | DEBUG    | __main__:trials:24 - Trial = 109/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.088 | DEBUG    | __main__:trials:29 - Trial = 109/30000 | Total reward = 55.40
2022-01-26 14:16:24.091 | DEBUG    | __main__:trials:24 - Trial = 110/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.092 | DEBUG    | __main__:trials:29 - Trial = 110/30000 | Total reward = 47.96
2022-01-26 14:16:24.095 | DEBUG    | __main__:trials:24 - Trial = 111/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.096 | DEBUG    | __main__:trials:29 - Trial = 111/30000 | Total reward = 25.79
2022-01-26 14:16:24.099 | DEBUG    | __main__:trials:24 - Trial = 112/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.101 | DEBUG    | __main__:trials:29 - Trial = 112/30000 | Total reward = 32.47
2022-01-26 14:16:24.104 | DEBUG    | __main__:trials:24 - Trial = 113/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.105 | DEBUG    | __main__:trials:29 - Trial = 113/30000 | Total reward = 58.36
2022-01-26 14:16:24.108 | DEBUG    | __main__:trials:24 - Trial = 114/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.109 | DEBUG    | __main__:trials:29 - Trial = 114/30000 | Total reward = 32.62
2022-01-26 14:16:24.112 | DEBUG    | __main__:trials:26 - Trial = 115/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.113 | DEBUG    | __main__:trials:29 - Trial = 115/30000 | Total reward = 15.56
2022-01-26 14:16:24.117 | DEBUG    | __main__:trials:24 - Trial = 116/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.117 | DEBUG    | __main__:trials:29 - Trial = 116/30000 | Total reward = 51.33
2022-01-26 14:16:24.120 | DEBUG    | __main__:trials:24 - Trial = 117/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.121 | DEBUG    | __main__:trials:29 - Trial = 117/30000 | Total reward = 36.06
2022-01-26 14:16:24.125 | DEBUG    | __main__:trials:24 - Trial = 118/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.126 | DEBUG    | __main__:trials:29 - Trial = 118/30000 | Total reward = 30.01
2022-01-26 14:16:24.129 | DEBUG    | __main__:trials:24 - Trial = 119/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.130 | DEBUG    | __main__:trials:29 - Trial = 119/30000 | Total reward = 30.53
2022-01-26 14:16:24.133 | DEBUG    | __main__:trials:24 - Trial = 120/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.135 | DEBUG    | __main__:trials:29 - Trial = 120/30000 | Total reward = 29.68
2022-01-26 14:16:24.138 | DEBUG    | __main__:trials:24 - Trial = 121/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.139 | DEBUG    | __main__:trials:29 - Trial = 121/30000 | Total reward = 46.18
2022-01-26 14:16:24.143 | DEBUG    | __main__:trials:24 - Trial = 122/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.145 | DEBUG    | __main__:trials:29 - Trial = 122/30000 | Total reward = 38.96
2022-01-26 14:16:24.148 | DEBUG    | __main__:trials:24 - Trial = 123/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.150 | DEBUG    | __main__:trials:29 - Trial = 123/30000 | Total reward = 42.33
2022-01-26 14:16:24.153 | DEBUG    | __main__:trials:24 - Trial = 124/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.154 | DEBUG    | __main__:trials:29 - Trial = 124/30000 | Total reward = 41.17
2022-01-26 14:16:24.157 | DEBUG    | __main__:trials:24 - Trial = 125/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.159 | DEBUG    | __main__:trials:29 - Trial = 125/30000 | Total reward = 23.83
2022-01-26 14:16:24.162 | DEBUG    | __main__:trials:24 - Trial = 126/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.163 | DEBUG    | __main__:trials:29 - Trial = 126/30000 | Total reward = 48.97
2022-01-26 14:16:24.166 | DEBUG    | __main__:trials:26 - Trial = 127/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.167 | DEBUG    | __main__:trials:29 - Trial = 127/30000 | Total reward = 10.83
2022-01-26 14:16:24.169 | DEBUG    | __main__:trials:26 - Trial = 128/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.170 | DEBUG    | __main__:trials:29 - Trial = 128/30000 | Total reward = 10.83
2022-01-26 14:16:24.174 | DEBUG    | __main__:trials:24 - Trial = 129/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.175 | DEBUG    | __main__:trials:29 - Trial = 129/30000 | Total reward = 28.47
2022-01-26 14:16:24.177 | DEBUG    | __main__:trials:26 - Trial = 130/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.179 | DEBUG    | __main__:trials:29 - Trial = 130/30000 | Total reward = 14.09
2022-01-26 14:16:24.182 | DEBUG    | __main__:trials:24 - Trial = 131/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.183 | DEBUG    | __main__:trials:29 - Trial = 131/30000 | Total reward = 62.90
2022-01-26 14:16:24.185 | DEBUG    | __main__:trials:26 - Trial = 132/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.185 | DEBUG    | __main__:trials:29 - Trial = 132/30000 | Total reward = 11.09
2022-01-26 14:16:24.189 | DEBUG    | __main__:trials:24 - Trial = 133/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.189 | DEBUG    | __main__:trials:29 - Trial = 133/30000 | Total reward = 33.77
2022-01-26 14:16:24.193 | DEBUG    | __main__:trials:24 - Trial = 134/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.194 | DEBUG    | __main__:trials:29 - Trial = 134/30000 | Total reward = 37.76
2022-01-26 14:16:24.197 | DEBUG    | __main__:trials:24 - Trial = 135/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.199 | DEBUG    | __main__:trials:29 - Trial = 135/30000 | Total reward = 42.24
2022-01-26 14:16:24.202 | DEBUG    | __main__:trials:24 - Trial = 136/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.203 | DEBUG    | __main__:trials:29 - Trial = 136/30000 | Total reward = 53.44
2022-01-26 14:16:24.206 | DEBUG    | __main__:trials:24 - Trial = 137/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.208 | DEBUG    | __main__:trials:29 - Trial = 137/30000 | Total reward = 33.09
2022-01-26 14:16:24.211 | DEBUG    | __main__:trials:24 - Trial = 138/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.213 | DEBUG    | __main__:trials:29 - Trial = 138/30000 | Total reward = 44.40
2022-01-26 14:16:24.215 | DEBUG    | __main__:trials:26 - Trial = 139/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.216 | DEBUG    | __main__:trials:29 - Trial = 139/30000 | Total reward = 8.16
2022-01-26 14:16:24.219 | DEBUG    | __main__:trials:26 - Trial = 140/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.220 | DEBUG    | __main__:trials:29 - Trial = 140/30000 | Total reward = 8.31
2022-01-26 14:16:24.223 | DEBUG    | __main__:trials:24 - Trial = 141/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.225 | DEBUG    | __main__:trials:29 - Trial = 141/30000 | Total reward = 29.48
2022-01-26 14:16:24.228 | DEBUG    | __main__:trials:24 - Trial = 142/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.229 | DEBUG    | __main__:trials:29 - Trial = 142/30000 | Total reward = 44.68
2022-01-26 14:16:24.234 | DEBUG    | __main__:trials:24 - Trial = 143/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.234 | DEBUG    | __main__:trials:29 - Trial = 143/30000 | Total reward = 25.07
2022-01-26 14:16:24.238 | DEBUG    | __main__:trials:24 - Trial = 144/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.239 | DEBUG    | __main__:trials:29 - Trial = 144/30000 | Total reward = 41.33
2022-01-26 14:16:24.242 | DEBUG    | __main__:trials:24 - Trial = 145/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.244 | DEBUG    | __main__:trials:29 - Trial = 145/30000 | Total reward = 22.95
2022-01-26 14:16:24.247 | DEBUG    | __main__:trials:24 - Trial = 146/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.249 | DEBUG    | __main__:trials:29 - Trial = 146/30000 | Total reward = 36.68
2022-01-26 14:16:24.253 | DEBUG    | __main__:trials:24 - Trial = 147/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.254 | DEBUG    | __main__:trials:29 - Trial = 147/30000 | Total reward = 21.15
2022-01-26 14:16:24.258 | DEBUG    | __main__:trials:24 - Trial = 148/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.259 | DEBUG    | __main__:trials:29 - Trial = 148/30000 | Total reward = 45.72
2022-01-26 14:16:24.262 | DEBUG    | __main__:trials:24 - Trial = 149/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.264 | DEBUG    | __main__:trials:29 - Trial = 149/30000 | Total reward = 24.77
2022-01-26 14:16:24.267 | DEBUG    | __main__:trials:24 - Trial = 150/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.270 | DEBUG    | __main__:trials:29 - Trial = 150/30000 | Total reward = 35.36
2022-01-26 14:16:24.273 | DEBUG    | __main__:trials:24 - Trial = 151/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.273 | DEBUG    | __main__:trials:29 - Trial = 151/30000 | Total reward = 27.71
2022-01-26 14:16:24.277 | DEBUG    | __main__:trials:24 - Trial = 152/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.278 | DEBUG    | __main__:trials:29 - Trial = 152/30000 | Total reward = 55.75
2022-01-26 14:16:24.281 | DEBUG    | __main__:trials:24 - Trial = 153/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.283 | DEBUG    | __main__:trials:29 - Trial = 153/30000 | Total reward = 23.74
2022-01-26 14:16:24.286 | DEBUG    | __main__:trials:24 - Trial = 154/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.288 | DEBUG    | __main__:trials:29 - Trial = 154/30000 | Total reward = 33.67
2022-01-26 14:16:24.291 | DEBUG    | __main__:trials:24 - Trial = 155/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.293 | DEBUG    | __main__:trials:29 - Trial = 155/30000 | Total reward = 24.56
2022-01-26 14:16:24.296 | DEBUG    | __main__:trials:24 - Trial = 156/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.298 | DEBUG    | __main__:trials:29 - Trial = 156/30000 | Total reward = 19.51
2022-01-26 14:16:24.300 | DEBUG    | __main__:trials:26 - Trial = 157/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.302 | DEBUG    | __main__:trials:29 - Trial = 157/30000 | Total reward = 11.97
2022-01-26 14:16:24.305 | DEBUG    | __main__:trials:24 - Trial = 158/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.307 | DEBUG    | __main__:trials:29 - Trial = 158/30000 | Total reward = 30.62
2022-01-26 14:16:24.311 | DEBUG    | __main__:trials:24 - Trial = 159/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.312 | DEBUG    | __main__:trials:29 - Trial = 159/30000 | Total reward = 43.67
2022-01-26 14:16:24.315 | DEBUG    | __main__:trials:26 - Trial = 160/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.316 | DEBUG    | __main__:trials:29 - Trial = 160/30000 | Total reward = 9.97
2022-01-26 14:16:24.319 | DEBUG    | __main__:trials:26 - Trial = 161/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.320 | DEBUG    | __main__:trials:29 - Trial = 161/30000 | Total reward = 10.83
2022-01-26 14:16:24.324 | DEBUG    | __main__:trials:24 - Trial = 162/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.326 | DEBUG    | __main__:trials:29 - Trial = 162/30000 | Total reward = 47.90
2022-01-26 14:16:24.328 | DEBUG    | __main__:trials:26 - Trial = 163/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.329 | DEBUG    | __main__:trials:29 - Trial = 163/30000 | Total reward = 11.97
2022-01-26 14:16:24.333 | DEBUG    | __main__:trials:24 - Trial = 164/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.334 | DEBUG    | __main__:trials:29 - Trial = 164/30000 | Total reward = 28.98
2022-01-26 14:16:24.337 | DEBUG    | __main__:trials:24 - Trial = 165/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.339 | DEBUG    | __main__:trials:29 - Trial = 165/30000 | Total reward = 16.57
2022-01-26 14:16:24.342 | DEBUG    | __main__:trials:24 - Trial = 166/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.344 | DEBUG    | __main__:trials:29 - Trial = 166/30000 | Total reward = 32.27
2022-01-26 14:16:24.347 | DEBUG    | __main__:trials:24 - Trial = 167/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.348 | DEBUG    | __main__:trials:29 - Trial = 167/30000 | Total reward = 25.94
2022-01-26 14:16:24.350 | DEBUG    | __main__:trials:26 - Trial = 168/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.352 | DEBUG    | __main__:trials:29 - Trial = 168/30000 | Total reward = 19.23
2022-01-26 14:16:24.355 | DEBUG    | __main__:trials:24 - Trial = 169/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.356 | DEBUG    | __main__:trials:29 - Trial = 169/30000 | Total reward = 58.65
2022-01-26 14:16:24.360 | DEBUG    | __main__:trials:24 - Trial = 170/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.361 | DEBUG    | __main__:trials:29 - Trial = 170/30000 | Total reward = 37.64
2022-01-26 14:16:24.365 | DEBUG    | __main__:trials:24 - Trial = 171/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.366 | DEBUG    | __main__:trials:29 - Trial = 171/30000 | Total reward = 51.25
2022-01-26 14:16:24.368 | DEBUG    | __main__:trials:26 - Trial = 172/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.369 | DEBUG    | __main__:trials:29 - Trial = 172/30000 | Total reward = 16.51
2022-01-26 14:16:24.373 | DEBUG    | __main__:trials:24 - Trial = 173/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.374 | DEBUG    | __main__:trials:29 - Trial = 173/30000 | Total reward = 24.56
2022-01-26 14:16:24.377 | DEBUG    | __main__:trials:24 - Trial = 174/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.378 | DEBUG    | __main__:trials:29 - Trial = 174/30000 | Total reward = 49.41
2022-01-26 14:16:24.381 | DEBUG    | __main__:trials:24 - Trial = 175/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.382 | DEBUG    | __main__:trials:29 - Trial = 175/30000 | Total reward = 20.47
2022-01-26 14:16:24.386 | DEBUG    | __main__:trials:24 - Trial = 176/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.387 | DEBUG    | __main__:trials:29 - Trial = 176/30000 | Total reward = 18.37
2022-01-26 14:16:24.391 | DEBUG    | __main__:trials:24 - Trial = 177/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.392 | DEBUG    | __main__:trials:29 - Trial = 177/30000 | Total reward = 25.21
2022-01-26 14:16:24.395 | DEBUG    | __main__:trials:24 - Trial = 178/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.396 | DEBUG    | __main__:trials:29 - Trial = 178/30000 | Total reward = 33.88
2022-01-26 14:16:24.400 | DEBUG    | __main__:trials:24 - Trial = 179/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.402 | DEBUG    | __main__:trials:29 - Trial = 179/30000 | Total reward = 29.05
2022-01-26 14:16:24.405 | DEBUG    | __main__:trials:24 - Trial = 180/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.406 | DEBUG    | __main__:trials:29 - Trial = 180/30000 | Total reward = 36.32
2022-01-26 14:16:24.410 | DEBUG    | __main__:trials:24 - Trial = 181/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.412 | DEBUG    | __main__:trials:29 - Trial = 181/30000 | Total reward = 51.45
2022-01-26 14:16:24.415 | DEBUG    | __main__:trials:26 - Trial = 182/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.416 | DEBUG    | __main__:trials:29 - Trial = 182/30000 | Total reward = 14.06
2022-01-26 14:16:24.419 | DEBUG    | __main__:trials:24 - Trial = 183/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.420 | DEBUG    | __main__:trials:29 - Trial = 183/30000 | Total reward = 29.03
2022-01-26 14:16:24.423 | DEBUG    | __main__:trials:26 - Trial = 184/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.425 | DEBUG    | __main__:trials:29 - Trial = 184/30000 | Total reward = 14.50
2022-01-26 14:16:24.428 | DEBUG    | __main__:trials:24 - Trial = 185/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.430 | DEBUG    | __main__:trials:29 - Trial = 185/30000 | Total reward = 52.58
2022-01-26 14:16:24.432 | DEBUG    | __main__:trials:26 - Trial = 186/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.433 | DEBUG    | __main__:trials:29 - Trial = 186/30000 | Total reward = 17.37
2022-01-26 14:16:24.436 | DEBUG    | __main__:trials:24 - Trial = 187/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.437 | DEBUG    | __main__:trials:29 - Trial = 187/30000 | Total reward = 23.92
2022-01-26 14:16:24.440 | DEBUG    | __main__:trials:26 - Trial = 188/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.442 | DEBUG    | __main__:trials:29 - Trial = 188/30000 | Total reward = 20.60
2022-01-26 14:16:24.445 | DEBUG    | __main__:trials:24 - Trial = 189/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.446 | DEBUG    | __main__:trials:29 - Trial = 189/30000 | Total reward = 47.32
2022-01-26 14:16:24.449 | DEBUG    | __main__:trials:26 - Trial = 190/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.449 | DEBUG    | __main__:trials:29 - Trial = 190/30000 | Total reward = 14.11
2022-01-26 14:16:24.453 | DEBUG    | __main__:trials:24 - Trial = 191/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.453 | DEBUG    | __main__:trials:29 - Trial = 191/30000 | Total reward = 24.26
2022-01-26 14:16:24.458 | DEBUG    | __main__:trials:24 - Trial = 192/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.459 | DEBUG    | __main__:trials:29 - Trial = 192/30000 | Total reward = 39.92
2022-01-26 14:16:24.461 | DEBUG    | __main__:trials:26 - Trial = 193/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.462 | DEBUG    | __main__:trials:29 - Trial = 193/30000 | Total reward = 13.27
2022-01-26 14:16:24.465 | DEBUG    | __main__:trials:24 - Trial = 194/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.466 | DEBUG    | __main__:trials:29 - Trial = 194/30000 | Total reward = 39.71
2022-01-26 14:16:24.469 | DEBUG    | __main__:trials:24 - Trial = 195/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.470 | DEBUG    | __main__:trials:29 - Trial = 195/30000 | Total reward = 40.05
2022-01-26 14:16:24.472 | DEBUG    | __main__:trials:26 - Trial = 196/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.473 | DEBUG    | __main__:trials:29 - Trial = 196/30000 | Total reward = 17.18
2022-01-26 14:16:24.475 | DEBUG    | __main__:trials:26 - Trial = 197/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.477 | DEBUG    | __main__:trials:29 - Trial = 197/30000 | Total reward = 10.83
2022-01-26 14:16:24.480 | DEBUG    | __main__:trials:24 - Trial = 198/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.482 | DEBUG    | __main__:trials:29 - Trial = 198/30000 | Total reward = 27.95
2022-01-26 14:16:24.485 | DEBUG    | __main__:trials:24 - Trial = 199/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.486 | DEBUG    | __main__:trials:29 - Trial = 199/30000 | Total reward = 37.77
2022-01-26 14:16:24.489 | DEBUG    | __main__:trials:24 - Trial = 200/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.490 | DEBUG    | __main__:trials:29 - Trial = 200/30000 | Total reward = 47.69
2022-01-26 14:16:24.494 | DEBUG    | __main__:trials:24 - Trial = 201/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.495 | DEBUG    | __main__:trials:29 - Trial = 201/30000 | Total reward = 43.71
2022-01-26 14:16:24.498 | DEBUG    | __main__:trials:24 - Trial = 202/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.499 | DEBUG    | __main__:trials:29 - Trial = 202/30000 | Total reward = 45.07
2022-01-26 14:16:24.502 | DEBUG    | __main__:trials:24 - Trial = 203/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.505 | DEBUG    | __main__:trials:29 - Trial = 203/30000 | Total reward = 40.19
2022-01-26 14:16:24.509 | DEBUG    | __main__:trials:24 - Trial = 204/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.509 | DEBUG    | __main__:trials:29 - Trial = 204/30000 | Total reward = 52.09
2022-01-26 14:16:24.513 | DEBUG    | __main__:trials:24 - Trial = 205/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.513 | DEBUG    | __main__:trials:29 - Trial = 205/30000 | Total reward = 29.80
2022-01-26 14:16:24.516 | DEBUG    | __main__:trials:26 - Trial = 206/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.517 | DEBUG    | __main__:trials:29 - Trial = 206/30000 | Total reward = 10.83
2022-01-26 14:16:24.519 | DEBUG    | __main__:trials:26 - Trial = 207/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.520 | DEBUG    | __main__:trials:29 - Trial = 207/30000 | Total reward = 7.98
2022-01-26 14:16:24.523 | DEBUG    | __main__:trials:24 - Trial = 208/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.525 | DEBUG    | __main__:trials:29 - Trial = 208/30000 | Total reward = 24.88
2022-01-26 14:16:24.528 | DEBUG    | __main__:trials:26 - Trial = 209/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.528 | DEBUG    | __main__:trials:29 - Trial = 209/30000 | Total reward = 18.83
2022-01-26 14:16:24.532 | DEBUG    | __main__:trials:24 - Trial = 210/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.534 | DEBUG    | __main__:trials:29 - Trial = 210/30000 | Total reward = 40.83
2022-01-26 14:16:24.536 | DEBUG    | __main__:trials:26 - Trial = 211/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.537 | DEBUG    | __main__:trials:29 - Trial = 211/30000 | Total reward = 10.83
2022-01-26 14:16:24.539 | DEBUG    | __main__:trials:26 - Trial = 212/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.541 | DEBUG    | __main__:trials:29 - Trial = 212/30000 | Total reward = 10.83
2022-01-26 14:16:24.542 | DEBUG    | __main__:trials:26 - Trial = 213/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.544 | DEBUG    | __main__:trials:29 - Trial = 213/30000 | Total reward = 10.83
2022-01-26 14:16:24.547 | DEBUG    | __main__:trials:24 - Trial = 214/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.548 | DEBUG    | __main__:trials:29 - Trial = 214/30000 | Total reward = 42.75
2022-01-26 14:16:24.550 | DEBUG    | __main__:trials:26 - Trial = 215/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.552 | DEBUG    | __main__:trials:29 - Trial = 215/30000 | Total reward = 10.83
2022-01-26 14:16:24.553 | DEBUG    | __main__:trials:26 - Trial = 216/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.555 | DEBUG    | __main__:trials:29 - Trial = 216/30000 | Total reward = 14.27
2022-01-26 14:16:24.558 | DEBUG    | __main__:trials:24 - Trial = 217/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.559 | DEBUG    | __main__:trials:29 - Trial = 217/30000 | Total reward = 60.09
2022-01-26 14:16:24.562 | DEBUG    | __main__:trials:24 - Trial = 218/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.564 | DEBUG    | __main__:trials:29 - Trial = 218/30000 | Total reward = 41.17
2022-01-26 14:16:24.566 | DEBUG    | __main__:trials:26 - Trial = 219/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.567 | DEBUG    | __main__:trials:29 - Trial = 219/30000 | Total reward = 10.83
2022-01-26 14:16:24.569 | DEBUG    | __main__:trials:26 - Trial = 220/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.571 | DEBUG    | __main__:trials:29 - Trial = 220/30000 | Total reward = 10.83
2022-01-26 14:16:24.574 | DEBUG    | __main__:trials:24 - Trial = 221/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.575 | DEBUG    | __main__:trials:29 - Trial = 221/30000 | Total reward = 47.23
2022-01-26 14:16:24.578 | DEBUG    | __main__:trials:24 - Trial = 222/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.580 | DEBUG    | __main__:trials:29 - Trial = 222/30000 | Total reward = 28.98
2022-01-26 14:16:24.584 | DEBUG    | __main__:trials:24 - Trial = 223/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.585 | DEBUG    | __main__:trials:29 - Trial = 223/30000 | Total reward = 25.30
2022-01-26 14:16:24.588 | DEBUG    | __main__:trials:26 - Trial = 224/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.589 | DEBUG    | __main__:trials:29 - Trial = 224/30000 | Total reward = 18.31
2022-01-26 14:16:24.591 | DEBUG    | __main__:trials:26 - Trial = 225/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.593 | DEBUG    | __main__:trials:29 - Trial = 225/30000 | Total reward = 23.82
2022-01-26 14:16:24.596 | DEBUG    | __main__:trials:24 - Trial = 226/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.597 | DEBUG    | __main__:trials:29 - Trial = 226/30000 | Total reward = 43.20
2022-01-26 14:16:24.601 | DEBUG    | __main__:trials:24 - Trial = 227/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.602 | DEBUG    | __main__:trials:29 - Trial = 227/30000 | Total reward = 42.44
2022-01-26 14:16:24.605 | DEBUG    | __main__:trials:24 - Trial = 228/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.607 | DEBUG    | __main__:trials:29 - Trial = 228/30000 | Total reward = 42.95
2022-01-26 14:16:24.610 | DEBUG    | __main__:trials:24 - Trial = 229/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.611 | DEBUG    | __main__:trials:29 - Trial = 229/30000 | Total reward = 28.40
2022-01-26 14:16:24.614 | DEBUG    | __main__:trials:24 - Trial = 230/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.616 | DEBUG    | __main__:trials:29 - Trial = 230/30000 | Total reward = 40.05
2022-01-26 14:16:24.620 | DEBUG    | __main__:trials:24 - Trial = 231/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.621 | DEBUG    | __main__:trials:29 - Trial = 231/30000 | Total reward = 49.01
2022-01-26 14:16:24.624 | DEBUG    | __main__:trials:24 - Trial = 232/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.625 | DEBUG    | __main__:trials:29 - Trial = 232/30000 | Total reward = 46.47
2022-01-26 14:16:24.629 | DEBUG    | __main__:trials:24 - Trial = 233/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.630 | DEBUG    | __main__:trials:29 - Trial = 233/30000 | Total reward = 42.89
2022-01-26 14:16:24.634 | DEBUG    | __main__:trials:24 - Trial = 234/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.636 | DEBUG    | __main__:trials:29 - Trial = 234/30000 | Total reward = 40.76
2022-01-26 14:16:24.639 | DEBUG    | __main__:trials:24 - Trial = 235/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.641 | DEBUG    | __main__:trials:29 - Trial = 235/30000 | Total reward = 38.88
2022-01-26 14:16:24.645 | DEBUG    | __main__:trials:24 - Trial = 236/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.647 | DEBUG    | __main__:trials:29 - Trial = 236/30000 | Total reward = 34.65
2022-01-26 14:16:24.651 | DEBUG    | __main__:trials:24 - Trial = 237/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.651 | DEBUG    | __main__:trials:29 - Trial = 237/30000 | Total reward = 23.31
2022-01-26 14:16:24.654 | DEBUG    | __main__:trials:26 - Trial = 238/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.655 | DEBUG    | __main__:trials:29 - Trial = 238/30000 | Total reward = 10.83
2022-01-26 14:16:24.659 | DEBUG    | __main__:trials:24 - Trial = 239/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.661 | DEBUG    | __main__:trials:29 - Trial = 239/30000 | Total reward = 19.70
2022-01-26 14:16:24.664 | DEBUG    | __main__:trials:24 - Trial = 240/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.665 | DEBUG    | __main__:trials:29 - Trial = 240/30000 | Total reward = 32.28
2022-01-26 14:16:24.667 | DEBUG    | __main__:trials:26 - Trial = 241/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.669 | DEBUG    | __main__:trials:29 - Trial = 241/30000 | Total reward = 14.81
2022-01-26 14:16:24.671 | DEBUG    | __main__:trials:26 - Trial = 242/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.673 | DEBUG    | __main__:trials:29 - Trial = 242/30000 | Total reward = 10.83
2022-01-26 14:16:24.674 | DEBUG    | __main__:trials:26 - Trial = 243/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.675 | DEBUG    | __main__:trials:29 - Trial = 243/30000 | Total reward = 10.83
2022-01-26 14:16:24.677 | DEBUG    | __main__:trials:26 - Trial = 244/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.678 | DEBUG    | __main__:trials:29 - Trial = 244/30000 | Total reward = 10.83
2022-01-26 14:16:24.681 | DEBUG    | __main__:trials:26 - Trial = 245/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.683 | DEBUG    | __main__:trials:29 - Trial = 245/30000 | Total reward = 10.83
2022-01-26 14:16:24.686 | DEBUG    | __main__:trials:24 - Trial = 246/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.688 | DEBUG    | __main__:trials:29 - Trial = 246/30000 | Total reward = 28.78
2022-01-26 14:16:24.691 | DEBUG    | __main__:trials:24 - Trial = 247/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.693 | DEBUG    | __main__:trials:29 - Trial = 247/30000 | Total reward = 29.97
2022-01-26 14:16:24.696 | DEBUG    | __main__:trials:24 - Trial = 248/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.698 | DEBUG    | __main__:trials:29 - Trial = 248/30000 | Total reward = 14.02
2022-01-26 14:16:24.700 | DEBUG    | __main__:trials:26 - Trial = 249/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.702 | DEBUG    | __main__:trials:29 - Trial = 249/30000 | Total reward = 8.83
2022-01-26 14:16:24.705 | DEBUG    | __main__:trials:24 - Trial = 250/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.706 | DEBUG    | __main__:trials:29 - Trial = 250/30000 | Total reward = 43.54
2022-01-26 14:16:24.709 | DEBUG    | __main__:trials:26 - Trial = 251/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.709 | DEBUG    | __main__:trials:29 - Trial = 251/30000 | Total reward = 9.16
2022-01-26 14:16:24.713 | DEBUG    | __main__:trials:24 - Trial = 252/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.714 | DEBUG    | __main__:trials:29 - Trial = 252/30000 | Total reward = 32.05
2022-01-26 14:16:24.718 | DEBUG    | __main__:trials:24 - Trial = 253/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.720 | DEBUG    | __main__:trials:29 - Trial = 253/30000 | Total reward = 50.07
2022-01-26 14:16:24.724 | DEBUG    | __main__:trials:24 - Trial = 254/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.725 | DEBUG    | __main__:trials:29 - Trial = 254/30000 | Total reward = 66.25
2022-01-26 14:16:24.727 | DEBUG    | __main__:trials:26 - Trial = 255/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.729 | DEBUG    | __main__:trials:29 - Trial = 255/30000 | Total reward = 16.17
2022-01-26 14:16:24.731 | DEBUG    | __main__:trials:26 - Trial = 256/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.733 | DEBUG    | __main__:trials:29 - Trial = 256/30000 | Total reward = 7.98
2022-01-26 14:16:24.735 | DEBUG    | __main__:trials:26 - Trial = 257/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.736 | DEBUG    | __main__:trials:29 - Trial = 257/30000 | Total reward = 10.83
2022-01-26 14:16:24.740 | DEBUG    | __main__:trials:24 - Trial = 258/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.742 | DEBUG    | __main__:trials:29 - Trial = 258/30000 | Total reward = 21.52
2022-01-26 14:16:24.746 | DEBUG    | __main__:trials:24 - Trial = 259/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.747 | DEBUG    | __main__:trials:29 - Trial = 259/30000 | Total reward = 41.93
2022-01-26 14:16:24.749 | DEBUG    | __main__:trials:26 - Trial = 260/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.751 | DEBUG    | __main__:trials:29 - Trial = 260/30000 | Total reward = 17.84
2022-01-26 14:16:24.754 | DEBUG    | __main__:trials:24 - Trial = 261/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.755 | DEBUG    | __main__:trials:29 - Trial = 261/30000 | Total reward = 45.39
2022-01-26 14:16:24.758 | DEBUG    | __main__:trials:24 - Trial = 262/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.760 | DEBUG    | __main__:trials:29 - Trial = 262/30000 | Total reward = 49.65
2022-01-26 14:16:24.764 | DEBUG    | __main__:trials:24 - Trial = 263/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.765 | DEBUG    | __main__:trials:29 - Trial = 263/30000 | Total reward = 43.97
2022-01-26 14:16:24.767 | DEBUG    | __main__:trials:26 - Trial = 264/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.769 | DEBUG    | __main__:trials:29 - Trial = 264/30000 | Total reward = 10.83
2022-01-26 14:16:24.772 | DEBUG    | __main__:trials:24 - Trial = 265/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.773 | DEBUG    | __main__:trials:29 - Trial = 265/30000 | Total reward = 43.52
2022-01-26 14:16:24.776 | DEBUG    | __main__:trials:24 - Trial = 266/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.778 | DEBUG    | __main__:trials:29 - Trial = 266/30000 | Total reward = 42.80
2022-01-26 14:16:24.779 | DEBUG    | __main__:trials:26 - Trial = 267/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.780 | DEBUG    | __main__:trials:29 - Trial = 267/30000 | Total reward = 10.83
2022-01-26 14:16:24.783 | DEBUG    | __main__:trials:24 - Trial = 268/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.784 | DEBUG    | __main__:trials:29 - Trial = 268/30000 | Total reward = 36.64
2022-01-26 14:16:24.788 | DEBUG    | __main__:trials:24 - Trial = 269/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.789 | DEBUG    | __main__:trials:29 - Trial = 269/30000 | Total reward = 24.07
2022-01-26 14:16:24.793 | DEBUG    | __main__:trials:24 - Trial = 270/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.794 | DEBUG    | __main__:trials:29 - Trial = 270/30000 | Total reward = 42.96
2022-01-26 14:16:24.798 | DEBUG    | __main__:trials:24 - Trial = 271/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.800 | DEBUG    | __main__:trials:29 - Trial = 271/30000 | Total reward = 23.13
2022-01-26 14:16:24.801 | DEBUG    | __main__:trials:26 - Trial = 272/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.802 | DEBUG    | __main__:trials:29 - Trial = 272/30000 | Total reward = 10.83
2022-01-26 14:16:24.804 | DEBUG    | __main__:trials:26 - Trial = 273/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.805 | DEBUG    | __main__:trials:29 - Trial = 273/30000 | Total reward = 7.98
2022-01-26 14:16:24.808 | DEBUG    | __main__:trials:24 - Trial = 274/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.809 | DEBUG    | __main__:trials:29 - Trial = 274/30000 | Total reward = 44.26
2022-01-26 14:16:24.813 | DEBUG    | __main__:trials:24 - Trial = 275/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.814 | DEBUG    | __main__:trials:29 - Trial = 275/30000 | Total reward = 42.13
2022-01-26 14:16:24.816 | DEBUG    | __main__:trials:26 - Trial = 276/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.818 | DEBUG    | __main__:trials:29 - Trial = 276/30000 | Total reward = 10.83
2022-01-26 14:16:24.820 | DEBUG    | __main__:trials:26 - Trial = 277/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.822 | DEBUG    | __main__:trials:29 - Trial = 277/30000 | Total reward = 13.49
2022-01-26 14:16:24.823 | DEBUG    | __main__:trials:26 - Trial = 278/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.824 | DEBUG    | __main__:trials:29 - Trial = 278/30000 | Total reward = 10.83
2022-01-26 14:16:24.826 | DEBUG    | __main__:trials:26 - Trial = 279/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.826 | DEBUG    | __main__:trials:29 - Trial = 279/30000 | Total reward = 10.83
2022-01-26 14:16:24.830 | DEBUG    | __main__:trials:24 - Trial = 280/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.830 | DEBUG    | __main__:trials:29 - Trial = 280/30000 | Total reward = 29.16
2022-01-26 14:16:24.835 | DEBUG    | __main__:trials:24 - Trial = 281/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.835 | DEBUG    | __main__:trials:29 - Trial = 281/30000 | Total reward = 37.57
2022-01-26 14:16:24.839 | DEBUG    | __main__:trials:24 - Trial = 282/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.841 | DEBUG    | __main__:trials:29 - Trial = 282/30000 | Total reward = 41.43
2022-01-26 14:16:24.844 | DEBUG    | __main__:trials:24 - Trial = 283/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.846 | DEBUG    | __main__:trials:29 - Trial = 283/30000 | Total reward = 39.16
2022-01-26 14:16:24.847 | DEBUG    | __main__:trials:26 - Trial = 284/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.848 | DEBUG    | __main__:trials:29 - Trial = 284/30000 | Total reward = 7.70
2022-01-26 14:16:24.852 | DEBUG    | __main__:trials:24 - Trial = 285/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.852 | DEBUG    | __main__:trials:29 - Trial = 285/30000 | Total reward = 31.89
2022-01-26 14:16:24.856 | DEBUG    | __main__:trials:24 - Trial = 286/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.856 | DEBUG    | __main__:trials:29 - Trial = 286/30000 | Total reward = 49.36
2022-01-26 14:16:24.860 | DEBUG    | __main__:trials:24 - Trial = 287/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.862 | DEBUG    | __main__:trials:29 - Trial = 287/30000 | Total reward = 57.49
2022-01-26 14:16:24.864 | DEBUG    | __main__:trials:26 - Trial = 288/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.865 | DEBUG    | __main__:trials:29 - Trial = 288/30000 | Total reward = 10.83
2022-01-26 14:16:24.868 | DEBUG    | __main__:trials:26 - Trial = 289/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.869 | DEBUG    | __main__:trials:29 - Trial = 289/30000 | Total reward = 9.16
2022-01-26 14:16:24.872 | DEBUG    | __main__:trials:26 - Trial = 290/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.872 | DEBUG    | __main__:trials:29 - Trial = 290/30000 | Total reward = 21.56
2022-01-26 14:16:24.874 | DEBUG    | __main__:trials:26 - Trial = 291/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.875 | DEBUG    | __main__:trials:29 - Trial = 291/30000 | Total reward = 10.83
2022-01-26 14:16:24.879 | DEBUG    | __main__:trials:24 - Trial = 292/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.880 | DEBUG    | __main__:trials:29 - Trial = 292/30000 | Total reward = 50.40
2022-01-26 14:16:24.883 | DEBUG    | __main__:trials:26 - Trial = 293/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.885 | DEBUG    | __main__:trials:29 - Trial = 293/30000 | Total reward = 13.89
2022-01-26 14:16:24.888 | DEBUG    | __main__:trials:24 - Trial = 294/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.888 | DEBUG    | __main__:trials:29 - Trial = 294/30000 | Total reward = 44.66
2022-01-26 14:16:24.892 | DEBUG    | __main__:trials:24 - Trial = 295/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.893 | DEBUG    | __main__:trials:29 - Trial = 295/30000 | Total reward = 35.64
2022-01-26 14:16:24.896 | DEBUG    | __main__:trials:24 - Trial = 296/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.897 | DEBUG    | __main__:trials:29 - Trial = 296/30000 | Total reward = 40.93
2022-01-26 14:16:24.901 | DEBUG    | __main__:trials:24 - Trial = 297/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.902 | DEBUG    | __main__:trials:29 - Trial = 297/30000 | Total reward = 21.48
2022-01-26 14:16:24.904 | DEBUG    | __main__:trials:26 - Trial = 298/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.905 | DEBUG    | __main__:trials:29 - Trial = 298/30000 | Total reward = 11.12
2022-01-26 14:16:24.908 | DEBUG    | __main__:trials:24 - Trial = 299/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.909 | DEBUG    | __main__:trials:29 - Trial = 299/30000 | Total reward = 48.90
2022-01-26 14:16:24.912 | DEBUG    | __main__:trials:26 - Trial = 300/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.913 | DEBUG    | __main__:trials:29 - Trial = 300/30000 | Total reward = 15.71
2022-01-26 14:16:24.915 | DEBUG    | __main__:trials:26 - Trial = 301/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.915 | DEBUG    | __main__:trials:29 - Trial = 301/30000 | Total reward = 10.83
2022-01-26 14:16:24.919 | DEBUG    | __main__:trials:24 - Trial = 302/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.920 | DEBUG    | __main__:trials:29 - Trial = 302/30000 | Total reward = 42.68
2022-01-26 14:16:24.923 | DEBUG    | __main__:trials:24 - Trial = 303/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.924 | DEBUG    | __main__:trials:29 - Trial = 303/30000 | Total reward = 32.18
2022-01-26 14:16:24.927 | DEBUG    | __main__:trials:26 - Trial = 304/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.928 | DEBUG    | __main__:trials:29 - Trial = 304/30000 | Total reward = 26.93
2022-01-26 14:16:24.931 | DEBUG    | __main__:trials:24 - Trial = 305/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.933 | DEBUG    | __main__:trials:29 - Trial = 305/30000 | Total reward = 48.29
2022-01-26 14:16:24.935 | DEBUG    | __main__:trials:26 - Trial = 306/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.936 | DEBUG    | __main__:trials:29 - Trial = 306/30000 | Total reward = 16.60
2022-01-26 14:16:24.939 | DEBUG    | __main__:trials:24 - Trial = 307/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.940 | DEBUG    | __main__:trials:29 - Trial = 307/30000 | Total reward = 43.32
2022-01-26 14:16:24.944 | DEBUG    | __main__:trials:24 - Trial = 308/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.945 | DEBUG    | __main__:trials:29 - Trial = 308/30000 | Total reward = 32.14
2022-01-26 14:16:24.948 | DEBUG    | __main__:trials:24 - Trial = 309/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.949 | DEBUG    | __main__:trials:29 - Trial = 309/30000 | Total reward = 51.04
2022-01-26 14:16:24.952 | DEBUG    | __main__:trials:24 - Trial = 310/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.952 | DEBUG    | __main__:trials:29 - Trial = 310/30000 | Total reward = 42.46
2022-01-26 14:16:24.955 | DEBUG    | __main__:trials:24 - Trial = 311/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.956 | DEBUG    | __main__:trials:29 - Trial = 311/30000 | Total reward = 32.55
2022-01-26 14:16:24.959 | DEBUG    | __main__:trials:24 - Trial = 312/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.960 | DEBUG    | __main__:trials:29 - Trial = 312/30000 | Total reward = 47.72
2022-01-26 14:16:24.963 | DEBUG    | __main__:trials:24 - Trial = 313/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.964 | DEBUG    | __main__:trials:29 - Trial = 313/30000 | Total reward = 36.68
2022-01-26 14:16:24.968 | DEBUG    | __main__:trials:24 - Trial = 314/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.968 | DEBUG    | __main__:trials:29 - Trial = 314/30000 | Total reward = 42.63
2022-01-26 14:16:24.971 | DEBUG    | __main__:trials:24 - Trial = 315/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.972 | DEBUG    | __main__:trials:29 - Trial = 315/30000 | Total reward = 38.89
2022-01-26 14:16:24.975 | DEBUG    | __main__:trials:24 - Trial = 316/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.976 | DEBUG    | __main__:trials:29 - Trial = 316/30000 | Total reward = 44.62
2022-01-26 14:16:24.979 | DEBUG    | __main__:trials:24 - Trial = 317/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.980 | DEBUG    | __main__:trials:29 - Trial = 317/30000 | Total reward = 51.66
2022-01-26 14:16:24.983 | DEBUG    | __main__:trials:26 - Trial = 318/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.983 | DEBUG    | __main__:trials:29 - Trial = 318/30000 | Total reward = 18.63
2022-01-26 14:16:24.986 | DEBUG    | __main__:trials:24 - Trial = 319/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.987 | DEBUG    | __main__:trials:29 - Trial = 319/30000 | Total reward = 51.08
2022-01-26 14:16:24.990 | DEBUG    | __main__:trials:24 - Trial = 320/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.991 | DEBUG    | __main__:trials:29 - Trial = 320/30000 | Total reward = 47.41
2022-01-26 14:16:24.994 | DEBUG    | __main__:trials:24 - Trial = 321/30000 | Max number of steps (20) reached
2022-01-26 14:16:24.995 | DEBUG    | __main__:trials:29 - Trial = 321/30000 | Total reward = 43.36
2022-01-26 14:16:24.997 | DEBUG    | __main__:trials:26 - Trial = 322/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:24.998 | DEBUG    | __main__:trials:29 - Trial = 322/30000 | Total reward = 21.83
2022-01-26 14:16:25.001 | DEBUG    | __main__:trials:24 - Trial = 323/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.002 | DEBUG    | __main__:trials:29 - Trial = 323/30000 | Total reward = 27.97
2022-01-26 14:16:25.005 | DEBUG    | __main__:trials:24 - Trial = 324/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.006 | DEBUG    | __main__:trials:29 - Trial = 324/30000 | Total reward = 49.77
2022-01-26 14:16:25.009 | DEBUG    | __main__:trials:24 - Trial = 325/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.010 | DEBUG    | __main__:trials:29 - Trial = 325/30000 | Total reward = 44.52
2022-01-26 14:16:25.012 | DEBUG    | __main__:trials:26 - Trial = 326/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.013 | DEBUG    | __main__:trials:29 - Trial = 326/30000 | Total reward = 17.97
2022-01-26 14:16:25.016 | DEBUG    | __main__:trials:24 - Trial = 327/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.017 | DEBUG    | __main__:trials:29 - Trial = 327/30000 | Total reward = 28.04
2022-01-26 14:16:25.019 | DEBUG    | __main__:trials:26 - Trial = 328/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.020 | DEBUG    | __main__:trials:29 - Trial = 328/30000 | Total reward = 18.42
2022-01-26 14:16:25.023 | DEBUG    | __main__:trials:24 - Trial = 329/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.023 | DEBUG    | __main__:trials:29 - Trial = 329/30000 | Total reward = 45.18
2022-01-26 14:16:25.026 | DEBUG    | __main__:trials:24 - Trial = 330/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.027 | DEBUG    | __main__:trials:29 - Trial = 330/30000 | Total reward = 45.73
2022-01-26 14:16:25.030 | DEBUG    | __main__:trials:24 - Trial = 331/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.031 | DEBUG    | __main__:trials:29 - Trial = 331/30000 | Total reward = 38.44
2022-01-26 14:16:25.033 | DEBUG    | __main__:trials:26 - Trial = 332/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.034 | DEBUG    | __main__:trials:29 - Trial = 332/30000 | Total reward = 13.88
2022-01-26 14:16:25.037 | DEBUG    | __main__:trials:24 - Trial = 333/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.038 | DEBUG    | __main__:trials:29 - Trial = 333/30000 | Total reward = 29.30
2022-01-26 14:16:25.039 | DEBUG    | __main__:trials:26 - Trial = 334/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.040 | DEBUG    | __main__:trials:29 - Trial = 334/30000 | Total reward = 10.82
2022-01-26 14:16:25.043 | DEBUG    | __main__:trials:24 - Trial = 335/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.044 | DEBUG    | __main__:trials:29 - Trial = 335/30000 | Total reward = 45.79
2022-01-26 14:16:25.046 | DEBUG    | __main__:trials:26 - Trial = 336/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.047 | DEBUG    | __main__:trials:29 - Trial = 336/30000 | Total reward = 10.83
2022-01-26 14:16:25.050 | DEBUG    | __main__:trials:24 - Trial = 337/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.051 | DEBUG    | __main__:trials:29 - Trial = 337/30000 | Total reward = 37.35
2022-01-26 14:16:25.052 | DEBUG    | __main__:trials:26 - Trial = 338/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.053 | DEBUG    | __main__:trials:29 - Trial = 338/30000 | Total reward = 10.82
2022-01-26 14:16:25.056 | DEBUG    | __main__:trials:24 - Trial = 339/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.057 | DEBUG    | __main__:trials:29 - Trial = 339/30000 | Total reward = 44.25
2022-01-26 14:16:25.060 | DEBUG    | __main__:trials:24 - Trial = 340/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.061 | DEBUG    | __main__:trials:29 - Trial = 340/30000 | Total reward = 30.32
2022-01-26 14:16:25.064 | DEBUG    | __main__:trials:24 - Trial = 341/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.065 | DEBUG    | __main__:trials:29 - Trial = 341/30000 | Total reward = 31.97
2022-01-26 14:16:25.067 | DEBUG    | __main__:trials:26 - Trial = 342/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.067 | DEBUG    | __main__:trials:29 - Trial = 342/30000 | Total reward = 10.83
2022-01-26 14:16:25.071 | DEBUG    | __main__:trials:24 - Trial = 343/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.071 | DEBUG    | __main__:trials:29 - Trial = 343/30000 | Total reward = 42.20
2022-01-26 14:16:25.075 | DEBUG    | __main__:trials:24 - Trial = 344/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.075 | DEBUG    | __main__:trials:29 - Trial = 344/30000 | Total reward = 31.71
2022-01-26 14:16:25.078 | DEBUG    | __main__:trials:26 - Trial = 345/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.079 | DEBUG    | __main__:trials:29 - Trial = 345/30000 | Total reward = 22.98
2022-01-26 14:16:25.081 | DEBUG    | __main__:trials:26 - Trial = 346/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.082 | DEBUG    | __main__:trials:29 - Trial = 346/30000 | Total reward = 21.88
2022-01-26 14:16:25.084 | DEBUG    | __main__:trials:26 - Trial = 347/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.085 | DEBUG    | __main__:trials:29 - Trial = 347/30000 | Total reward = 10.82
2022-01-26 14:16:25.088 | DEBUG    | __main__:trials:24 - Trial = 348/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.089 | DEBUG    | __main__:trials:29 - Trial = 348/30000 | Total reward = 48.22
2022-01-26 14:16:25.091 | DEBUG    | __main__:trials:26 - Trial = 349/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.091 | DEBUG    | __main__:trials:29 - Trial = 349/30000 | Total reward = 10.83
2022-01-26 14:16:25.093 | DEBUG    | __main__:trials:26 - Trial = 350/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.094 | DEBUG    | __main__:trials:29 - Trial = 350/30000 | Total reward = 10.83
2022-01-26 14:16:25.097 | DEBUG    | __main__:trials:24 - Trial = 351/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.098 | DEBUG    | __main__:trials:29 - Trial = 351/30000 | Total reward = 27.59
2022-01-26 14:16:25.100 | DEBUG    | __main__:trials:26 - Trial = 352/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.100 | DEBUG    | __main__:trials:29 - Trial = 352/30000 | Total reward = 9.16
2022-01-26 14:16:25.102 | DEBUG    | __main__:trials:26 - Trial = 353/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.103 | DEBUG    | __main__:trials:29 - Trial = 353/30000 | Total reward = 10.18
2022-01-26 14:16:25.106 | DEBUG    | __main__:trials:24 - Trial = 354/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.107 | DEBUG    | __main__:trials:29 - Trial = 354/30000 | Total reward = 42.05
2022-01-26 14:16:25.110 | DEBUG    | __main__:trials:24 - Trial = 355/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.111 | DEBUG    | __main__:trials:29 - Trial = 355/30000 | Total reward = 39.03
2022-01-26 14:16:25.115 | DEBUG    | __main__:trials:24 - Trial = 356/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.116 | DEBUG    | __main__:trials:29 - Trial = 356/30000 | Total reward = 45.08
2022-01-26 14:16:25.119 | DEBUG    | __main__:trials:24 - Trial = 357/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.120 | DEBUG    | __main__:trials:29 - Trial = 357/30000 | Total reward = 41.57
2022-01-26 14:16:25.123 | DEBUG    | __main__:trials:24 - Trial = 358/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.124 | DEBUG    | __main__:trials:29 - Trial = 358/30000 | Total reward = 37.57
2022-01-26 14:16:25.127 | DEBUG    | __main__:trials:24 - Trial = 359/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.128 | DEBUG    | __main__:trials:29 - Trial = 359/30000 | Total reward = 37.57
2022-01-26 14:16:25.131 | DEBUG    | __main__:trials:24 - Trial = 360/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.131 | DEBUG    | __main__:trials:29 - Trial = 360/30000 | Total reward = 37.57
2022-01-26 14:16:25.134 | DEBUG    | __main__:trials:24 - Trial = 361/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.135 | DEBUG    | __main__:trials:29 - Trial = 361/30000 | Total reward = 59.21
2022-01-26 14:16:25.138 | DEBUG    | __main__:trials:24 - Trial = 362/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.140 | DEBUG    | __main__:trials:29 - Trial = 362/30000 | Total reward = 38.97
2022-01-26 14:16:25.143 | DEBUG    | __main__:trials:24 - Trial = 363/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.144 | DEBUG    | __main__:trials:29 - Trial = 363/30000 | Total reward = 36.98
2022-01-26 14:16:25.148 | DEBUG    | __main__:trials:24 - Trial = 364/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.150 | DEBUG    | __main__:trials:29 - Trial = 364/30000 | Total reward = 32.69
2022-01-26 14:16:25.153 | DEBUG    | __main__:trials:24 - Trial = 365/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.154 | DEBUG    | __main__:trials:29 - Trial = 365/30000 | Total reward = 45.36
2022-01-26 14:16:25.158 | DEBUG    | __main__:trials:24 - Trial = 366/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.159 | DEBUG    | __main__:trials:29 - Trial = 366/30000 | Total reward = 37.03
2022-01-26 14:16:25.162 | DEBUG    | __main__:trials:24 - Trial = 367/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.164 | DEBUG    | __main__:trials:29 - Trial = 367/30000 | Total reward = 41.97
2022-01-26 14:16:25.167 | DEBUG    | __main__:trials:24 - Trial = 368/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.168 | DEBUG    | __main__:trials:29 - Trial = 368/30000 | Total reward = 43.19
2022-01-26 14:16:25.171 | DEBUG    | __main__:trials:24 - Trial = 369/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.173 | DEBUG    | __main__:trials:29 - Trial = 369/30000 | Total reward = 43.82
2022-01-26 14:16:25.176 | DEBUG    | __main__:trials:24 - Trial = 370/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.178 | DEBUG    | __main__:trials:29 - Trial = 370/30000 | Total reward = 56.59
2022-01-26 14:16:25.181 | DEBUG    | __main__:trials:24 - Trial = 371/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.182 | DEBUG    | __main__:trials:29 - Trial = 371/30000 | Total reward = 37.57
2022-01-26 14:16:25.185 | DEBUG    | __main__:trials:24 - Trial = 372/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.187 | DEBUG    | __main__:trials:29 - Trial = 372/30000 | Total reward = 36.71
2022-01-26 14:16:25.191 | DEBUG    | __main__:trials:24 - Trial = 373/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.191 | DEBUG    | __main__:trials:29 - Trial = 373/30000 | Total reward = 31.21
2022-01-26 14:16:25.195 | DEBUG    | __main__:trials:24 - Trial = 374/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.197 | DEBUG    | __main__:trials:29 - Trial = 374/30000 | Total reward = 47.49
2022-01-26 14:16:25.200 | DEBUG    | __main__:trials:24 - Trial = 375/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.201 | DEBUG    | __main__:trials:29 - Trial = 375/30000 | Total reward = 48.76
2022-01-26 14:16:25.204 | DEBUG    | __main__:trials:26 - Trial = 376/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.205 | DEBUG    | __main__:trials:29 - Trial = 376/30000 | Total reward = 26.68
2022-01-26 14:16:25.209 | DEBUG    | __main__:trials:24 - Trial = 377/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.210 | DEBUG    | __main__:trials:29 - Trial = 377/30000 | Total reward = 36.19
2022-01-26 14:16:25.213 | DEBUG    | __main__:trials:24 - Trial = 378/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.215 | DEBUG    | __main__:trials:29 - Trial = 378/30000 | Total reward = 48.49
2022-01-26 14:16:25.218 | DEBUG    | __main__:trials:24 - Trial = 379/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.220 | DEBUG    | __main__:trials:29 - Trial = 379/30000 | Total reward = 48.86
2022-01-26 14:16:25.224 | DEBUG    | __main__:trials:24 - Trial = 380/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.224 | DEBUG    | __main__:trials:29 - Trial = 380/30000 | Total reward = 45.66
2022-01-26 14:16:25.228 | DEBUG    | __main__:trials:24 - Trial = 381/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.229 | DEBUG    | __main__:trials:29 - Trial = 381/30000 | Total reward = 49.25
2022-01-26 14:16:25.232 | DEBUG    | __main__:trials:24 - Trial = 382/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.234 | DEBUG    | __main__:trials:29 - Trial = 382/30000 | Total reward = 34.95
2022-01-26 14:16:25.238 | DEBUG    | __main__:trials:24 - Trial = 383/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.239 | DEBUG    | __main__:trials:29 - Trial = 383/30000 | Total reward = 45.43
2022-01-26 14:16:25.242 | DEBUG    | __main__:trials:24 - Trial = 384/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.244 | DEBUG    | __main__:trials:29 - Trial = 384/30000 | Total reward = 35.03
2022-01-26 14:16:25.248 | DEBUG    | __main__:trials:24 - Trial = 385/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.249 | DEBUG    | __main__:trials:29 - Trial = 385/30000 | Total reward = 41.74
2022-01-26 14:16:25.252 | DEBUG    | __main__:trials:24 - Trial = 386/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.253 | DEBUG    | __main__:trials:29 - Trial = 386/30000 | Total reward = 37.69
2022-01-26 14:16:25.256 | DEBUG    | __main__:trials:24 - Trial = 387/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.258 | DEBUG    | __main__:trials:29 - Trial = 387/30000 | Total reward = 37.57
2022-01-26 14:16:25.260 | DEBUG    | __main__:trials:26 - Trial = 388/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.262 | DEBUG    | __main__:trials:29 - Trial = 388/30000 | Total reward = 13.73
2022-01-26 14:16:25.265 | DEBUG    | __main__:trials:24 - Trial = 389/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.266 | DEBUG    | __main__:trials:29 - Trial = 389/30000 | Total reward = 35.76
2022-01-26 14:16:25.270 | DEBUG    | __main__:trials:24 - Trial = 390/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.271 | DEBUG    | __main__:trials:29 - Trial = 390/30000 | Total reward = 27.54
2022-01-26 14:16:25.274 | DEBUG    | __main__:trials:24 - Trial = 391/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.276 | DEBUG    | __main__:trials:29 - Trial = 391/30000 | Total reward = 33.57
2022-01-26 14:16:25.280 | DEBUG    | __main__:trials:24 - Trial = 392/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.282 | DEBUG    | __main__:trials:29 - Trial = 392/30000 | Total reward = 38.43
2022-01-26 14:16:25.285 | DEBUG    | __main__:trials:24 - Trial = 393/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.286 | DEBUG    | __main__:trials:29 - Trial = 393/30000 | Total reward = 33.67
2022-01-26 14:16:25.290 | DEBUG    | __main__:trials:24 - Trial = 394/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.291 | DEBUG    | __main__:trials:29 - Trial = 394/30000 | Total reward = 33.12
2022-01-26 14:16:25.295 | DEBUG    | __main__:trials:24 - Trial = 395/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.297 | DEBUG    | __main__:trials:29 - Trial = 395/30000 | Total reward = 38.02
2022-01-26 14:16:25.300 | DEBUG    | __main__:trials:24 - Trial = 396/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.302 | DEBUG    | __main__:trials:29 - Trial = 396/30000 | Total reward = 39.62
2022-01-26 14:16:25.306 | DEBUG    | __main__:trials:24 - Trial = 397/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.307 | DEBUG    | __main__:trials:29 - Trial = 397/30000 | Total reward = 56.76
2022-01-26 14:16:25.311 | DEBUG    | __main__:trials:24 - Trial = 398/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.313 | DEBUG    | __main__:trials:29 - Trial = 398/30000 | Total reward = 32.92
2022-01-26 14:16:25.315 | DEBUG    | __main__:trials:26 - Trial = 399/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.316 | DEBUG    | __main__:trials:29 - Trial = 399/30000 | Total reward = 11.70
2022-01-26 14:16:25.319 | DEBUG    | __main__:trials:26 - Trial = 400/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.321 | DEBUG    | __main__:trials:29 - Trial = 400/30000 | Total reward = 13.32
2022-01-26 14:16:25.325 | DEBUG    | __main__:trials:24 - Trial = 401/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.326 | DEBUG    | __main__:trials:29 - Trial = 401/30000 | Total reward = 41.70
2022-01-26 14:16:25.330 | DEBUG    | __main__:trials:24 - Trial = 402/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.332 | DEBUG    | __main__:trials:29 - Trial = 402/30000 | Total reward = 37.37
2022-01-26 14:16:25.334 | DEBUG    | __main__:trials:26 - Trial = 403/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.336 | DEBUG    | __main__:trials:29 - Trial = 403/30000 | Total reward = 16.35
2022-01-26 14:16:25.339 | DEBUG    | __main__:trials:26 - Trial = 404/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.340 | DEBUG    | __main__:trials:29 - Trial = 404/30000 | Total reward = 9.83
2022-01-26 14:16:25.344 | DEBUG    | __main__:trials:24 - Trial = 405/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.345 | DEBUG    | __main__:trials:29 - Trial = 405/30000 | Total reward = 38.75
2022-01-26 14:16:25.350 | DEBUG    | __main__:trials:24 - Trial = 406/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.352 | DEBUG    | __main__:trials:29 - Trial = 406/30000 | Total reward = 48.14
2022-01-26 14:16:25.355 | DEBUG    | __main__:trials:24 - Trial = 407/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.357 | DEBUG    | __main__:trials:29 - Trial = 407/30000 | Total reward = 29.71
2022-01-26 14:16:25.361 | DEBUG    | __main__:trials:24 - Trial = 408/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.362 | DEBUG    | __main__:trials:29 - Trial = 408/30000 | Total reward = 45.24
2022-01-26 14:16:25.365 | DEBUG    | __main__:trials:26 - Trial = 409/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.367 | DEBUG    | __main__:trials:29 - Trial = 409/30000 | Total reward = 10.83
2022-01-26 14:16:25.370 | DEBUG    | __main__:trials:24 - Trial = 410/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.372 | DEBUG    | __main__:trials:29 - Trial = 410/30000 | Total reward = 56.92
2022-01-26 14:16:25.376 | DEBUG    | __main__:trials:24 - Trial = 411/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.377 | DEBUG    | __main__:trials:29 - Trial = 411/30000 | Total reward = 55.88
2022-01-26 14:16:25.381 | DEBUG    | __main__:trials:24 - Trial = 412/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.382 | DEBUG    | __main__:trials:29 - Trial = 412/30000 | Total reward = 20.90
2022-01-26 14:16:25.386 | DEBUG    | __main__:trials:24 - Trial = 413/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.387 | DEBUG    | __main__:trials:29 - Trial = 413/30000 | Total reward = 35.29
2022-01-26 14:16:25.391 | DEBUG    | __main__:trials:24 - Trial = 414/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.393 | DEBUG    | __main__:trials:29 - Trial = 414/30000 | Total reward = 30.45
2022-01-26 14:16:25.396 | DEBUG    | __main__:trials:24 - Trial = 415/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.397 | DEBUG    | __main__:trials:29 - Trial = 415/30000 | Total reward = 41.67
2022-01-26 14:16:25.400 | DEBUG    | __main__:trials:24 - Trial = 416/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.402 | DEBUG    | __main__:trials:29 - Trial = 416/30000 | Total reward = 40.64
2022-01-26 14:16:25.406 | DEBUG    | __main__:trials:24 - Trial = 417/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.407 | DEBUG    | __main__:trials:29 - Trial = 417/30000 | Total reward = 35.37
2022-01-26 14:16:25.411 | DEBUG    | __main__:trials:24 - Trial = 418/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.413 | DEBUG    | __main__:trials:29 - Trial = 418/30000 | Total reward = 42.49
2022-01-26 14:16:25.417 | DEBUG    | __main__:trials:24 - Trial = 419/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.419 | DEBUG    | __main__:trials:29 - Trial = 419/30000 | Total reward = 38.73
2022-01-26 14:16:25.423 | DEBUG    | __main__:trials:24 - Trial = 420/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.424 | DEBUG    | __main__:trials:29 - Trial = 420/30000 | Total reward = 31.03
2022-01-26 14:16:25.428 | DEBUG    | __main__:trials:24 - Trial = 421/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.430 | DEBUG    | __main__:trials:29 - Trial = 421/30000 | Total reward = 41.07
2022-01-26 14:16:25.434 | DEBUG    | __main__:trials:24 - Trial = 422/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.436 | DEBUG    | __main__:trials:29 - Trial = 422/30000 | Total reward = 40.44
2022-01-26 14:16:25.440 | DEBUG    | __main__:trials:24 - Trial = 423/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.442 | DEBUG    | __main__:trials:29 - Trial = 423/30000 | Total reward = 31.14
2022-01-26 14:16:25.446 | DEBUG    | __main__:trials:24 - Trial = 424/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.447 | DEBUG    | __main__:trials:29 - Trial = 424/30000 | Total reward = 50.84
2022-01-26 14:16:25.452 | DEBUG    | __main__:trials:24 - Trial = 425/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.453 | DEBUG    | __main__:trials:29 - Trial = 425/30000 | Total reward = 38.79
2022-01-26 14:16:25.457 | DEBUG    | __main__:trials:24 - Trial = 426/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.459 | DEBUG    | __main__:trials:29 - Trial = 426/30000 | Total reward = 33.84
2022-01-26 14:16:25.462 | DEBUG    | __main__:trials:24 - Trial = 427/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.464 | DEBUG    | __main__:trials:29 - Trial = 427/30000 | Total reward = 49.35
2022-01-26 14:16:25.467 | DEBUG    | __main__:trials:24 - Trial = 428/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.469 | DEBUG    | __main__:trials:29 - Trial = 428/30000 | Total reward = 32.92
2022-01-26 14:16:25.472 | DEBUG    | __main__:trials:26 - Trial = 429/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.474 | DEBUG    | __main__:trials:29 - Trial = 429/30000 | Total reward = 31.12
2022-01-26 14:16:25.478 | DEBUG    | __main__:trials:24 - Trial = 430/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.479 | DEBUG    | __main__:trials:29 - Trial = 430/30000 | Total reward = 32.50
2022-01-26 14:16:25.483 | DEBUG    | __main__:trials:24 - Trial = 431/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.485 | DEBUG    | __main__:trials:29 - Trial = 431/30000 | Total reward = 50.31
2022-01-26 14:16:25.488 | DEBUG    | __main__:trials:24 - Trial = 432/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.490 | DEBUG    | __main__:trials:29 - Trial = 432/30000 | Total reward = 36.98
2022-01-26 14:16:25.494 | DEBUG    | __main__:trials:24 - Trial = 433/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.495 | DEBUG    | __main__:trials:29 - Trial = 433/30000 | Total reward = 34.81
2022-01-26 14:16:25.499 | DEBUG    | __main__:trials:24 - Trial = 434/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.500 | DEBUG    | __main__:trials:29 - Trial = 434/30000 | Total reward = 34.21
2022-01-26 14:16:25.504 | DEBUG    | __main__:trials:24 - Trial = 435/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.506 | DEBUG    | __main__:trials:29 - Trial = 435/30000 | Total reward = 33.85
2022-01-26 14:16:25.509 | DEBUG    | __main__:trials:24 - Trial = 436/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.511 | DEBUG    | __main__:trials:29 - Trial = 436/30000 | Total reward = 32.77
2022-01-26 14:16:25.514 | DEBUG    | __main__:trials:24 - Trial = 437/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.516 | DEBUG    | __main__:trials:29 - Trial = 437/30000 | Total reward = 37.86
2022-01-26 14:16:25.520 | DEBUG    | __main__:trials:24 - Trial = 438/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.521 | DEBUG    | __main__:trials:29 - Trial = 438/30000 | Total reward = 49.75
2022-01-26 14:16:25.524 | DEBUG    | __main__:trials:24 - Trial = 439/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.526 | DEBUG    | __main__:trials:29 - Trial = 439/30000 | Total reward = 39.85
2022-01-26 14:16:25.528 | DEBUG    | __main__:trials:26 - Trial = 440/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.530 | DEBUG    | __main__:trials:29 - Trial = 440/30000 | Total reward = 16.15
2022-01-26 14:16:25.534 | DEBUG    | __main__:trials:24 - Trial = 441/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.536 | DEBUG    | __main__:trials:29 - Trial = 441/30000 | Total reward = 36.79
2022-01-26 14:16:25.539 | DEBUG    | __main__:trials:24 - Trial = 442/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.540 | DEBUG    | __main__:trials:29 - Trial = 442/30000 | Total reward = 30.61
2022-01-26 14:16:25.544 | DEBUG    | __main__:trials:24 - Trial = 443/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.544 | DEBUG    | __main__:trials:29 - Trial = 443/30000 | Total reward = 30.09
2022-01-26 14:16:25.548 | DEBUG    | __main__:trials:24 - Trial = 444/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.549 | DEBUG    | __main__:trials:29 - Trial = 444/30000 | Total reward = 41.53
2022-01-26 14:16:25.552 | DEBUG    | __main__:trials:26 - Trial = 445/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.554 | DEBUG    | __main__:trials:29 - Trial = 445/30000 | Total reward = 21.96
2022-01-26 14:16:25.557 | DEBUG    | __main__:trials:26 - Trial = 446/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.558 | DEBUG    | __main__:trials:29 - Trial = 446/30000 | Total reward = 9.18
2022-01-26 14:16:25.562 | DEBUG    | __main__:trials:24 - Trial = 447/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.563 | DEBUG    | __main__:trials:29 - Trial = 447/30000 | Total reward = 42.46
2022-01-26 14:16:25.567 | DEBUG    | __main__:trials:24 - Trial = 448/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.569 | DEBUG    | __main__:trials:29 - Trial = 448/30000 | Total reward = 38.10
2022-01-26 14:16:25.572 | DEBUG    | __main__:trials:24 - Trial = 449/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.573 | DEBUG    | __main__:trials:29 - Trial = 449/30000 | Total reward = 39.09
2022-01-26 14:16:25.577 | DEBUG    | __main__:trials:24 - Trial = 450/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.579 | DEBUG    | __main__:trials:29 - Trial = 450/30000 | Total reward = 35.65
2022-01-26 14:16:25.582 | DEBUG    | __main__:trials:24 - Trial = 451/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.584 | DEBUG    | __main__:trials:29 - Trial = 451/30000 | Total reward = 46.11
2022-01-26 14:16:25.588 | DEBUG    | __main__:trials:24 - Trial = 452/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.589 | DEBUG    | __main__:trials:29 - Trial = 452/30000 | Total reward = 36.44
2022-01-26 14:16:25.593 | DEBUG    | __main__:trials:24 - Trial = 453/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.594 | DEBUG    | __main__:trials:29 - Trial = 453/30000 | Total reward = 59.15
2022-01-26 14:16:25.598 | DEBUG    | __main__:trials:24 - Trial = 454/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.599 | DEBUG    | __main__:trials:29 - Trial = 454/30000 | Total reward = 51.77
2022-01-26 14:16:25.602 | DEBUG    | __main__:trials:24 - Trial = 455/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.604 | DEBUG    | __main__:trials:29 - Trial = 455/30000 | Total reward = 39.21
2022-01-26 14:16:25.607 | DEBUG    | __main__:trials:26 - Trial = 456/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.609 | DEBUG    | __main__:trials:29 - Trial = 456/30000 | Total reward = 20.08
2022-01-26 14:16:25.613 | DEBUG    | __main__:trials:24 - Trial = 457/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.613 | DEBUG    | __main__:trials:29 - Trial = 457/30000 | Total reward = 36.89
2022-01-26 14:16:25.618 | DEBUG    | __main__:trials:24 - Trial = 458/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.618 | DEBUG    | __main__:trials:29 - Trial = 458/30000 | Total reward = 32.54
2022-01-26 14:16:25.622 | DEBUG    | __main__:trials:24 - Trial = 459/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.624 | DEBUG    | __main__:trials:29 - Trial = 459/30000 | Total reward = 38.56
2022-01-26 14:16:25.627 | DEBUG    | __main__:trials:24 - Trial = 460/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.629 | DEBUG    | __main__:trials:29 - Trial = 460/30000 | Total reward = 37.57
2022-01-26 14:16:25.633 | DEBUG    | __main__:trials:24 - Trial = 461/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.634 | DEBUG    | __main__:trials:29 - Trial = 461/30000 | Total reward = 37.44
2022-01-26 14:16:25.637 | DEBUG    | __main__:trials:24 - Trial = 462/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.638 | DEBUG    | __main__:trials:29 - Trial = 462/30000 | Total reward = 28.90
2022-01-26 14:16:25.641 | DEBUG    | __main__:trials:24 - Trial = 463/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.643 | DEBUG    | __main__:trials:29 - Trial = 463/30000 | Total reward = 36.83
2022-01-26 14:16:25.646 | DEBUG    | __main__:trials:24 - Trial = 464/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.648 | DEBUG    | __main__:trials:29 - Trial = 464/30000 | Total reward = 50.86
2022-01-26 14:16:25.652 | DEBUG    | __main__:trials:24 - Trial = 465/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.653 | DEBUG    | __main__:trials:29 - Trial = 465/30000 | Total reward = 46.81
2022-01-26 14:16:25.657 | DEBUG    | __main__:trials:24 - Trial = 466/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.658 | DEBUG    | __main__:trials:29 - Trial = 466/30000 | Total reward = 14.12
2022-01-26 14:16:25.661 | DEBUG    | __main__:trials:26 - Trial = 467/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.663 | DEBUG    | __main__:trials:29 - Trial = 467/30000 | Total reward = 8.25
2022-01-26 14:16:25.666 | DEBUG    | __main__:trials:24 - Trial = 468/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.668 | DEBUG    | __main__:trials:29 - Trial = 468/30000 | Total reward = 54.64
2022-01-26 14:16:25.672 | DEBUG    | __main__:trials:24 - Trial = 469/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.673 | DEBUG    | __main__:trials:29 - Trial = 469/30000 | Total reward = 25.05
2022-01-26 14:16:25.677 | DEBUG    | __main__:trials:24 - Trial = 470/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.678 | DEBUG    | __main__:trials:29 - Trial = 470/30000 | Total reward = 31.06
2022-01-26 14:16:25.682 | DEBUG    | __main__:trials:26 - Trial = 471/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.683 | DEBUG    | __main__:trials:29 - Trial = 471/30000 | Total reward = 23.88
2022-01-26 14:16:25.687 | DEBUG    | __main__:trials:24 - Trial = 472/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.688 | DEBUG    | __main__:trials:29 - Trial = 472/30000 | Total reward = 27.66
2022-01-26 14:16:25.692 | DEBUG    | __main__:trials:24 - Trial = 473/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.693 | DEBUG    | __main__:trials:29 - Trial = 473/30000 | Total reward = 28.06
2022-01-26 14:16:25.697 | DEBUG    | __main__:trials:24 - Trial = 474/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.698 | DEBUG    | __main__:trials:29 - Trial = 474/30000 | Total reward = 29.74
2022-01-26 14:16:25.702 | DEBUG    | __main__:trials:24 - Trial = 475/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.704 | DEBUG    | __main__:trials:29 - Trial = 475/30000 | Total reward = 14.77
2022-01-26 14:16:25.707 | DEBUG    | __main__:trials:24 - Trial = 476/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.708 | DEBUG    | __main__:trials:29 - Trial = 476/30000 | Total reward = 28.72
2022-01-26 14:16:25.711 | DEBUG    | __main__:trials:24 - Trial = 477/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.713 | DEBUG    | __main__:trials:29 - Trial = 477/30000 | Total reward = 34.23
2022-01-26 14:16:25.717 | DEBUG    | __main__:trials:24 - Trial = 478/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.719 | DEBUG    | __main__:trials:29 - Trial = 478/30000 | Total reward = 34.08
2022-01-26 14:16:25.722 | DEBUG    | __main__:trials:24 - Trial = 479/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.724 | DEBUG    | __main__:trials:29 - Trial = 479/30000 | Total reward = 36.88
2022-01-26 14:16:25.728 | DEBUG    | __main__:trials:24 - Trial = 480/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.728 | DEBUG    | __main__:trials:29 - Trial = 480/30000 | Total reward = 22.78
2022-01-26 14:16:25.732 | DEBUG    | __main__:trials:24 - Trial = 481/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.733 | DEBUG    | __main__:trials:29 - Trial = 481/30000 | Total reward = 39.59
2022-01-26 14:16:25.736 | DEBUG    | __main__:trials:26 - Trial = 482/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.737 | DEBUG    | __main__:trials:29 - Trial = 482/30000 | Total reward = 16.87
2022-01-26 14:16:25.740 | DEBUG    | __main__:trials:24 - Trial = 483/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.742 | DEBUG    | __main__:trials:29 - Trial = 483/30000 | Total reward = 43.12
2022-01-26 14:16:25.744 | DEBUG    | __main__:trials:26 - Trial = 484/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.746 | DEBUG    | __main__:trials:29 - Trial = 484/30000 | Total reward = 20.14
2022-01-26 14:16:25.749 | DEBUG    | __main__:trials:24 - Trial = 485/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.750 | DEBUG    | __main__:trials:29 - Trial = 485/30000 | Total reward = 19.83
2022-01-26 14:16:25.754 | DEBUG    | __main__:trials:24 - Trial = 486/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.756 | DEBUG    | __main__:trials:29 - Trial = 486/30000 | Total reward = 35.83
2022-01-26 14:16:25.758 | DEBUG    | __main__:trials:24 - Trial = 487/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.760 | DEBUG    | __main__:trials:29 - Trial = 487/30000 | Total reward = 39.59
2022-01-26 14:16:25.764 | DEBUG    | __main__:trials:24 - Trial = 488/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.765 | DEBUG    | __main__:trials:29 - Trial = 488/30000 | Total reward = 31.90
2022-01-26 14:16:25.769 | DEBUG    | __main__:trials:24 - Trial = 489/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.770 | DEBUG    | __main__:trials:29 - Trial = 489/30000 | Total reward = 43.04
2022-01-26 14:16:25.773 | DEBUG    | __main__:trials:26 - Trial = 490/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.774 | DEBUG    | __main__:trials:29 - Trial = 490/30000 | Total reward = 17.22
2022-01-26 14:16:25.777 | DEBUG    | __main__:trials:24 - Trial = 491/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.779 | DEBUG    | __main__:trials:29 - Trial = 491/30000 | Total reward = 13.53
2022-01-26 14:16:25.782 | DEBUG    | __main__:trials:24 - Trial = 492/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.783 | DEBUG    | __main__:trials:29 - Trial = 492/30000 | Total reward = 32.47
2022-01-26 14:16:25.785 | DEBUG    | __main__:trials:26 - Trial = 493/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.785 | DEBUG    | __main__:trials:29 - Trial = 493/30000 | Total reward = 10.31
2022-01-26 14:16:25.789 | DEBUG    | __main__:trials:24 - Trial = 494/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.789 | DEBUG    | __main__:trials:29 - Trial = 494/30000 | Total reward = 41.35
2022-01-26 14:16:25.793 | DEBUG    | __main__:trials:24 - Trial = 495/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.795 | DEBUG    | __main__:trials:29 - Trial = 495/30000 | Total reward = 34.13
2022-01-26 14:16:25.798 | DEBUG    | __main__:trials:24 - Trial = 496/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.800 | DEBUG    | __main__:trials:29 - Trial = 496/30000 | Total reward = 34.97
2022-01-26 14:16:25.803 | DEBUG    | __main__:trials:24 - Trial = 497/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.805 | DEBUG    | __main__:trials:29 - Trial = 497/30000 | Total reward = 31.00
2022-01-26 14:16:25.808 | DEBUG    | __main__:trials:24 - Trial = 498/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.810 | DEBUG    | __main__:trials:29 - Trial = 498/30000 | Total reward = 20.75
2022-01-26 14:16:25.813 | DEBUG    | __main__:trials:24 - Trial = 499/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.814 | DEBUG    | __main__:trials:29 - Trial = 499/30000 | Total reward = 27.90
2022-01-26 14:16:25.818 | DEBUG    | __main__:trials:24 - Trial = 500/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.819 | DEBUG    | __main__:trials:29 - Trial = 500/30000 | Total reward = 35.38
2022-01-26 14:16:25.822 | DEBUG    | __main__:trials:24 - Trial = 501/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.823 | DEBUG    | __main__:trials:29 - Trial = 501/30000 | Total reward = 28.01
2022-01-26 14:16:25.827 | DEBUG    | __main__:trials:24 - Trial = 502/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.828 | DEBUG    | __main__:trials:29 - Trial = 502/30000 | Total reward = 32.27
2022-01-26 14:16:25.830 | DEBUG    | __main__:trials:26 - Trial = 503/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.832 | DEBUG    | __main__:trials:29 - Trial = 503/30000 | Total reward = 8.12
2022-01-26 14:16:25.836 | DEBUG    | __main__:trials:24 - Trial = 504/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.836 | DEBUG    | __main__:trials:29 - Trial = 504/30000 | Total reward = 38.16
2022-01-26 14:16:25.840 | DEBUG    | __main__:trials:24 - Trial = 505/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.841 | DEBUG    | __main__:trials:29 - Trial = 505/30000 | Total reward = 37.25
2022-01-26 14:16:25.844 | DEBUG    | __main__:trials:24 - Trial = 506/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.845 | DEBUG    | __main__:trials:29 - Trial = 506/30000 | Total reward = 43.66
2022-01-26 14:16:25.847 | DEBUG    | __main__:trials:26 - Trial = 507/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.848 | DEBUG    | __main__:trials:29 - Trial = 507/30000 | Total reward = 10.83
2022-01-26 14:16:25.852 | DEBUG    | __main__:trials:24 - Trial = 508/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.852 | DEBUG    | __main__:trials:29 - Trial = 508/30000 | Total reward = 30.76
2022-01-26 14:16:25.855 | DEBUG    | __main__:trials:24 - Trial = 509/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.857 | DEBUG    | __main__:trials:29 - Trial = 509/30000 | Total reward = 28.05
2022-01-26 14:16:25.860 | DEBUG    | __main__:trials:24 - Trial = 510/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.861 | DEBUG    | __main__:trials:29 - Trial = 510/30000 | Total reward = 31.60
2022-01-26 14:16:25.866 | DEBUG    | __main__:trials:24 - Trial = 511/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.866 | DEBUG    | __main__:trials:29 - Trial = 511/30000 | Total reward = 40.38
2022-01-26 14:16:25.870 | DEBUG    | __main__:trials:24 - Trial = 512/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.872 | DEBUG    | __main__:trials:29 - Trial = 512/30000 | Total reward = 50.44
2022-01-26 14:16:25.875 | DEBUG    | __main__:trials:24 - Trial = 513/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.876 | DEBUG    | __main__:trials:29 - Trial = 513/30000 | Total reward = 38.45
2022-01-26 14:16:25.880 | DEBUG    | __main__:trials:24 - Trial = 514/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.881 | DEBUG    | __main__:trials:29 - Trial = 514/30000 | Total reward = 37.62
2022-01-26 14:16:25.885 | DEBUG    | __main__:trials:24 - Trial = 515/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.887 | DEBUG    | __main__:trials:29 - Trial = 515/30000 | Total reward = 26.54
2022-01-26 14:16:25.890 | DEBUG    | __main__:trials:24 - Trial = 516/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.890 | DEBUG    | __main__:trials:29 - Trial = 516/30000 | Total reward = 41.45
2022-01-26 14:16:25.895 | DEBUG    | __main__:trials:24 - Trial = 517/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.896 | DEBUG    | __main__:trials:29 - Trial = 517/30000 | Total reward = 38.63
2022-01-26 14:16:25.900 | DEBUG    | __main__:trials:24 - Trial = 518/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.902 | DEBUG    | __main__:trials:29 - Trial = 518/30000 | Total reward = 30.96
2022-01-26 14:16:25.905 | DEBUG    | __main__:trials:24 - Trial = 519/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.905 | DEBUG    | __main__:trials:29 - Trial = 519/30000 | Total reward = 30.73
2022-01-26 14:16:25.909 | DEBUG    | __main__:trials:24 - Trial = 520/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.910 | DEBUG    | __main__:trials:29 - Trial = 520/30000 | Total reward = 25.58
2022-01-26 14:16:25.913 | DEBUG    | __main__:trials:26 - Trial = 521/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.914 | DEBUG    | __main__:trials:29 - Trial = 521/30000 | Total reward = 20.79
2022-01-26 14:16:25.918 | DEBUG    | __main__:trials:24 - Trial = 522/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.919 | DEBUG    | __main__:trials:29 - Trial = 522/30000 | Total reward = 30.17
2022-01-26 14:16:25.922 | DEBUG    | __main__:trials:24 - Trial = 523/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.923 | DEBUG    | __main__:trials:29 - Trial = 523/30000 | Total reward = 31.61
2022-01-26 14:16:25.927 | DEBUG    | __main__:trials:24 - Trial = 524/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.928 | DEBUG    | __main__:trials:29 - Trial = 524/30000 | Total reward = 47.73
2022-01-26 14:16:25.932 | DEBUG    | __main__:trials:24 - Trial = 525/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.933 | DEBUG    | __main__:trials:29 - Trial = 525/30000 | Total reward = 34.11
2022-01-26 14:16:25.936 | DEBUG    | __main__:trials:24 - Trial = 526/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.938 | DEBUG    | __main__:trials:29 - Trial = 526/30000 | Total reward = 27.16
2022-01-26 14:16:25.941 | DEBUG    | __main__:trials:24 - Trial = 527/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.942 | DEBUG    | __main__:trials:29 - Trial = 527/30000 | Total reward = 51.26
2022-01-26 14:16:25.945 | DEBUG    | __main__:trials:24 - Trial = 528/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.946 | DEBUG    | __main__:trials:29 - Trial = 528/30000 | Total reward = 17.09
2022-01-26 14:16:25.949 | DEBUG    | __main__:trials:24 - Trial = 529/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.951 | DEBUG    | __main__:trials:29 - Trial = 529/30000 | Total reward = 31.54
2022-01-26 14:16:25.954 | DEBUG    | __main__:trials:24 - Trial = 530/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.956 | DEBUG    | __main__:trials:29 - Trial = 530/30000 | Total reward = 38.70
2022-01-26 14:16:25.959 | DEBUG    | __main__:trials:24 - Trial = 531/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.959 | DEBUG    | __main__:trials:29 - Trial = 531/30000 | Total reward = 24.58
2022-01-26 14:16:25.963 | DEBUG    | __main__:trials:24 - Trial = 532/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.965 | DEBUG    | __main__:trials:29 - Trial = 532/30000 | Total reward = 20.64
2022-01-26 14:16:25.967 | DEBUG    | __main__:trials:26 - Trial = 533/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:25.969 | DEBUG    | __main__:trials:29 - Trial = 533/30000 | Total reward = 19.63
2022-01-26 14:16:25.972 | DEBUG    | __main__:trials:24 - Trial = 534/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.974 | DEBUG    | __main__:trials:29 - Trial = 534/30000 | Total reward = 50.11
2022-01-26 14:16:25.977 | DEBUG    | __main__:trials:24 - Trial = 535/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.977 | DEBUG    | __main__:trials:29 - Trial = 535/30000 | Total reward = 29.29
2022-01-26 14:16:25.981 | DEBUG    | __main__:trials:24 - Trial = 536/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.982 | DEBUG    | __main__:trials:29 - Trial = 536/30000 | Total reward = 30.61
2022-01-26 14:16:25.985 | DEBUG    | __main__:trials:24 - Trial = 537/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.987 | DEBUG    | __main__:trials:29 - Trial = 537/30000 | Total reward = 38.71
2022-01-26 14:16:25.989 | DEBUG    | __main__:trials:24 - Trial = 538/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.991 | DEBUG    | __main__:trials:29 - Trial = 538/30000 | Total reward = 42.43
2022-01-26 14:16:25.994 | DEBUG    | __main__:trials:24 - Trial = 539/30000 | Max number of steps (20) reached
2022-01-26 14:16:25.995 | DEBUG    | __main__:trials:29 - Trial = 539/30000 | Total reward = 37.67
2022-01-26 14:16:25.999 | DEBUG    | __main__:trials:24 - Trial = 540/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.000 | DEBUG    | __main__:trials:29 - Trial = 540/30000 | Total reward = 26.90
2022-01-26 14:16:26.003 | DEBUG    | __main__:trials:24 - Trial = 541/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.005 | DEBUG    | __main__:trials:29 - Trial = 541/30000 | Total reward = 25.88
2022-01-26 14:16:26.008 | DEBUG    | __main__:trials:24 - Trial = 542/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.009 | DEBUG    | __main__:trials:29 - Trial = 542/30000 | Total reward = 43.31
2022-01-26 14:16:26.013 | DEBUG    | __main__:trials:24 - Trial = 543/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.013 | DEBUG    | __main__:trials:29 - Trial = 543/30000 | Total reward = 42.61
2022-01-26 14:16:26.017 | DEBUG    | __main__:trials:24 - Trial = 544/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.018 | DEBUG    | __main__:trials:29 - Trial = 544/30000 | Total reward = 40.72
2022-01-26 14:16:26.022 | DEBUG    | __main__:trials:24 - Trial = 545/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.023 | DEBUG    | __main__:trials:29 - Trial = 545/30000 | Total reward = 45.72
2022-01-26 14:16:26.026 | DEBUG    | __main__:trials:24 - Trial = 546/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.029 | DEBUG    | __main__:trials:29 - Trial = 546/30000 | Total reward = 38.92
2022-01-26 14:16:26.032 | DEBUG    | __main__:trials:24 - Trial = 547/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.033 | DEBUG    | __main__:trials:29 - Trial = 547/30000 | Total reward = 35.88
2022-01-26 14:16:26.037 | DEBUG    | __main__:trials:24 - Trial = 548/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.038 | DEBUG    | __main__:trials:29 - Trial = 548/30000 | Total reward = 56.23
2022-01-26 14:16:26.042 | DEBUG    | __main__:trials:24 - Trial = 549/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.043 | DEBUG    | __main__:trials:29 - Trial = 549/30000 | Total reward = 38.53
2022-01-26 14:16:26.046 | DEBUG    | __main__:trials:24 - Trial = 550/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.048 | DEBUG    | __main__:trials:29 - Trial = 550/30000 | Total reward = 40.25
2022-01-26 14:16:26.051 | DEBUG    | __main__:trials:24 - Trial = 551/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.053 | DEBUG    | __main__:trials:29 - Trial = 551/30000 | Total reward = 37.09
2022-01-26 14:16:26.056 | DEBUG    | __main__:trials:24 - Trial = 552/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.057 | DEBUG    | __main__:trials:29 - Trial = 552/30000 | Total reward = 41.40
2022-01-26 14:16:26.061 | DEBUG    | __main__:trials:24 - Trial = 553/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.062 | DEBUG    | __main__:trials:29 - Trial = 553/30000 | Total reward = 38.44
2022-01-26 14:16:26.065 | DEBUG    | __main__:trials:24 - Trial = 554/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.066 | DEBUG    | __main__:trials:29 - Trial = 554/30000 | Total reward = 37.76
2022-01-26 14:16:26.069 | DEBUG    | __main__:trials:24 - Trial = 555/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.070 | DEBUG    | __main__:trials:29 - Trial = 555/30000 | Total reward = 23.21
2022-01-26 14:16:26.073 | DEBUG    | __main__:trials:24 - Trial = 556/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.074 | DEBUG    | __main__:trials:29 - Trial = 556/30000 | Total reward = 33.07
2022-01-26 14:16:26.078 | DEBUG    | __main__:trials:24 - Trial = 557/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.080 | DEBUG    | __main__:trials:29 - Trial = 557/30000 | Total reward = 45.52
2022-01-26 14:16:26.084 | DEBUG    | __main__:trials:24 - Trial = 558/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.084 | DEBUG    | __main__:trials:29 - Trial = 558/30000 | Total reward = 60.29
2022-01-26 14:16:26.088 | DEBUG    | __main__:trials:24 - Trial = 559/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.090 | DEBUG    | __main__:trials:29 - Trial = 559/30000 | Total reward = 39.97
2022-01-26 14:16:26.093 | DEBUG    | __main__:trials:24 - Trial = 560/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.095 | DEBUG    | __main__:trials:29 - Trial = 560/30000 | Total reward = 52.40
2022-01-26 14:16:26.098 | DEBUG    | __main__:trials:24 - Trial = 561/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.099 | DEBUG    | __main__:trials:29 - Trial = 561/30000 | Total reward = 30.22
2022-01-26 14:16:26.102 | DEBUG    | __main__:trials:24 - Trial = 562/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.104 | DEBUG    | __main__:trials:29 - Trial = 562/30000 | Total reward = 43.18
2022-01-26 14:16:26.106 | DEBUG    | __main__:trials:24 - Trial = 563/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.108 | DEBUG    | __main__:trials:29 - Trial = 563/30000 | Total reward = 36.00
2022-01-26 14:16:26.111 | DEBUG    | __main__:trials:24 - Trial = 564/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.112 | DEBUG    | __main__:trials:29 - Trial = 564/30000 | Total reward = 28.22
2022-01-26 14:16:26.116 | DEBUG    | __main__:trials:26 - Trial = 565/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.116 | DEBUG    | __main__:trials:29 - Trial = 565/30000 | Total reward = 16.01
2022-01-26 14:16:26.120 | DEBUG    | __main__:trials:24 - Trial = 566/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.121 | DEBUG    | __main__:trials:29 - Trial = 566/30000 | Total reward = 18.47
2022-01-26 14:16:26.124 | DEBUG    | __main__:trials:24 - Trial = 567/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.125 | DEBUG    | __main__:trials:29 - Trial = 567/30000 | Total reward = 45.99
2022-01-26 14:16:26.129 | DEBUG    | __main__:trials:24 - Trial = 568/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.130 | DEBUG    | __main__:trials:29 - Trial = 568/30000 | Total reward = 40.81
2022-01-26 14:16:26.134 | DEBUG    | __main__:trials:24 - Trial = 569/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.135 | DEBUG    | __main__:trials:29 - Trial = 569/30000 | Total reward = 30.69
2022-01-26 14:16:26.138 | DEBUG    | __main__:trials:24 - Trial = 570/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.139 | DEBUG    | __main__:trials:29 - Trial = 570/30000 | Total reward = 44.41
2022-01-26 14:16:26.143 | DEBUG    | __main__:trials:24 - Trial = 571/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.144 | DEBUG    | __main__:trials:29 - Trial = 571/30000 | Total reward = 44.56
2022-01-26 14:16:26.148 | DEBUG    | __main__:trials:24 - Trial = 572/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.148 | DEBUG    | __main__:trials:29 - Trial = 572/30000 | Total reward = 42.38
2022-01-26 14:16:26.152 | DEBUG    | __main__:trials:24 - Trial = 573/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.153 | DEBUG    | __main__:trials:29 - Trial = 573/30000 | Total reward = 42.95
2022-01-26 14:16:26.156 | DEBUG    | __main__:trials:24 - Trial = 574/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.157 | DEBUG    | __main__:trials:29 - Trial = 574/30000 | Total reward = 30.69
2022-01-26 14:16:26.160 | DEBUG    | __main__:trials:24 - Trial = 575/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.162 | DEBUG    | __main__:trials:29 - Trial = 575/30000 | Total reward = 51.22
2022-01-26 14:16:26.166 | DEBUG    | __main__:trials:24 - Trial = 576/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.167 | DEBUG    | __main__:trials:29 - Trial = 576/30000 | Total reward = 56.83
2022-01-26 14:16:26.170 | DEBUG    | __main__:trials:24 - Trial = 577/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.172 | DEBUG    | __main__:trials:29 - Trial = 577/30000 | Total reward = 36.79
2022-01-26 14:16:26.175 | DEBUG    | __main__:trials:24 - Trial = 578/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.176 | DEBUG    | __main__:trials:29 - Trial = 578/30000 | Total reward = 35.20
2022-01-26 14:16:26.179 | DEBUG    | __main__:trials:24 - Trial = 579/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.181 | DEBUG    | __main__:trials:29 - Trial = 579/30000 | Total reward = 38.36
2022-01-26 14:16:26.184 | DEBUG    | __main__:trials:24 - Trial = 580/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.186 | DEBUG    | __main__:trials:29 - Trial = 580/30000 | Total reward = 37.10
2022-01-26 14:16:26.189 | DEBUG    | __main__:trials:24 - Trial = 581/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.190 | DEBUG    | __main__:trials:29 - Trial = 581/30000 | Total reward = 27.46
2022-01-26 14:16:26.194 | DEBUG    | __main__:trials:24 - Trial = 582/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.196 | DEBUG    | __main__:trials:29 - Trial = 582/30000 | Total reward = 45.09
2022-01-26 14:16:26.199 | DEBUG    | __main__:trials:24 - Trial = 583/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.200 | DEBUG    | __main__:trials:29 - Trial = 583/30000 | Total reward = 44.17
2022-01-26 14:16:26.203 | DEBUG    | __main__:trials:26 - Trial = 584/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.203 | DEBUG    | __main__:trials:29 - Trial = 584/30000 | Total reward = 14.60
2022-01-26 14:16:26.208 | DEBUG    | __main__:trials:24 - Trial = 585/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.209 | DEBUG    | __main__:trials:29 - Trial = 585/30000 | Total reward = 30.69
2022-01-26 14:16:26.212 | DEBUG    | __main__:trials:24 - Trial = 586/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.213 | DEBUG    | __main__:trials:29 - Trial = 586/30000 | Total reward = 45.36
2022-01-26 14:16:26.216 | DEBUG    | __main__:trials:24 - Trial = 587/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.217 | DEBUG    | __main__:trials:29 - Trial = 587/30000 | Total reward = 52.24
2022-01-26 14:16:26.220 | DEBUG    | __main__:trials:24 - Trial = 588/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.221 | DEBUG    | __main__:trials:29 - Trial = 588/30000 | Total reward = 21.27
2022-01-26 14:16:26.224 | DEBUG    | __main__:trials:24 - Trial = 589/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.226 | DEBUG    | __main__:trials:29 - Trial = 589/30000 | Total reward = 28.40
2022-01-26 14:16:26.229 | DEBUG    | __main__:trials:24 - Trial = 590/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.230 | DEBUG    | __main__:trials:29 - Trial = 590/30000 | Total reward = 35.05
2022-01-26 14:16:26.233 | DEBUG    | __main__:trials:24 - Trial = 591/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.235 | DEBUG    | __main__:trials:29 - Trial = 591/30000 | Total reward = 56.14
2022-01-26 14:16:26.238 | DEBUG    | __main__:trials:24 - Trial = 592/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.240 | DEBUG    | __main__:trials:29 - Trial = 592/30000 | Total reward = 56.95
2022-01-26 14:16:26.243 | DEBUG    | __main__:trials:24 - Trial = 593/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.244 | DEBUG    | __main__:trials:29 - Trial = 593/30000 | Total reward = 57.17
2022-01-26 14:16:26.248 | DEBUG    | __main__:trials:24 - Trial = 594/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.248 | DEBUG    | __main__:trials:29 - Trial = 594/30000 | Total reward = 31.48
2022-01-26 14:16:26.252 | DEBUG    | __main__:trials:24 - Trial = 595/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.254 | DEBUG    | __main__:trials:29 - Trial = 595/30000 | Total reward = 29.12
2022-01-26 14:16:26.257 | DEBUG    | __main__:trials:24 - Trial = 596/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.258 | DEBUG    | __main__:trials:29 - Trial = 596/30000 | Total reward = 41.52
2022-01-26 14:16:26.262 | DEBUG    | __main__:trials:24 - Trial = 597/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.262 | DEBUG    | __main__:trials:29 - Trial = 597/30000 | Total reward = 38.12
2022-01-26 14:16:26.265 | DEBUG    | __main__:trials:26 - Trial = 598/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.266 | DEBUG    | __main__:trials:29 - Trial = 598/30000 | Total reward = 34.31
2022-01-26 14:16:26.269 | DEBUG    | __main__:trials:26 - Trial = 599/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.271 | DEBUG    | __main__:trials:29 - Trial = 599/30000 | Total reward = 17.71
2022-01-26 14:16:26.275 | DEBUG    | __main__:trials:24 - Trial = 600/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.276 | DEBUG    | __main__:trials:29 - Trial = 600/30000 | Total reward = 37.99
2022-01-26 14:16:26.279 | DEBUG    | __main__:trials:24 - Trial = 601/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.281 | DEBUG    | __main__:trials:29 - Trial = 601/30000 | Total reward = 36.80
2022-01-26 14:16:26.284 | DEBUG    | __main__:trials:24 - Trial = 602/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.285 | DEBUG    | __main__:trials:29 - Trial = 602/30000 | Total reward = 45.48
2022-01-26 14:16:26.288 | DEBUG    | __main__:trials:24 - Trial = 603/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.289 | DEBUG    | __main__:trials:29 - Trial = 603/30000 | Total reward = 15.88
2022-01-26 14:16:26.292 | DEBUG    | __main__:trials:24 - Trial = 604/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.294 | DEBUG    | __main__:trials:29 - Trial = 604/30000 | Total reward = 36.27
2022-01-26 14:16:26.297 | DEBUG    | __main__:trials:24 - Trial = 605/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.298 | DEBUG    | __main__:trials:29 - Trial = 605/30000 | Total reward = 45.86
2022-01-26 14:16:26.301 | DEBUG    | __main__:trials:24 - Trial = 606/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.303 | DEBUG    | __main__:trials:29 - Trial = 606/30000 | Total reward = 49.27
2022-01-26 14:16:26.306 | DEBUG    | __main__:trials:24 - Trial = 607/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.308 | DEBUG    | __main__:trials:29 - Trial = 607/30000 | Total reward = 44.13
2022-01-26 14:16:26.311 | DEBUG    | __main__:trials:24 - Trial = 608/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.312 | DEBUG    | __main__:trials:29 - Trial = 608/30000 | Total reward = 60.54
2022-01-26 14:16:26.316 | DEBUG    | __main__:trials:24 - Trial = 609/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.318 | DEBUG    | __main__:trials:29 - Trial = 609/30000 | Total reward = 46.10
2022-01-26 14:16:26.320 | DEBUG    | __main__:trials:26 - Trial = 610/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.322 | DEBUG    | __main__:trials:29 - Trial = 610/30000 | Total reward = 14.63
2022-01-26 14:16:26.325 | DEBUG    | __main__:trials:24 - Trial = 611/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.327 | DEBUG    | __main__:trials:29 - Trial = 611/30000 | Total reward = 35.98
2022-01-26 14:16:26.330 | DEBUG    | __main__:trials:24 - Trial = 612/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.332 | DEBUG    | __main__:trials:29 - Trial = 612/30000 | Total reward = 44.67
2022-01-26 14:16:26.336 | DEBUG    | __main__:trials:24 - Trial = 613/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.337 | DEBUG    | __main__:trials:29 - Trial = 613/30000 | Total reward = 38.24
2022-01-26 14:16:26.341 | DEBUG    | __main__:trials:24 - Trial = 614/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.343 | DEBUG    | __main__:trials:29 - Trial = 614/30000 | Total reward = 57.61
2022-01-26 14:16:26.346 | DEBUG    | __main__:trials:24 - Trial = 615/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.348 | DEBUG    | __main__:trials:29 - Trial = 615/30000 | Total reward = 37.54
2022-01-26 14:16:26.352 | DEBUG    | __main__:trials:24 - Trial = 616/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.353 | DEBUG    | __main__:trials:29 - Trial = 616/30000 | Total reward = 44.76
2022-01-26 14:16:26.357 | DEBUG    | __main__:trials:24 - Trial = 617/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.359 | DEBUG    | __main__:trials:29 - Trial = 617/30000 | Total reward = 47.02
2022-01-26 14:16:26.362 | DEBUG    | __main__:trials:24 - Trial = 618/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.364 | DEBUG    | __main__:trials:29 - Trial = 618/30000 | Total reward = 54.25
2022-01-26 14:16:26.368 | DEBUG    | __main__:trials:24 - Trial = 619/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.369 | DEBUG    | __main__:trials:29 - Trial = 619/30000 | Total reward = 59.22
2022-01-26 14:16:26.373 | DEBUG    | __main__:trials:24 - Trial = 620/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.374 | DEBUG    | __main__:trials:29 - Trial = 620/30000 | Total reward = 23.79
2022-01-26 14:16:26.378 | DEBUG    | __main__:trials:24 - Trial = 621/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.380 | DEBUG    | __main__:trials:29 - Trial = 621/30000 | Total reward = 53.77
2022-01-26 14:16:26.383 | DEBUG    | __main__:trials:24 - Trial = 622/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.385 | DEBUG    | __main__:trials:29 - Trial = 622/30000 | Total reward = 44.54
2022-01-26 14:16:26.389 | DEBUG    | __main__:trials:24 - Trial = 623/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.391 | DEBUG    | __main__:trials:29 - Trial = 623/30000 | Total reward = 44.76
2022-01-26 14:16:26.394 | DEBUG    | __main__:trials:24 - Trial = 624/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.396 | DEBUG    | __main__:trials:29 - Trial = 624/30000 | Total reward = 42.29
2022-01-26 14:16:26.399 | DEBUG    | __main__:trials:24 - Trial = 625/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.401 | DEBUG    | __main__:trials:29 - Trial = 625/30000 | Total reward = 59.04
2022-01-26 14:16:26.405 | DEBUG    | __main__:trials:24 - Trial = 626/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.405 | DEBUG    | __main__:trials:29 - Trial = 626/30000 | Total reward = 44.40
2022-01-26 14:16:26.410 | DEBUG    | __main__:trials:24 - Trial = 627/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.411 | DEBUG    | __main__:trials:29 - Trial = 627/30000 | Total reward = 45.21
2022-01-26 14:16:26.414 | DEBUG    | __main__:trials:24 - Trial = 628/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.417 | DEBUG    | __main__:trials:29 - Trial = 628/30000 | Total reward = 36.90
2022-01-26 14:16:26.421 | DEBUG    | __main__:trials:24 - Trial = 629/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.421 | DEBUG    | __main__:trials:29 - Trial = 629/30000 | Total reward = 39.79
2022-01-26 14:16:26.425 | DEBUG    | __main__:trials:26 - Trial = 630/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.427 | DEBUG    | __main__:trials:29 - Trial = 630/30000 | Total reward = 15.40
2022-01-26 14:16:26.431 | DEBUG    | __main__:trials:24 - Trial = 631/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.432 | DEBUG    | __main__:trials:29 - Trial = 631/30000 | Total reward = 45.90
2022-01-26 14:16:26.435 | DEBUG    | __main__:trials:24 - Trial = 632/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.437 | DEBUG    | __main__:trials:29 - Trial = 632/30000 | Total reward = 38.87
2022-01-26 14:16:26.441 | DEBUG    | __main__:trials:24 - Trial = 633/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.442 | DEBUG    | __main__:trials:29 - Trial = 633/30000 | Total reward = 39.03
2022-01-26 14:16:26.446 | DEBUG    | __main__:trials:24 - Trial = 634/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.448 | DEBUG    | __main__:trials:29 - Trial = 634/30000 | Total reward = 46.42
2022-01-26 14:16:26.451 | DEBUG    | __main__:trials:26 - Trial = 635/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.453 | DEBUG    | __main__:trials:29 - Trial = 635/30000 | Total reward = 30.91
2022-01-26 14:16:26.456 | DEBUG    | __main__:trials:24 - Trial = 636/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.458 | DEBUG    | __main__:trials:29 - Trial = 636/30000 | Total reward = 18.23
2022-01-26 14:16:26.462 | DEBUG    | __main__:trials:24 - Trial = 637/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.463 | DEBUG    | __main__:trials:29 - Trial = 637/30000 | Total reward = 46.20
2022-01-26 14:16:26.467 | DEBUG    | __main__:trials:24 - Trial = 638/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.469 | DEBUG    | __main__:trials:29 - Trial = 638/30000 | Total reward = 37.66
2022-01-26 14:16:26.472 | DEBUG    | __main__:trials:24 - Trial = 639/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.474 | DEBUG    | __main__:trials:29 - Trial = 639/30000 | Total reward = 61.53
2022-01-26 14:16:26.478 | DEBUG    | __main__:trials:24 - Trial = 640/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.479 | DEBUG    | __main__:trials:29 - Trial = 640/30000 | Total reward = 35.60
2022-01-26 14:16:26.483 | DEBUG    | __main__:trials:24 - Trial = 641/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.484 | DEBUG    | __main__:trials:29 - Trial = 641/30000 | Total reward = 34.71
2022-01-26 14:16:26.488 | DEBUG    | __main__:trials:24 - Trial = 642/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.489 | DEBUG    | __main__:trials:29 - Trial = 642/30000 | Total reward = 45.75
2022-01-26 14:16:26.493 | DEBUG    | __main__:trials:24 - Trial = 643/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.495 | DEBUG    | __main__:trials:29 - Trial = 643/30000 | Total reward = 44.24
2022-01-26 14:16:26.498 | DEBUG    | __main__:trials:24 - Trial = 644/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.500 | DEBUG    | __main__:trials:29 - Trial = 644/30000 | Total reward = 43.80
2022-01-26 14:16:26.504 | DEBUG    | __main__:trials:24 - Trial = 645/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.505 | DEBUG    | __main__:trials:29 - Trial = 645/30000 | Total reward = 44.78
2022-01-26 14:16:26.509 | DEBUG    | __main__:trials:24 - Trial = 646/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.510 | DEBUG    | __main__:trials:29 - Trial = 646/30000 | Total reward = 42.43
2022-01-26 14:16:26.514 | DEBUG    | __main__:trials:24 - Trial = 647/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.516 | DEBUG    | __main__:trials:29 - Trial = 647/30000 | Total reward = 45.25
2022-01-26 14:16:26.520 | DEBUG    | __main__:trials:24 - Trial = 648/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.521 | DEBUG    | __main__:trials:29 - Trial = 648/30000 | Total reward = 44.19
2022-01-26 14:16:26.524 | DEBUG    | __main__:trials:26 - Trial = 649/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.526 | DEBUG    | __main__:trials:29 - Trial = 649/30000 | Total reward = 30.63
2022-01-26 14:16:26.530 | DEBUG    | __main__:trials:24 - Trial = 650/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.531 | DEBUG    | __main__:trials:29 - Trial = 650/30000 | Total reward = 44.24
2022-01-26 14:16:26.535 | DEBUG    | __main__:trials:24 - Trial = 651/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.537 | DEBUG    | __main__:trials:29 - Trial = 651/30000 | Total reward = 41.47
2022-01-26 14:16:26.540 | DEBUG    | __main__:trials:24 - Trial = 652/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.541 | DEBUG    | __main__:trials:29 - Trial = 652/30000 | Total reward = 42.42
2022-01-26 14:16:26.545 | DEBUG    | __main__:trials:24 - Trial = 653/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.545 | DEBUG    | __main__:trials:29 - Trial = 653/30000 | Total reward = 42.14
2022-01-26 14:16:26.550 | DEBUG    | __main__:trials:24 - Trial = 654/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.551 | DEBUG    | __main__:trials:29 - Trial = 654/30000 | Total reward = 53.84
2022-01-26 14:16:26.555 | DEBUG    | __main__:trials:24 - Trial = 655/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.556 | DEBUG    | __main__:trials:29 - Trial = 655/30000 | Total reward = 48.03
2022-01-26 14:16:26.560 | DEBUG    | __main__:trials:24 - Trial = 656/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.562 | DEBUG    | __main__:trials:29 - Trial = 656/30000 | Total reward = 52.79
2022-01-26 14:16:26.565 | DEBUG    | __main__:trials:24 - Trial = 657/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.567 | DEBUG    | __main__:trials:29 - Trial = 657/30000 | Total reward = 45.31
2022-01-26 14:16:26.571 | DEBUG    | __main__:trials:24 - Trial = 658/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.572 | DEBUG    | __main__:trials:29 - Trial = 658/30000 | Total reward = 39.24
2022-01-26 14:16:26.575 | DEBUG    | __main__:trials:24 - Trial = 659/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.577 | DEBUG    | __main__:trials:29 - Trial = 659/30000 | Total reward = 41.87
2022-01-26 14:16:26.581 | DEBUG    | __main__:trials:24 - Trial = 660/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.583 | DEBUG    | __main__:trials:29 - Trial = 660/30000 | Total reward = 42.03
2022-01-26 14:16:26.587 | DEBUG    | __main__:trials:24 - Trial = 661/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.588 | DEBUG    | __main__:trials:29 - Trial = 661/30000 | Total reward = 43.02
2022-01-26 14:16:26.591 | DEBUG    | __main__:trials:24 - Trial = 662/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.593 | DEBUG    | __main__:trials:29 - Trial = 662/30000 | Total reward = 31.73
2022-01-26 14:16:26.597 | DEBUG    | __main__:trials:24 - Trial = 663/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.598 | DEBUG    | __main__:trials:29 - Trial = 663/30000 | Total reward = 44.61
2022-01-26 14:16:26.602 | DEBUG    | __main__:trials:24 - Trial = 664/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.603 | DEBUG    | __main__:trials:29 - Trial = 664/30000 | Total reward = 42.64
2022-01-26 14:16:26.607 | DEBUG    | __main__:trials:24 - Trial = 665/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.609 | DEBUG    | __main__:trials:29 - Trial = 665/30000 | Total reward = 44.24
2022-01-26 14:16:26.612 | DEBUG    | __main__:trials:26 - Trial = 666/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.613 | DEBUG    | __main__:trials:29 - Trial = 666/30000 | Total reward = 32.22
2022-01-26 14:16:26.616 | DEBUG    | __main__:trials:24 - Trial = 667/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.618 | DEBUG    | __main__:trials:29 - Trial = 667/30000 | Total reward = 32.52
2022-01-26 14:16:26.622 | DEBUG    | __main__:trials:24 - Trial = 668/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.623 | DEBUG    | __main__:trials:29 - Trial = 668/30000 | Total reward = 48.20
2022-01-26 14:16:26.627 | DEBUG    | __main__:trials:24 - Trial = 669/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.628 | DEBUG    | __main__:trials:29 - Trial = 669/30000 | Total reward = 44.61
2022-01-26 14:16:26.631 | DEBUG    | __main__:trials:24 - Trial = 670/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.633 | DEBUG    | __main__:trials:29 - Trial = 670/30000 | Total reward = 44.11
2022-01-26 14:16:26.637 | DEBUG    | __main__:trials:24 - Trial = 671/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.639 | DEBUG    | __main__:trials:29 - Trial = 671/30000 | Total reward = 40.12
2022-01-26 14:16:26.642 | DEBUG    | __main__:trials:24 - Trial = 672/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.644 | DEBUG    | __main__:trials:29 - Trial = 672/30000 | Total reward = 40.73
2022-01-26 14:16:26.647 | DEBUG    | __main__:trials:24 - Trial = 673/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.649 | DEBUG    | __main__:trials:29 - Trial = 673/30000 | Total reward = 43.69
2022-01-26 14:16:26.652 | DEBUG    | __main__:trials:24 - Trial = 674/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.654 | DEBUG    | __main__:trials:29 - Trial = 674/30000 | Total reward = 41.73
2022-01-26 14:16:26.658 | DEBUG    | __main__:trials:24 - Trial = 675/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.659 | DEBUG    | __main__:trials:29 - Trial = 675/30000 | Total reward = 45.18
2022-01-26 14:16:26.663 | DEBUG    | __main__:trials:24 - Trial = 676/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.664 | DEBUG    | __main__:trials:29 - Trial = 676/30000 | Total reward = 45.09
2022-01-26 14:16:26.668 | DEBUG    | __main__:trials:24 - Trial = 677/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.670 | DEBUG    | __main__:trials:29 - Trial = 677/30000 | Total reward = 42.42
2022-01-26 14:16:26.673 | DEBUG    | __main__:trials:24 - Trial = 678/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.675 | DEBUG    | __main__:trials:29 - Trial = 678/30000 | Total reward = 47.28
2022-01-26 14:16:26.678 | DEBUG    | __main__:trials:24 - Trial = 679/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.680 | DEBUG    | __main__:trials:29 - Trial = 679/30000 | Total reward = 32.76
2022-01-26 14:16:26.683 | DEBUG    | __main__:trials:24 - Trial = 680/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.685 | DEBUG    | __main__:trials:29 - Trial = 680/30000 | Total reward = 43.31
2022-01-26 14:16:26.688 | DEBUG    | __main__:trials:24 - Trial = 681/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.690 | DEBUG    | __main__:trials:29 - Trial = 681/30000 | Total reward = 62.16
2022-01-26 14:16:26.694 | DEBUG    | __main__:trials:24 - Trial = 682/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.695 | DEBUG    | __main__:trials:29 - Trial = 682/30000 | Total reward = 42.34
2022-01-26 14:16:26.699 | DEBUG    | __main__:trials:24 - Trial = 683/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.700 | DEBUG    | __main__:trials:29 - Trial = 683/30000 | Total reward = 43.63
2022-01-26 14:16:26.704 | DEBUG    | __main__:trials:24 - Trial = 684/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.706 | DEBUG    | __main__:trials:29 - Trial = 684/30000 | Total reward = 37.00
2022-01-26 14:16:26.710 | DEBUG    | __main__:trials:24 - Trial = 685/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.711 | DEBUG    | __main__:trials:29 - Trial = 685/30000 | Total reward = 33.10
2022-01-26 14:16:26.715 | DEBUG    | __main__:trials:24 - Trial = 686/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.717 | DEBUG    | __main__:trials:29 - Trial = 686/30000 | Total reward = 35.63
2022-01-26 14:16:26.720 | DEBUG    | __main__:trials:26 - Trial = 687/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.721 | DEBUG    | __main__:trials:29 - Trial = 687/30000 | Total reward = 20.34
2022-01-26 14:16:26.725 | DEBUG    | __main__:trials:24 - Trial = 688/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.727 | DEBUG    | __main__:trials:29 - Trial = 688/30000 | Total reward = 40.03
2022-01-26 14:16:26.731 | DEBUG    | __main__:trials:24 - Trial = 689/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.732 | DEBUG    | __main__:trials:29 - Trial = 689/30000 | Total reward = 30.93
2022-01-26 14:16:26.735 | DEBUG    | __main__:trials:24 - Trial = 690/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.737 | DEBUG    | __main__:trials:29 - Trial = 690/30000 | Total reward = 41.09
2022-01-26 14:16:26.740 | DEBUG    | __main__:trials:24 - Trial = 691/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.742 | DEBUG    | __main__:trials:29 - Trial = 691/30000 | Total reward = 33.67
2022-01-26 14:16:26.745 | DEBUG    | __main__:trials:26 - Trial = 692/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:26.747 | DEBUG    | __main__:trials:29 - Trial = 692/30000 | Total reward = 14.48
2022-01-26 14:16:26.750 | DEBUG    | __main__:trials:24 - Trial = 693/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.752 | DEBUG    | __main__:trials:29 - Trial = 693/30000 | Total reward = 40.58
2022-01-26 14:16:26.756 | DEBUG    | __main__:trials:24 - Trial = 694/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.757 | DEBUG    | __main__:trials:29 - Trial = 694/30000 | Total reward = 47.88
2022-01-26 14:16:26.761 | DEBUG    | __main__:trials:24 - Trial = 695/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.763 | DEBUG    | __main__:trials:29 - Trial = 695/30000 | Total reward = 44.10
2022-01-26 14:16:26.766 | DEBUG    | __main__:trials:24 - Trial = 696/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.767 | DEBUG    | __main__:trials:29 - Trial = 696/30000 | Total reward = 44.18
2022-01-26 14:16:26.771 | DEBUG    | __main__:trials:24 - Trial = 697/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.773 | DEBUG    | __main__:trials:29 - Trial = 697/30000 | Total reward = 57.03
2022-01-26 14:16:26.776 | DEBUG    | __main__:trials:24 - Trial = 698/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.777 | DEBUG    | __main__:trials:29 - Trial = 698/30000 | Total reward = 43.53
2022-01-26 14:16:26.781 | DEBUG    | __main__:trials:24 - Trial = 699/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.783 | DEBUG    | __main__:trials:29 - Trial = 699/30000 | Total reward = 32.45
2022-01-26 14:16:26.786 | DEBUG    | __main__:trials:24 - Trial = 700/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.788 | DEBUG    | __main__:trials:29 - Trial = 700/30000 | Total reward = 42.84
2022-01-26 14:16:26.792 | DEBUG    | __main__:trials:24 - Trial = 701/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.792 | DEBUG    | __main__:trials:29 - Trial = 701/30000 | Total reward = 29.03
2022-01-26 14:16:26.796 | DEBUG    | __main__:trials:24 - Trial = 702/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.797 | DEBUG    | __main__:trials:29 - Trial = 702/30000 | Total reward = 24.78
2022-01-26 14:16:26.800 | DEBUG    | __main__:trials:24 - Trial = 703/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.802 | DEBUG    | __main__:trials:29 - Trial = 703/30000 | Total reward = 64.72
2022-01-26 14:16:26.806 | DEBUG    | __main__:trials:24 - Trial = 704/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.807 | DEBUG    | __main__:trials:29 - Trial = 704/30000 | Total reward = 53.31
2022-01-26 14:16:26.811 | DEBUG    | __main__:trials:24 - Trial = 705/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.813 | DEBUG    | __main__:trials:29 - Trial = 705/30000 | Total reward = 47.05
2022-01-26 14:16:26.816 | DEBUG    | __main__:trials:24 - Trial = 706/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.818 | DEBUG    | __main__:trials:29 - Trial = 706/30000 | Total reward = 20.65
2022-01-26 14:16:26.822 | DEBUG    | __main__:trials:24 - Trial = 707/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.823 | DEBUG    | __main__:trials:29 - Trial = 707/30000 | Total reward = 35.94
2022-01-26 14:16:26.827 | DEBUG    | __main__:trials:24 - Trial = 708/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.829 | DEBUG    | __main__:trials:29 - Trial = 708/30000 | Total reward = 46.99
2022-01-26 14:16:26.832 | DEBUG    | __main__:trials:24 - Trial = 709/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.834 | DEBUG    | __main__:trials:29 - Trial = 709/30000 | Total reward = 35.72
2022-01-26 14:16:26.839 | DEBUG    | __main__:trials:24 - Trial = 710/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.840 | DEBUG    | __main__:trials:29 - Trial = 710/30000 | Total reward = 51.55
2022-01-26 14:16:26.844 | DEBUG    | __main__:trials:24 - Trial = 711/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.845 | DEBUG    | __main__:trials:29 - Trial = 711/30000 | Total reward = 44.30
2022-01-26 14:16:26.849 | DEBUG    | __main__:trials:24 - Trial = 712/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.850 | DEBUG    | __main__:trials:29 - Trial = 712/30000 | Total reward = 43.81
2022-01-26 14:16:26.854 | DEBUG    | __main__:trials:24 - Trial = 713/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.856 | DEBUG    | __main__:trials:29 - Trial = 713/30000 | Total reward = 38.22
2022-01-26 14:16:26.858 | DEBUG    | __main__:trials:24 - Trial = 714/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.860 | DEBUG    | __main__:trials:29 - Trial = 714/30000 | Total reward = 42.76
2022-01-26 14:16:26.864 | DEBUG    | __main__:trials:24 - Trial = 715/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.866 | DEBUG    | __main__:trials:29 - Trial = 715/30000 | Total reward = 44.17
2022-01-26 14:16:26.869 | DEBUG    | __main__:trials:24 - Trial = 716/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.871 | DEBUG    | __main__:trials:29 - Trial = 716/30000 | Total reward = 43.14
2022-01-26 14:16:26.874 | DEBUG    | __main__:trials:24 - Trial = 717/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.876 | DEBUG    | __main__:trials:29 - Trial = 717/30000 | Total reward = 37.44
2022-01-26 14:16:26.880 | DEBUG    | __main__:trials:24 - Trial = 718/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.881 | DEBUG    | __main__:trials:29 - Trial = 718/30000 | Total reward = 44.34
2022-01-26 14:16:26.885 | DEBUG    | __main__:trials:24 - Trial = 719/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.887 | DEBUG    | __main__:trials:29 - Trial = 719/30000 | Total reward = 46.90
2022-01-26 14:16:26.891 | DEBUG    | __main__:trials:24 - Trial = 720/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.891 | DEBUG    | __main__:trials:29 - Trial = 720/30000 | Total reward = 54.92
2022-01-26 14:16:26.896 | DEBUG    | __main__:trials:24 - Trial = 721/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.897 | DEBUG    | __main__:trials:29 - Trial = 721/30000 | Total reward = 44.51
2022-01-26 14:16:26.900 | DEBUG    | __main__:trials:24 - Trial = 722/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.902 | DEBUG    | __main__:trials:29 - Trial = 722/30000 | Total reward = 44.52
2022-01-26 14:16:26.906 | DEBUG    | __main__:trials:24 - Trial = 723/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.907 | DEBUG    | __main__:trials:29 - Trial = 723/30000 | Total reward = 43.62
2022-01-26 14:16:26.911 | DEBUG    | __main__:trials:24 - Trial = 724/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.912 | DEBUG    | __main__:trials:29 - Trial = 724/30000 | Total reward = 47.31
2022-01-26 14:16:26.915 | DEBUG    | __main__:trials:24 - Trial = 725/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.917 | DEBUG    | __main__:trials:29 - Trial = 725/30000 | Total reward = 46.53
2022-01-26 14:16:26.920 | DEBUG    | __main__:trials:24 - Trial = 726/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.922 | DEBUG    | __main__:trials:29 - Trial = 726/30000 | Total reward = 39.84
2022-01-26 14:16:26.926 | DEBUG    | __main__:trials:24 - Trial = 727/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.927 | DEBUG    | __main__:trials:29 - Trial = 727/30000 | Total reward = 53.64
2022-01-26 14:16:26.931 | DEBUG    | __main__:trials:24 - Trial = 728/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.932 | DEBUG    | __main__:trials:29 - Trial = 728/30000 | Total reward = 41.57
2022-01-26 14:16:26.936 | DEBUG    | __main__:trials:24 - Trial = 729/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.937 | DEBUG    | __main__:trials:29 - Trial = 729/30000 | Total reward = 44.98
2022-01-26 14:16:26.940 | DEBUG    | __main__:trials:24 - Trial = 730/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.942 | DEBUG    | __main__:trials:29 - Trial = 730/30000 | Total reward = 41.41
2022-01-26 14:16:26.946 | DEBUG    | __main__:trials:24 - Trial = 731/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.947 | DEBUG    | __main__:trials:29 - Trial = 731/30000 | Total reward = 42.20
2022-01-26 14:16:26.951 | DEBUG    | __main__:trials:24 - Trial = 732/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.952 | DEBUG    | __main__:trials:29 - Trial = 732/30000 | Total reward = 44.20
2022-01-26 14:16:26.956 | DEBUG    | __main__:trials:24 - Trial = 733/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.957 | DEBUG    | __main__:trials:29 - Trial = 733/30000 | Total reward = 56.30
2022-01-26 14:16:26.961 | DEBUG    | __main__:trials:24 - Trial = 734/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.962 | DEBUG    | __main__:trials:29 - Trial = 734/30000 | Total reward = 42.62
2022-01-26 14:16:26.966 | DEBUG    | __main__:trials:24 - Trial = 735/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.968 | DEBUG    | __main__:trials:29 - Trial = 735/30000 | Total reward = 46.90
2022-01-26 14:16:26.971 | DEBUG    | __main__:trials:24 - Trial = 736/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.973 | DEBUG    | __main__:trials:29 - Trial = 736/30000 | Total reward = 41.24
2022-01-26 14:16:26.976 | DEBUG    | __main__:trials:24 - Trial = 737/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.978 | DEBUG    | __main__:trials:29 - Trial = 737/30000 | Total reward = 40.34
2022-01-26 14:16:26.982 | DEBUG    | __main__:trials:24 - Trial = 738/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.984 | DEBUG    | __main__:trials:29 - Trial = 738/30000 | Total reward = 45.33
2022-01-26 14:16:26.987 | DEBUG    | __main__:trials:24 - Trial = 739/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.989 | DEBUG    | __main__:trials:29 - Trial = 739/30000 | Total reward = 45.32
2022-01-26 14:16:26.992 | DEBUG    | __main__:trials:24 - Trial = 740/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.994 | DEBUG    | __main__:trials:29 - Trial = 740/30000 | Total reward = 53.28
2022-01-26 14:16:26.998 | DEBUG    | __main__:trials:24 - Trial = 741/30000 | Max number of steps (20) reached
2022-01-26 14:16:26.999 | DEBUG    | __main__:trials:29 - Trial = 741/30000 | Total reward = 48.49
2022-01-26 14:16:27.003 | DEBUG    | __main__:trials:24 - Trial = 742/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.005 | DEBUG    | __main__:trials:29 - Trial = 742/30000 | Total reward = 49.53
2022-01-26 14:16:27.008 | DEBUG    | __main__:trials:24 - Trial = 743/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.010 | DEBUG    | __main__:trials:29 - Trial = 743/30000 | Total reward = 53.89
2022-01-26 14:16:27.014 | DEBUG    | __main__:trials:24 - Trial = 744/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.014 | DEBUG    | __main__:trials:29 - Trial = 744/30000 | Total reward = 45.41
2022-01-26 14:16:27.018 | DEBUG    | __main__:trials:24 - Trial = 745/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.020 | DEBUG    | __main__:trials:29 - Trial = 745/30000 | Total reward = 31.97
2022-01-26 14:16:27.023 | DEBUG    | __main__:trials:24 - Trial = 746/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.025 | DEBUG    | __main__:trials:29 - Trial = 746/30000 | Total reward = 27.21
2022-01-26 14:16:27.029 | DEBUG    | __main__:trials:24 - Trial = 747/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.031 | DEBUG    | __main__:trials:29 - Trial = 747/30000 | Total reward = 46.84
2022-01-26 14:16:27.034 | DEBUG    | __main__:trials:24 - Trial = 748/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.036 | DEBUG    | __main__:trials:29 - Trial = 748/30000 | Total reward = 41.39
2022-01-26 14:16:27.040 | DEBUG    | __main__:trials:24 - Trial = 749/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.041 | DEBUG    | __main__:trials:29 - Trial = 749/30000 | Total reward = 29.73
2022-01-26 14:16:27.044 | DEBUG    | __main__:trials:26 - Trial = 750/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.045 | DEBUG    | __main__:trials:29 - Trial = 750/30000 | Total reward = 34.94
2022-01-26 14:16:27.049 | DEBUG    | __main__:trials:24 - Trial = 751/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.050 | DEBUG    | __main__:trials:29 - Trial = 751/30000 | Total reward = 35.58
2022-01-26 14:16:27.054 | DEBUG    | __main__:trials:24 - Trial = 752/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.056 | DEBUG    | __main__:trials:29 - Trial = 752/30000 | Total reward = 43.96
2022-01-26 14:16:27.059 | DEBUG    | __main__:trials:24 - Trial = 753/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.060 | DEBUG    | __main__:trials:29 - Trial = 753/30000 | Total reward = 46.71
2022-01-26 14:16:27.064 | DEBUG    | __main__:trials:24 - Trial = 754/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.066 | DEBUG    | __main__:trials:29 - Trial = 754/30000 | Total reward = 42.65
2022-01-26 14:16:27.069 | DEBUG    | __main__:trials:24 - Trial = 755/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.071 | DEBUG    | __main__:trials:29 - Trial = 755/30000 | Total reward = 46.14
2022-01-26 14:16:27.074 | DEBUG    | __main__:trials:24 - Trial = 756/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.076 | DEBUG    | __main__:trials:29 - Trial = 756/30000 | Total reward = 40.66
2022-01-26 14:16:27.080 | DEBUG    | __main__:trials:24 - Trial = 757/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.081 | DEBUG    | __main__:trials:29 - Trial = 757/30000 | Total reward = 46.78
2022-01-26 14:16:27.085 | DEBUG    | __main__:trials:24 - Trial = 758/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.087 | DEBUG    | __main__:trials:29 - Trial = 758/30000 | Total reward = 46.86
2022-01-26 14:16:27.091 | DEBUG    | __main__:trials:24 - Trial = 759/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.092 | DEBUG    | __main__:trials:29 - Trial = 759/30000 | Total reward = 38.22
2022-01-26 14:16:27.096 | DEBUG    | __main__:trials:24 - Trial = 760/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.097 | DEBUG    | __main__:trials:29 - Trial = 760/30000 | Total reward = 45.82
2022-01-26 14:16:27.101 | DEBUG    | __main__:trials:24 - Trial = 761/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.103 | DEBUG    | __main__:trials:29 - Trial = 761/30000 | Total reward = 39.14
2022-01-26 14:16:27.106 | DEBUG    | __main__:trials:24 - Trial = 762/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.108 | DEBUG    | __main__:trials:29 - Trial = 762/30000 | Total reward = 45.71
2022-01-26 14:16:27.111 | DEBUG    | __main__:trials:24 - Trial = 763/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.113 | DEBUG    | __main__:trials:29 - Trial = 763/30000 | Total reward = 38.87
2022-01-26 14:16:27.117 | DEBUG    | __main__:trials:24 - Trial = 764/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.118 | DEBUG    | __main__:trials:29 - Trial = 764/30000 | Total reward = 38.56
2022-01-26 14:16:27.122 | DEBUG    | __main__:trials:24 - Trial = 765/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.123 | DEBUG    | __main__:trials:29 - Trial = 765/30000 | Total reward = 47.04
2022-01-26 14:16:27.127 | DEBUG    | __main__:trials:24 - Trial = 766/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.129 | DEBUG    | __main__:trials:29 - Trial = 766/30000 | Total reward = 56.14
2022-01-26 14:16:27.132 | DEBUG    | __main__:trials:24 - Trial = 767/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.134 | DEBUG    | __main__:trials:29 - Trial = 767/30000 | Total reward = 59.42
2022-01-26 14:16:27.137 | DEBUG    | __main__:trials:24 - Trial = 768/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.139 | DEBUG    | __main__:trials:29 - Trial = 768/30000 | Total reward = 43.61
2022-01-26 14:16:27.143 | DEBUG    | __main__:trials:24 - Trial = 769/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.144 | DEBUG    | __main__:trials:29 - Trial = 769/30000 | Total reward = 47.39
2022-01-26 14:16:27.148 | DEBUG    | __main__:trials:24 - Trial = 770/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.150 | DEBUG    | __main__:trials:29 - Trial = 770/30000 | Total reward = 43.33
2022-01-26 14:16:27.153 | DEBUG    | __main__:trials:24 - Trial = 771/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.154 | DEBUG    | __main__:trials:29 - Trial = 771/30000 | Total reward = 46.62
2022-01-26 14:16:27.158 | DEBUG    | __main__:trials:24 - Trial = 772/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.159 | DEBUG    | __main__:trials:29 - Trial = 772/30000 | Total reward = 45.71
2022-01-26 14:16:27.162 | DEBUG    | __main__:trials:24 - Trial = 773/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.163 | DEBUG    | __main__:trials:29 - Trial = 773/30000 | Total reward = 44.29
2022-01-26 14:16:27.167 | DEBUG    | __main__:trials:24 - Trial = 774/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.169 | DEBUG    | __main__:trials:29 - Trial = 774/30000 | Total reward = 46.61
2022-01-26 14:16:27.172 | DEBUG    | __main__:trials:24 - Trial = 775/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.173 | DEBUG    | __main__:trials:29 - Trial = 775/30000 | Total reward = 10.52
2022-01-26 14:16:27.176 | DEBUG    | __main__:trials:24 - Trial = 776/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.178 | DEBUG    | __main__:trials:29 - Trial = 776/30000 | Total reward = 47.21
2022-01-26 14:16:27.181 | DEBUG    | __main__:trials:24 - Trial = 777/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.182 | DEBUG    | __main__:trials:29 - Trial = 777/30000 | Total reward = 41.08
2022-01-26 14:16:27.185 | DEBUG    | __main__:trials:24 - Trial = 778/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.186 | DEBUG    | __main__:trials:29 - Trial = 778/30000 | Total reward = 46.40
2022-01-26 14:16:27.189 | DEBUG    | __main__:trials:24 - Trial = 779/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.191 | DEBUG    | __main__:trials:29 - Trial = 779/30000 | Total reward = 46.28
2022-01-26 14:16:27.194 | DEBUG    | __main__:trials:24 - Trial = 780/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.196 | DEBUG    | __main__:trials:29 - Trial = 780/30000 | Total reward = 48.19
2022-01-26 14:16:27.198 | DEBUG    | __main__:trials:24 - Trial = 781/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.200 | DEBUG    | __main__:trials:29 - Trial = 781/30000 | Total reward = 43.74
2022-01-26 14:16:27.204 | DEBUG    | __main__:trials:24 - Trial = 782/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.205 | DEBUG    | __main__:trials:29 - Trial = 782/30000 | Total reward = 39.68
2022-01-26 14:16:27.208 | DEBUG    | __main__:trials:24 - Trial = 783/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.210 | DEBUG    | __main__:trials:29 - Trial = 783/30000 | Total reward = 46.48
2022-01-26 14:16:27.213 | DEBUG    | __main__:trials:24 - Trial = 784/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.215 | DEBUG    | __main__:trials:29 - Trial = 784/30000 | Total reward = 35.04
2022-01-26 14:16:27.219 | DEBUG    | __main__:trials:24 - Trial = 785/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.220 | DEBUG    | __main__:trials:29 - Trial = 785/30000 | Total reward = 43.52
2022-01-26 14:16:27.224 | DEBUG    | __main__:trials:24 - Trial = 786/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.224 | DEBUG    | __main__:trials:29 - Trial = 786/30000 | Total reward = 46.40
2022-01-26 14:16:27.228 | DEBUG    | __main__:trials:24 - Trial = 787/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.229 | DEBUG    | __main__:trials:29 - Trial = 787/30000 | Total reward = 42.03
2022-01-26 14:16:27.233 | DEBUG    | __main__:trials:24 - Trial = 788/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.234 | DEBUG    | __main__:trials:29 - Trial = 788/30000 | Total reward = 47.85
2022-01-26 14:16:27.238 | DEBUG    | __main__:trials:24 - Trial = 789/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.238 | DEBUG    | __main__:trials:29 - Trial = 789/30000 | Total reward = 41.55
2022-01-26 14:16:27.242 | DEBUG    | __main__:trials:24 - Trial = 790/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.244 | DEBUG    | __main__:trials:29 - Trial = 790/30000 | Total reward = 34.11
2022-01-26 14:16:27.247 | DEBUG    | __main__:trials:24 - Trial = 791/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.249 | DEBUG    | __main__:trials:29 - Trial = 791/30000 | Total reward = 39.46
2022-01-26 14:16:27.252 | DEBUG    | __main__:trials:24 - Trial = 792/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.254 | DEBUG    | __main__:trials:29 - Trial = 792/30000 | Total reward = 46.53
2022-01-26 14:16:27.257 | DEBUG    | __main__:trials:24 - Trial = 793/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.259 | DEBUG    | __main__:trials:29 - Trial = 793/30000 | Total reward = 41.71
2022-01-26 14:16:27.264 | DEBUG    | __main__:trials:24 - Trial = 794/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.265 | DEBUG    | __main__:trials:29 - Trial = 794/30000 | Total reward = 37.92
2022-01-26 14:16:27.269 | DEBUG    | __main__:trials:24 - Trial = 795/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.271 | DEBUG    | __main__:trials:29 - Trial = 795/30000 | Total reward = 44.04
2022-01-26 14:16:27.275 | DEBUG    | __main__:trials:24 - Trial = 796/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.276 | DEBUG    | __main__:trials:29 - Trial = 796/30000 | Total reward = 47.04
2022-01-26 14:16:27.280 | DEBUG    | __main__:trials:24 - Trial = 797/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.282 | DEBUG    | __main__:trials:29 - Trial = 797/30000 | Total reward = 50.35
2022-01-26 14:16:27.286 | DEBUG    | __main__:trials:24 - Trial = 798/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.287 | DEBUG    | __main__:trials:29 - Trial = 798/30000 | Total reward = 43.40
2022-01-26 14:16:27.291 | DEBUG    | __main__:trials:24 - Trial = 799/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.292 | DEBUG    | __main__:trials:29 - Trial = 799/30000 | Total reward = 29.75
2022-01-26 14:16:27.295 | DEBUG    | __main__:trials:24 - Trial = 800/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.297 | DEBUG    | __main__:trials:29 - Trial = 800/30000 | Total reward = 41.75
2022-01-26 14:16:27.301 | DEBUG    | __main__:trials:24 - Trial = 801/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.302 | DEBUG    | __main__:trials:29 - Trial = 801/30000 | Total reward = 44.65
2022-01-26 14:16:27.306 | DEBUG    | __main__:trials:24 - Trial = 802/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.308 | DEBUG    | __main__:trials:29 - Trial = 802/30000 | Total reward = 42.36
2022-01-26 14:16:27.311 | DEBUG    | __main__:trials:24 - Trial = 803/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.313 | DEBUG    | __main__:trials:29 - Trial = 803/30000 | Total reward = 45.78
2022-01-26 14:16:27.316 | DEBUG    | __main__:trials:24 - Trial = 804/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.318 | DEBUG    | __main__:trials:29 - Trial = 804/30000 | Total reward = 43.42
2022-01-26 14:16:27.321 | DEBUG    | __main__:trials:24 - Trial = 805/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.321 | DEBUG    | __main__:trials:29 - Trial = 805/30000 | Total reward = 47.69
2022-01-26 14:16:27.326 | DEBUG    | __main__:trials:24 - Trial = 806/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.326 | DEBUG    | __main__:trials:29 - Trial = 806/30000 | Total reward = 48.22
2022-01-26 14:16:27.331 | DEBUG    | __main__:trials:24 - Trial = 807/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.332 | DEBUG    | __main__:trials:29 - Trial = 807/30000 | Total reward = 59.81
2022-01-26 14:16:27.335 | DEBUG    | __main__:trials:24 - Trial = 808/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.337 | DEBUG    | __main__:trials:29 - Trial = 808/30000 | Total reward = 46.40
2022-01-26 14:16:27.340 | DEBUG    | __main__:trials:24 - Trial = 809/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.342 | DEBUG    | __main__:trials:29 - Trial = 809/30000 | Total reward = 46.09
2022-01-26 14:16:27.346 | DEBUG    | __main__:trials:24 - Trial = 810/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.347 | DEBUG    | __main__:trials:29 - Trial = 810/30000 | Total reward = 41.38
2022-01-26 14:16:27.351 | DEBUG    | __main__:trials:24 - Trial = 811/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.353 | DEBUG    | __main__:trials:29 - Trial = 811/30000 | Total reward = 44.49
2022-01-26 14:16:27.357 | DEBUG    | __main__:trials:24 - Trial = 812/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.358 | DEBUG    | __main__:trials:29 - Trial = 812/30000 | Total reward = 47.12
2022-01-26 14:16:27.362 | DEBUG    | __main__:trials:24 - Trial = 813/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.363 | DEBUG    | __main__:trials:29 - Trial = 813/30000 | Total reward = 48.56
2022-01-26 14:16:27.366 | DEBUG    | __main__:trials:24 - Trial = 814/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.367 | DEBUG    | __main__:trials:29 - Trial = 814/30000 | Total reward = 46.78
2022-01-26 14:16:27.371 | DEBUG    | __main__:trials:26 - Trial = 815/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.372 | DEBUG    | __main__:trials:29 - Trial = 815/30000 | Total reward = 30.10
2022-01-26 14:16:27.375 | DEBUG    | __main__:trials:26 - Trial = 816/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.377 | DEBUG    | __main__:trials:29 - Trial = 816/30000 | Total reward = 17.17
2022-01-26 14:16:27.380 | DEBUG    | __main__:trials:24 - Trial = 817/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.382 | DEBUG    | __main__:trials:29 - Trial = 817/30000 | Total reward = 37.71
2022-01-26 14:16:27.385 | DEBUG    | __main__:trials:24 - Trial = 818/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.387 | DEBUG    | __main__:trials:29 - Trial = 818/30000 | Total reward = 44.92
2022-01-26 14:16:27.391 | DEBUG    | __main__:trials:24 - Trial = 819/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.392 | DEBUG    | __main__:trials:29 - Trial = 819/30000 | Total reward = 46.27
2022-01-26 14:16:27.396 | DEBUG    | __main__:trials:24 - Trial = 820/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.398 | DEBUG    | __main__:trials:29 - Trial = 820/30000 | Total reward = 38.61
2022-01-26 14:16:27.401 | DEBUG    | __main__:trials:24 - Trial = 821/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.402 | DEBUG    | __main__:trials:29 - Trial = 821/30000 | Total reward = 50.69
2022-01-26 14:16:27.406 | DEBUG    | __main__:trials:24 - Trial = 822/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.408 | DEBUG    | __main__:trials:29 - Trial = 822/30000 | Total reward = 47.04
2022-01-26 14:16:27.411 | DEBUG    | __main__:trials:24 - Trial = 823/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.413 | DEBUG    | __main__:trials:29 - Trial = 823/30000 | Total reward = 45.94
2022-01-26 14:16:27.416 | DEBUG    | __main__:trials:24 - Trial = 824/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.418 | DEBUG    | __main__:trials:29 - Trial = 824/30000 | Total reward = 46.03
2022-01-26 14:16:27.422 | DEBUG    | __main__:trials:24 - Trial = 825/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.424 | DEBUG    | __main__:trials:29 - Trial = 825/30000 | Total reward = 47.04
2022-01-26 14:16:27.428 | DEBUG    | __main__:trials:24 - Trial = 826/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.429 | DEBUG    | __main__:trials:29 - Trial = 826/30000 | Total reward = 43.97
2022-01-26 14:16:27.433 | DEBUG    | __main__:trials:24 - Trial = 827/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.434 | DEBUG    | __main__:trials:29 - Trial = 827/30000 | Total reward = 52.32
2022-01-26 14:16:27.438 | DEBUG    | __main__:trials:24 - Trial = 828/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.439 | DEBUG    | __main__:trials:29 - Trial = 828/30000 | Total reward = 44.64
2022-01-26 14:16:27.443 | DEBUG    | __main__:trials:24 - Trial = 829/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.445 | DEBUG    | __main__:trials:29 - Trial = 829/30000 | Total reward = 45.99
2022-01-26 14:16:27.447 | DEBUG    | __main__:trials:24 - Trial = 830/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.449 | DEBUG    | __main__:trials:29 - Trial = 830/30000 | Total reward = 40.21
2022-01-26 14:16:27.453 | DEBUG    | __main__:trials:24 - Trial = 831/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.455 | DEBUG    | __main__:trials:29 - Trial = 831/30000 | Total reward = 47.84
2022-01-26 14:16:27.531 | DEBUG    | __main__:trials:24 - Trial = 832/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.532 | DEBUG    | __main__:trials:29 - Trial = 832/30000 | Total reward = 42.93
2022-01-26 14:16:27.537 | DEBUG    | __main__:trials:24 - Trial = 833/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.539 | DEBUG    | __main__:trials:29 - Trial = 833/30000 | Total reward = 42.01
2022-01-26 14:16:27.542 | DEBUG    | __main__:trials:24 - Trial = 834/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.544 | DEBUG    | __main__:trials:29 - Trial = 834/30000 | Total reward = 58.25
2022-01-26 14:16:27.548 | DEBUG    | __main__:trials:24 - Trial = 835/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.549 | DEBUG    | __main__:trials:29 - Trial = 835/30000 | Total reward = 36.94
2022-01-26 14:16:27.553 | DEBUG    | __main__:trials:24 - Trial = 836/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.555 | DEBUG    | __main__:trials:29 - Trial = 836/30000 | Total reward = 42.87
2022-01-26 14:16:27.558 | DEBUG    | __main__:trials:24 - Trial = 837/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.560 | DEBUG    | __main__:trials:29 - Trial = 837/30000 | Total reward = 55.42
2022-01-26 14:16:27.563 | DEBUG    | __main__:trials:24 - Trial = 838/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.565 | DEBUG    | __main__:trials:29 - Trial = 838/30000 | Total reward = 46.71
2022-01-26 14:16:27.568 | DEBUG    | __main__:trials:24 - Trial = 839/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.570 | DEBUG    | __main__:trials:29 - Trial = 839/30000 | Total reward = 46.53
2022-01-26 14:16:27.574 | DEBUG    | __main__:trials:24 - Trial = 840/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.575 | DEBUG    | __main__:trials:29 - Trial = 840/30000 | Total reward = 47.64
2022-01-26 14:16:27.578 | DEBUG    | __main__:trials:24 - Trial = 841/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.580 | DEBUG    | __main__:trials:29 - Trial = 841/30000 | Total reward = 52.58
2022-01-26 14:16:27.584 | DEBUG    | __main__:trials:24 - Trial = 842/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.585 | DEBUG    | __main__:trials:29 - Trial = 842/30000 | Total reward = 39.45
2022-01-26 14:16:27.589 | DEBUG    | __main__:trials:24 - Trial = 843/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.591 | DEBUG    | __main__:trials:29 - Trial = 843/30000 | Total reward = 34.72
2022-01-26 14:16:27.595 | DEBUG    | __main__:trials:24 - Trial = 844/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.598 | DEBUG    | __main__:trials:29 - Trial = 844/30000 | Total reward = 44.50
2022-01-26 14:16:27.601 | DEBUG    | __main__:trials:24 - Trial = 845/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.603 | DEBUG    | __main__:trials:29 - Trial = 845/30000 | Total reward = 41.50
2022-01-26 14:16:27.606 | DEBUG    | __main__:trials:24 - Trial = 846/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.608 | DEBUG    | __main__:trials:29 - Trial = 846/30000 | Total reward = 38.17
2022-01-26 14:16:27.611 | DEBUG    | __main__:trials:24 - Trial = 847/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.613 | DEBUG    | __main__:trials:29 - Trial = 847/30000 | Total reward = 58.15
2022-01-26 14:16:27.617 | DEBUG    | __main__:trials:24 - Trial = 848/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.618 | DEBUG    | __main__:trials:29 - Trial = 848/30000 | Total reward = 46.39
2022-01-26 14:16:27.622 | DEBUG    | __main__:trials:24 - Trial = 849/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.624 | DEBUG    | __main__:trials:29 - Trial = 849/30000 | Total reward = 50.76
2022-01-26 14:16:27.627 | DEBUG    | __main__:trials:24 - Trial = 850/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.629 | DEBUG    | __main__:trials:29 - Trial = 850/30000 | Total reward = 44.54
2022-01-26 14:16:27.633 | DEBUG    | __main__:trials:24 - Trial = 851/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.633 | DEBUG    | __main__:trials:29 - Trial = 851/30000 | Total reward = 39.45
2022-01-26 14:16:27.637 | DEBUG    | __main__:trials:24 - Trial = 852/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.639 | DEBUG    | __main__:trials:29 - Trial = 852/30000 | Total reward = 47.20
2022-01-26 14:16:27.642 | DEBUG    | __main__:trials:24 - Trial = 853/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.644 | DEBUG    | __main__:trials:29 - Trial = 853/30000 | Total reward = 46.03
2022-01-26 14:16:27.647 | DEBUG    | __main__:trials:24 - Trial = 854/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.649 | DEBUG    | __main__:trials:29 - Trial = 854/30000 | Total reward = 45.14
2022-01-26 14:16:27.653 | DEBUG    | __main__:trials:24 - Trial = 855/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.654 | DEBUG    | __main__:trials:29 - Trial = 855/30000 | Total reward = 46.27
2022-01-26 14:16:27.657 | DEBUG    | __main__:trials:24 - Trial = 856/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.659 | DEBUG    | __main__:trials:29 - Trial = 856/30000 | Total reward = 44.85
2022-01-26 14:16:27.662 | DEBUG    | __main__:trials:24 - Trial = 857/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.664 | DEBUG    | __main__:trials:29 - Trial = 857/30000 | Total reward = 47.04
2022-01-26 14:16:27.668 | DEBUG    | __main__:trials:24 - Trial = 858/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.670 | DEBUG    | __main__:trials:29 - Trial = 858/30000 | Total reward = 45.97
2022-01-26 14:16:27.673 | DEBUG    | __main__:trials:24 - Trial = 859/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.675 | DEBUG    | __main__:trials:29 - Trial = 859/30000 | Total reward = 53.79
2022-01-26 14:16:27.679 | DEBUG    | __main__:trials:24 - Trial = 860/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.680 | DEBUG    | __main__:trials:29 - Trial = 860/30000 | Total reward = 53.79
2022-01-26 14:16:27.684 | DEBUG    | __main__:trials:24 - Trial = 861/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.685 | DEBUG    | __main__:trials:29 - Trial = 861/30000 | Total reward = 43.68
2022-01-26 14:16:27.688 | DEBUG    | __main__:trials:24 - Trial = 862/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.690 | DEBUG    | __main__:trials:29 - Trial = 862/30000 | Total reward = 33.61
2022-01-26 14:16:27.694 | DEBUG    | __main__:trials:24 - Trial = 863/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.695 | DEBUG    | __main__:trials:29 - Trial = 863/30000 | Total reward = 49.91
2022-01-26 14:16:27.698 | DEBUG    | __main__:trials:24 - Trial = 864/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.700 | DEBUG    | __main__:trials:29 - Trial = 864/30000 | Total reward = 44.20
2022-01-26 14:16:27.703 | DEBUG    | __main__:trials:24 - Trial = 865/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.705 | DEBUG    | __main__:trials:29 - Trial = 865/30000 | Total reward = 40.25
2022-01-26 14:16:27.708 | DEBUG    | __main__:trials:24 - Trial = 866/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.709 | DEBUG    | __main__:trials:29 - Trial = 866/30000 | Total reward = 47.04
2022-01-26 14:16:27.713 | DEBUG    | __main__:trials:24 - Trial = 867/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.715 | DEBUG    | __main__:trials:29 - Trial = 867/30000 | Total reward = 54.02
2022-01-26 14:16:27.718 | DEBUG    | __main__:trials:26 - Trial = 868/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.720 | DEBUG    | __main__:trials:29 - Trial = 868/30000 | Total reward = 28.94
2022-01-26 14:16:27.724 | DEBUG    | __main__:trials:24 - Trial = 869/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.725 | DEBUG    | __main__:trials:29 - Trial = 869/30000 | Total reward = 47.22
2022-01-26 14:16:27.729 | DEBUG    | __main__:trials:24 - Trial = 870/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.730 | DEBUG    | __main__:trials:29 - Trial = 870/30000 | Total reward = 50.44
2022-01-26 14:16:27.733 | DEBUG    | __main__:trials:26 - Trial = 871/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.734 | DEBUG    | __main__:trials:29 - Trial = 871/30000 | Total reward = 26.34
2022-01-26 14:16:27.737 | DEBUG    | __main__:trials:26 - Trial = 872/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.738 | DEBUG    | __main__:trials:29 - Trial = 872/30000 | Total reward = 20.91
2022-01-26 14:16:27.742 | DEBUG    | __main__:trials:24 - Trial = 873/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.744 | DEBUG    | __main__:trials:29 - Trial = 873/30000 | Total reward = 44.80
2022-01-26 14:16:27.748 | DEBUG    | __main__:trials:24 - Trial = 874/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.749 | DEBUG    | __main__:trials:29 - Trial = 874/30000 | Total reward = 42.68
2022-01-26 14:16:27.753 | DEBUG    | __main__:trials:24 - Trial = 875/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.755 | DEBUG    | __main__:trials:29 - Trial = 875/30000 | Total reward = 42.23
2022-01-26 14:16:27.758 | DEBUG    | __main__:trials:24 - Trial = 876/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.759 | DEBUG    | __main__:trials:29 - Trial = 876/30000 | Total reward = 48.12
2022-01-26 14:16:27.764 | DEBUG    | __main__:trials:26 - Trial = 877/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.765 | DEBUG    | __main__:trials:29 - Trial = 877/30000 | Total reward = 41.14
2022-01-26 14:16:27.769 | DEBUG    | __main__:trials:24 - Trial = 878/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.771 | DEBUG    | __main__:trials:29 - Trial = 878/30000 | Total reward = 47.58
2022-01-26 14:16:27.774 | DEBUG    | __main__:trials:24 - Trial = 879/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.776 | DEBUG    | __main__:trials:29 - Trial = 879/30000 | Total reward = 36.84
2022-01-26 14:16:27.779 | DEBUG    | __main__:trials:24 - Trial = 880/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.780 | DEBUG    | __main__:trials:29 - Trial = 880/30000 | Total reward = 57.96
2022-01-26 14:16:27.784 | DEBUG    | __main__:trials:24 - Trial = 881/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.785 | DEBUG    | __main__:trials:29 - Trial = 881/30000 | Total reward = 45.77
2022-01-26 14:16:27.789 | DEBUG    | __main__:trials:24 - Trial = 882/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.790 | DEBUG    | __main__:trials:29 - Trial = 882/30000 | Total reward = 39.24
2022-01-26 14:16:27.794 | DEBUG    | __main__:trials:24 - Trial = 883/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.796 | DEBUG    | __main__:trials:29 - Trial = 883/30000 | Total reward = 48.95
2022-01-26 14:16:27.799 | DEBUG    | __main__:trials:24 - Trial = 884/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.801 | DEBUG    | __main__:trials:29 - Trial = 884/30000 | Total reward = 25.24
2022-01-26 14:16:27.805 | DEBUG    | __main__:trials:24 - Trial = 885/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.805 | DEBUG    | __main__:trials:29 - Trial = 885/30000 | Total reward = 41.27
2022-01-26 14:16:27.810 | DEBUG    | __main__:trials:24 - Trial = 886/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.810 | DEBUG    | __main__:trials:29 - Trial = 886/30000 | Total reward = 49.74
2022-01-26 14:16:27.815 | DEBUG    | __main__:trials:24 - Trial = 887/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.817 | DEBUG    | __main__:trials:29 - Trial = 887/30000 | Total reward = 33.03
2022-01-26 14:16:27.819 | DEBUG    | __main__:trials:26 - Trial = 888/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.820 | DEBUG    | __main__:trials:29 - Trial = 888/30000 | Total reward = 10.12
2022-01-26 14:16:27.824 | DEBUG    | __main__:trials:24 - Trial = 889/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.825 | DEBUG    | __main__:trials:29 - Trial = 889/30000 | Total reward = 50.54
2022-01-26 14:16:27.828 | DEBUG    | __main__:trials:24 - Trial = 890/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.830 | DEBUG    | __main__:trials:29 - Trial = 890/30000 | Total reward = 46.27
2022-01-26 14:16:27.835 | DEBUG    | __main__:trials:24 - Trial = 891/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.836 | DEBUG    | __main__:trials:29 - Trial = 891/30000 | Total reward = 43.30
2022-01-26 14:16:27.840 | DEBUG    | __main__:trials:26 - Trial = 892/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.841 | DEBUG    | __main__:trials:29 - Trial = 892/30000 | Total reward = 32.65
2022-01-26 14:16:27.845 | DEBUG    | __main__:trials:24 - Trial = 893/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.847 | DEBUG    | __main__:trials:29 - Trial = 893/30000 | Total reward = 45.71
2022-01-26 14:16:27.849 | DEBUG    | __main__:trials:26 - Trial = 894/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.850 | DEBUG    | __main__:trials:29 - Trial = 894/30000 | Total reward = 16.55
2022-01-26 14:16:27.853 | DEBUG    | __main__:trials:24 - Trial = 895/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.854 | DEBUG    | __main__:trials:29 - Trial = 895/30000 | Total reward = 47.62
2022-01-26 14:16:27.856 | DEBUG    | __main__:trials:26 - Trial = 896/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.857 | DEBUG    | __main__:trials:29 - Trial = 896/30000 | Total reward = 9.46
2022-01-26 14:16:27.860 | DEBUG    | __main__:trials:24 - Trial = 897/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.862 | DEBUG    | __main__:trials:29 - Trial = 897/30000 | Total reward = 44.66
2022-01-26 14:16:27.865 | DEBUG    | __main__:trials:24 - Trial = 898/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.866 | DEBUG    | __main__:trials:29 - Trial = 898/30000 | Total reward = 48.35
2022-01-26 14:16:27.870 | DEBUG    | __main__:trials:24 - Trial = 899/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.871 | DEBUG    | __main__:trials:29 - Trial = 899/30000 | Total reward = 45.28
2022-01-26 14:16:27.875 | DEBUG    | __main__:trials:24 - Trial = 900/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.877 | DEBUG    | __main__:trials:29 - Trial = 900/30000 | Total reward = 47.77
2022-01-26 14:16:27.881 | DEBUG    | __main__:trials:24 - Trial = 901/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.882 | DEBUG    | __main__:trials:29 - Trial = 901/30000 | Total reward = 53.67
2022-01-26 14:16:27.886 | DEBUG    | __main__:trials:24 - Trial = 902/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.887 | DEBUG    | __main__:trials:29 - Trial = 902/30000 | Total reward = 42.37
2022-01-26 14:16:27.890 | DEBUG    | __main__:trials:24 - Trial = 903/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.892 | DEBUG    | __main__:trials:29 - Trial = 903/30000 | Total reward = 54.54
2022-01-26 14:16:27.895 | DEBUG    | __main__:trials:24 - Trial = 904/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.898 | DEBUG    | __main__:trials:29 - Trial = 904/30000 | Total reward = 46.57
2022-01-26 14:16:27.901 | DEBUG    | __main__:trials:26 - Trial = 905/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.903 | DEBUG    | __main__:trials:29 - Trial = 905/30000 | Total reward = 31.44
2022-01-26 14:16:27.907 | DEBUG    | __main__:trials:24 - Trial = 906/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.909 | DEBUG    | __main__:trials:29 - Trial = 906/30000 | Total reward = 42.19
2022-01-26 14:16:27.912 | DEBUG    | __main__:trials:24 - Trial = 907/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.914 | DEBUG    | __main__:trials:29 - Trial = 907/30000 | Total reward = 44.09
2022-01-26 14:16:27.917 | DEBUG    | __main__:trials:26 - Trial = 908/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:27.917 | DEBUG    | __main__:trials:29 - Trial = 908/30000 | Total reward = 13.21
2022-01-26 14:16:27.922 | DEBUG    | __main__:trials:24 - Trial = 909/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.923 | DEBUG    | __main__:trials:29 - Trial = 909/30000 | Total reward = 37.92
2022-01-26 14:16:27.927 | DEBUG    | __main__:trials:24 - Trial = 910/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.928 | DEBUG    | __main__:trials:29 - Trial = 910/30000 | Total reward = 40.97
2022-01-26 14:16:27.932 | DEBUG    | __main__:trials:24 - Trial = 911/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.934 | DEBUG    | __main__:trials:29 - Trial = 911/30000 | Total reward = 42.28
2022-01-26 14:16:27.938 | DEBUG    | __main__:trials:24 - Trial = 912/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.940 | DEBUG    | __main__:trials:29 - Trial = 912/30000 | Total reward = 42.64
2022-01-26 14:16:27.942 | DEBUG    | __main__:trials:24 - Trial = 913/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.944 | DEBUG    | __main__:trials:29 - Trial = 913/30000 | Total reward = 46.27
2022-01-26 14:16:27.947 | DEBUG    | __main__:trials:24 - Trial = 914/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.949 | DEBUG    | __main__:trials:29 - Trial = 914/30000 | Total reward = 43.99
2022-01-26 14:16:27.953 | DEBUG    | __main__:trials:24 - Trial = 915/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.954 | DEBUG    | __main__:trials:29 - Trial = 915/30000 | Total reward = 47.43
2022-01-26 14:16:27.958 | DEBUG    | __main__:trials:24 - Trial = 916/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.959 | DEBUG    | __main__:trials:29 - Trial = 916/30000 | Total reward = 47.28
2022-01-26 14:16:27.963 | DEBUG    | __main__:trials:24 - Trial = 917/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.964 | DEBUG    | __main__:trials:29 - Trial = 917/30000 | Total reward = 42.70
2022-01-26 14:16:27.968 | DEBUG    | __main__:trials:24 - Trial = 918/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.970 | DEBUG    | __main__:trials:29 - Trial = 918/30000 | Total reward = 41.18
2022-01-26 14:16:27.973 | DEBUG    | __main__:trials:24 - Trial = 919/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.975 | DEBUG    | __main__:trials:29 - Trial = 919/30000 | Total reward = 50.02
2022-01-26 14:16:27.979 | DEBUG    | __main__:trials:24 - Trial = 920/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.980 | DEBUG    | __main__:trials:29 - Trial = 920/30000 | Total reward = 44.92
2022-01-26 14:16:27.984 | DEBUG    | __main__:trials:24 - Trial = 921/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.984 | DEBUG    | __main__:trials:29 - Trial = 921/30000 | Total reward = 43.95
2022-01-26 14:16:27.988 | DEBUG    | __main__:trials:24 - Trial = 922/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.989 | DEBUG    | __main__:trials:29 - Trial = 922/30000 | Total reward = 41.16
2022-01-26 14:16:27.992 | DEBUG    | __main__:trials:24 - Trial = 923/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.994 | DEBUG    | __main__:trials:29 - Trial = 923/30000 | Total reward = 32.79
2022-01-26 14:16:27.998 | DEBUG    | __main__:trials:24 - Trial = 924/30000 | Max number of steps (20) reached
2022-01-26 14:16:27.999 | DEBUG    | __main__:trials:29 - Trial = 924/30000 | Total reward = 48.38
2022-01-26 14:16:28.002 | DEBUG    | __main__:trials:24 - Trial = 925/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.004 | DEBUG    | __main__:trials:29 - Trial = 925/30000 | Total reward = 44.37
2022-01-26 14:16:28.008 | DEBUG    | __main__:trials:24 - Trial = 926/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.009 | DEBUG    | __main__:trials:29 - Trial = 926/30000 | Total reward = 47.35
2022-01-26 14:16:28.013 | DEBUG    | __main__:trials:24 - Trial = 927/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.015 | DEBUG    | __main__:trials:29 - Trial = 927/30000 | Total reward = 51.81
2022-01-26 14:16:28.019 | DEBUG    | __main__:trials:24 - Trial = 928/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.021 | DEBUG    | __main__:trials:29 - Trial = 928/30000 | Total reward = 44.49
2022-01-26 14:16:28.025 | DEBUG    | __main__:trials:24 - Trial = 929/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.026 | DEBUG    | __main__:trials:29 - Trial = 929/30000 | Total reward = 43.21
2022-01-26 14:16:28.029 | DEBUG    | __main__:trials:24 - Trial = 930/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.030 | DEBUG    | __main__:trials:29 - Trial = 930/30000 | Total reward = 53.01
2022-01-26 14:16:28.033 | DEBUG    | __main__:trials:24 - Trial = 931/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.035 | DEBUG    | __main__:trials:29 - Trial = 931/30000 | Total reward = 53.37
2022-01-26 14:16:28.039 | DEBUG    | __main__:trials:24 - Trial = 932/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.041 | DEBUG    | __main__:trials:29 - Trial = 932/30000 | Total reward = 41.85
2022-01-26 14:16:28.044 | DEBUG    | __main__:trials:24 - Trial = 933/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.045 | DEBUG    | __main__:trials:29 - Trial = 933/30000 | Total reward = 41.16
2022-01-26 14:16:28.048 | DEBUG    | __main__:trials:24 - Trial = 934/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.049 | DEBUG    | __main__:trials:29 - Trial = 934/30000 | Total reward = 46.79
2022-01-26 14:16:28.052 | DEBUG    | __main__:trials:24 - Trial = 935/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.054 | DEBUG    | __main__:trials:29 - Trial = 935/30000 | Total reward = 46.14
2022-01-26 14:16:28.056 | DEBUG    | __main__:trials:26 - Trial = 936/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.058 | DEBUG    | __main__:trials:29 - Trial = 936/30000 | Total reward = 21.79
2022-01-26 14:16:28.062 | DEBUG    | __main__:trials:24 - Trial = 937/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.064 | DEBUG    | __main__:trials:29 - Trial = 937/30000 | Total reward = 47.04
2022-01-26 14:16:28.067 | DEBUG    | __main__:trials:24 - Trial = 938/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.068 | DEBUG    | __main__:trials:29 - Trial = 938/30000 | Total reward = 51.04
2022-01-26 14:16:28.071 | DEBUG    | __main__:trials:26 - Trial = 939/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.073 | DEBUG    | __main__:trials:29 - Trial = 939/30000 | Total reward = 32.46
2022-01-26 14:16:28.077 | DEBUG    | __main__:trials:24 - Trial = 940/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.078 | DEBUG    | __main__:trials:29 - Trial = 940/30000 | Total reward = 45.71
2022-01-26 14:16:28.081 | DEBUG    | __main__:trials:24 - Trial = 941/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.082 | DEBUG    | __main__:trials:29 - Trial = 941/30000 | Total reward = 49.50
2022-01-26 14:16:28.085 | DEBUG    | __main__:trials:26 - Trial = 942/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.086 | DEBUG    | __main__:trials:29 - Trial = 942/30000 | Total reward = 32.57
2022-01-26 14:16:28.089 | DEBUG    | __main__:trials:24 - Trial = 943/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.090 | DEBUG    | __main__:trials:29 - Trial = 943/30000 | Total reward = 47.04
2022-01-26 14:16:28.093 | DEBUG    | __main__:trials:24 - Trial = 944/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.095 | DEBUG    | __main__:trials:29 - Trial = 944/30000 | Total reward = 45.54
2022-01-26 14:16:28.098 | DEBUG    | __main__:trials:24 - Trial = 945/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.100 | DEBUG    | __main__:trials:29 - Trial = 945/30000 | Total reward = 46.71
2022-01-26 14:16:28.103 | DEBUG    | __main__:trials:24 - Trial = 946/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.105 | DEBUG    | __main__:trials:29 - Trial = 946/30000 | Total reward = 46.33
2022-01-26 14:16:28.109 | DEBUG    | __main__:trials:24 - Trial = 947/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.111 | DEBUG    | __main__:trials:29 - Trial = 947/30000 | Total reward = 9.23
2022-01-26 14:16:28.115 | DEBUG    | __main__:trials:24 - Trial = 948/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.116 | DEBUG    | __main__:trials:29 - Trial = 948/30000 | Total reward = 46.88
2022-01-26 14:16:28.120 | DEBUG    | __main__:trials:24 - Trial = 949/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.122 | DEBUG    | __main__:trials:29 - Trial = 949/30000 | Total reward = 46.53
2022-01-26 14:16:28.125 | DEBUG    | __main__:trials:24 - Trial = 950/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.127 | DEBUG    | __main__:trials:29 - Trial = 950/30000 | Total reward = 46.32
2022-01-26 14:16:28.131 | DEBUG    | __main__:trials:24 - Trial = 951/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.132 | DEBUG    | __main__:trials:29 - Trial = 951/30000 | Total reward = 45.09
2022-01-26 14:16:28.136 | DEBUG    | __main__:trials:24 - Trial = 952/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.137 | DEBUG    | __main__:trials:29 - Trial = 952/30000 | Total reward = 44.77
2022-01-26 14:16:28.140 | DEBUG    | __main__:trials:24 - Trial = 953/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.141 | DEBUG    | __main__:trials:29 - Trial = 953/30000 | Total reward = 44.78
2022-01-26 14:16:28.143 | DEBUG    | __main__:trials:26 - Trial = 954/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.144 | DEBUG    | __main__:trials:29 - Trial = 954/30000 | Total reward = 10.56
2022-01-26 14:16:28.148 | DEBUG    | __main__:trials:24 - Trial = 955/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.150 | DEBUG    | __main__:trials:29 - Trial = 955/30000 | Total reward = 45.00
2022-01-26 14:16:28.153 | DEBUG    | __main__:trials:24 - Trial = 956/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.154 | DEBUG    | __main__:trials:29 - Trial = 956/30000 | Total reward = 27.05
2022-01-26 14:16:28.157 | DEBUG    | __main__:trials:24 - Trial = 957/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.158 | DEBUG    | __main__:trials:29 - Trial = 957/30000 | Total reward = 47.04
2022-01-26 14:16:28.160 | DEBUG    | __main__:trials:26 - Trial = 958/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.162 | DEBUG    | __main__:trials:29 - Trial = 958/30000 | Total reward = 12.40
2022-01-26 14:16:28.166 | DEBUG    | __main__:trials:24 - Trial = 959/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.167 | DEBUG    | __main__:trials:29 - Trial = 959/30000 | Total reward = 34.97
2022-01-26 14:16:28.170 | DEBUG    | __main__:trials:24 - Trial = 960/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.172 | DEBUG    | __main__:trials:29 - Trial = 960/30000 | Total reward = 42.47
2022-01-26 14:16:28.176 | DEBUG    | __main__:trials:24 - Trial = 961/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.178 | DEBUG    | __main__:trials:29 - Trial = 961/30000 | Total reward = 45.49
2022-01-26 14:16:28.181 | DEBUG    | __main__:trials:24 - Trial = 962/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.183 | DEBUG    | __main__:trials:29 - Trial = 962/30000 | Total reward = 41.95
2022-01-26 14:16:28.187 | DEBUG    | __main__:trials:24 - Trial = 963/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.189 | DEBUG    | __main__:trials:29 - Trial = 963/30000 | Total reward = 47.79
2022-01-26 14:16:28.192 | DEBUG    | __main__:trials:24 - Trial = 964/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.193 | DEBUG    | __main__:trials:29 - Trial = 964/30000 | Total reward = 47.22
2022-01-26 14:16:28.198 | DEBUG    | __main__:trials:24 - Trial = 965/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.199 | DEBUG    | __main__:trials:29 - Trial = 965/30000 | Total reward = 48.99
2022-01-26 14:16:28.202 | DEBUG    | __main__:trials:26 - Trial = 966/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.204 | DEBUG    | __main__:trials:29 - Trial = 966/30000 | Total reward = 20.52
2022-01-26 14:16:28.207 | DEBUG    | __main__:trials:24 - Trial = 967/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.209 | DEBUG    | __main__:trials:29 - Trial = 967/30000 | Total reward = 27.13
2022-01-26 14:16:28.212 | DEBUG    | __main__:trials:24 - Trial = 968/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.214 | DEBUG    | __main__:trials:29 - Trial = 968/30000 | Total reward = 44.18
2022-01-26 14:16:28.218 | DEBUG    | __main__:trials:24 - Trial = 969/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.220 | DEBUG    | __main__:trials:29 - Trial = 969/30000 | Total reward = 51.55
2022-01-26 14:16:28.224 | DEBUG    | __main__:trials:24 - Trial = 970/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.226 | DEBUG    | __main__:trials:29 - Trial = 970/30000 | Total reward = 37.60
2022-01-26 14:16:28.230 | DEBUG    | __main__:trials:24 - Trial = 971/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.230 | DEBUG    | __main__:trials:29 - Trial = 971/30000 | Total reward = 44.04
2022-01-26 14:16:28.234 | DEBUG    | __main__:trials:24 - Trial = 972/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.236 | DEBUG    | __main__:trials:29 - Trial = 972/30000 | Total reward = 47.63
2022-01-26 14:16:28.240 | DEBUG    | __main__:trials:24 - Trial = 973/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.241 | DEBUG    | __main__:trials:29 - Trial = 973/30000 | Total reward = 46.26
2022-01-26 14:16:28.245 | DEBUG    | __main__:trials:24 - Trial = 974/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.246 | DEBUG    | __main__:trials:29 - Trial = 974/30000 | Total reward = 31.22
2022-01-26 14:16:28.248 | DEBUG    | __main__:trials:26 - Trial = 975/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.250 | DEBUG    | __main__:trials:29 - Trial = 975/30000 | Total reward = 9.16
2022-01-26 14:16:28.254 | DEBUG    | __main__:trials:24 - Trial = 976/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.255 | DEBUG    | __main__:trials:29 - Trial = 976/30000 | Total reward = 45.90
2022-01-26 14:16:28.258 | DEBUG    | __main__:trials:24 - Trial = 977/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.260 | DEBUG    | __main__:trials:29 - Trial = 977/30000 | Total reward = 45.18
2022-01-26 14:16:28.264 | DEBUG    | __main__:trials:24 - Trial = 978/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.265 | DEBUG    | __main__:trials:29 - Trial = 978/30000 | Total reward = 45.56
2022-01-26 14:16:28.269 | DEBUG    | __main__:trials:24 - Trial = 979/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.271 | DEBUG    | __main__:trials:29 - Trial = 979/30000 | Total reward = 28.46
2022-01-26 14:16:28.274 | DEBUG    | __main__:trials:24 - Trial = 980/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.276 | DEBUG    | __main__:trials:29 - Trial = 980/30000 | Total reward = 39.48
2022-01-26 14:16:28.280 | DEBUG    | __main__:trials:24 - Trial = 981/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.281 | DEBUG    | __main__:trials:29 - Trial = 981/30000 | Total reward = 37.94
2022-01-26 14:16:28.285 | DEBUG    | __main__:trials:24 - Trial = 982/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.286 | DEBUG    | __main__:trials:29 - Trial = 982/30000 | Total reward = 43.57
2022-01-26 14:16:28.290 | DEBUG    | __main__:trials:24 - Trial = 983/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.291 | DEBUG    | __main__:trials:29 - Trial = 983/30000 | Total reward = 44.35
2022-01-26 14:16:28.294 | DEBUG    | __main__:trials:24 - Trial = 984/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.296 | DEBUG    | __main__:trials:29 - Trial = 984/30000 | Total reward = 46.10
2022-01-26 14:16:28.300 | DEBUG    | __main__:trials:24 - Trial = 985/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.301 | DEBUG    | __main__:trials:29 - Trial = 985/30000 | Total reward = 51.61
2022-01-26 14:16:28.305 | DEBUG    | __main__:trials:24 - Trial = 986/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.307 | DEBUG    | __main__:trials:29 - Trial = 986/30000 | Total reward = 47.14
2022-01-26 14:16:28.311 | DEBUG    | __main__:trials:24 - Trial = 987/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.311 | DEBUG    | __main__:trials:29 - Trial = 987/30000 | Total reward = 44.13
2022-01-26 14:16:28.315 | DEBUG    | __main__:trials:24 - Trial = 988/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.316 | DEBUG    | __main__:trials:29 - Trial = 988/30000 | Total reward = 50.55
2022-01-26 14:16:28.320 | DEBUG    | __main__:trials:24 - Trial = 989/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.322 | DEBUG    | __main__:trials:29 - Trial = 989/30000 | Total reward = 38.16
2022-01-26 14:16:28.325 | DEBUG    | __main__:trials:24 - Trial = 990/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.326 | DEBUG    | __main__:trials:29 - Trial = 990/30000 | Total reward = 44.10
2022-01-26 14:16:28.329 | DEBUG    | __main__:trials:24 - Trial = 991/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.331 | DEBUG    | __main__:trials:29 - Trial = 991/30000 | Total reward = 46.33
2022-01-26 14:16:28.334 | DEBUG    | __main__:trials:24 - Trial = 992/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.335 | DEBUG    | __main__:trials:29 - Trial = 992/30000 | Total reward = 47.03
2022-01-26 14:16:28.338 | DEBUG    | __main__:trials:24 - Trial = 993/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.340 | DEBUG    | __main__:trials:29 - Trial = 993/30000 | Total reward = 31.60
2022-01-26 14:16:28.343 | DEBUG    | __main__:trials:24 - Trial = 994/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.345 | DEBUG    | __main__:trials:29 - Trial = 994/30000 | Total reward = 59.80
2022-01-26 14:16:28.348 | DEBUG    | __main__:trials:24 - Trial = 995/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.350 | DEBUG    | __main__:trials:29 - Trial = 995/30000 | Total reward = 52.26
2022-01-26 14:16:28.354 | DEBUG    | __main__:trials:24 - Trial = 996/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.354 | DEBUG    | __main__:trials:29 - Trial = 996/30000 | Total reward = 42.12
2022-01-26 14:16:28.358 | DEBUG    | __main__:trials:24 - Trial = 997/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.359 | DEBUG    | __main__:trials:29 - Trial = 997/30000 | Total reward = 39.88
2022-01-26 14:16:28.363 | DEBUG    | __main__:trials:24 - Trial = 998/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.365 | DEBUG    | __main__:trials:29 - Trial = 998/30000 | Total reward = 48.82
2022-01-26 14:16:28.367 | DEBUG    | __main__:trials:26 - Trial = 999/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.369 | DEBUG    | __main__:trials:29 - Trial = 999/30000 | Total reward = 16.23
2022-01-26 14:16:28.372 | DEBUG    | __main__:trials:24 - Trial = 1000/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.373 | DEBUG    | __main__:trials:29 - Trial = 1000/30000 | Total reward = 48.35
2022-01-26 14:16:28.377 | DEBUG    | __main__:trials:24 - Trial = 1001/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.379 | DEBUG    | __main__:trials:29 - Trial = 1001/30000 | Total reward = 42.83
2022-01-26 14:16:28.381 | DEBUG    | __main__:trials:26 - Trial = 1002/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.382 | DEBUG    | __main__:trials:29 - Trial = 1002/30000 | Total reward = 8.62
2022-01-26 14:16:28.387 | DEBUG    | __main__:trials:24 - Trial = 1003/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.389 | DEBUG    | __main__:trials:29 - Trial = 1003/30000 | Total reward = 47.03
2022-01-26 14:16:28.391 | DEBUG    | __main__:trials:26 - Trial = 1004/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.393 | DEBUG    | __main__:trials:29 - Trial = 1004/30000 | Total reward = 15.92
2022-01-26 14:16:28.397 | DEBUG    | __main__:trials:24 - Trial = 1005/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.398 | DEBUG    | __main__:trials:29 - Trial = 1005/30000 | Total reward = 41.46
2022-01-26 14:16:28.402 | DEBUG    | __main__:trials:24 - Trial = 1006/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.403 | DEBUG    | __main__:trials:29 - Trial = 1006/30000 | Total reward = 46.37
2022-01-26 14:16:28.407 | DEBUG    | __main__:trials:24 - Trial = 1007/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.408 | DEBUG    | __main__:trials:29 - Trial = 1007/30000 | Total reward = 44.49
2022-01-26 14:16:28.412 | DEBUG    | __main__:trials:24 - Trial = 1008/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.414 | DEBUG    | __main__:trials:29 - Trial = 1008/30000 | Total reward = 46.84
2022-01-26 14:16:28.417 | DEBUG    | __main__:trials:24 - Trial = 1009/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.418 | DEBUG    | __main__:trials:29 - Trial = 1009/30000 | Total reward = 57.75
2022-01-26 14:16:28.423 | DEBUG    | __main__:trials:24 - Trial = 1010/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.424 | DEBUG    | __main__:trials:29 - Trial = 1010/30000 | Total reward = 46.99
2022-01-26 14:16:28.428 | DEBUG    | __main__:trials:24 - Trial = 1011/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.429 | DEBUG    | __main__:trials:29 - Trial = 1011/30000 | Total reward = 41.32
2022-01-26 14:16:28.434 | DEBUG    | __main__:trials:24 - Trial = 1012/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.434 | DEBUG    | __main__:trials:29 - Trial = 1012/30000 | Total reward = 40.43
2022-01-26 14:16:28.439 | DEBUG    | __main__:trials:24 - Trial = 1013/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.441 | DEBUG    | __main__:trials:29 - Trial = 1013/30000 | Total reward = 45.76
2022-01-26 14:16:28.444 | DEBUG    | __main__:trials:24 - Trial = 1014/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.446 | DEBUG    | __main__:trials:29 - Trial = 1014/30000 | Total reward = 42.47
2022-01-26 14:16:28.450 | DEBUG    | __main__:trials:24 - Trial = 1015/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.451 | DEBUG    | __main__:trials:29 - Trial = 1015/30000 | Total reward = 44.78
2022-01-26 14:16:28.454 | DEBUG    | __main__:trials:24 - Trial = 1016/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.456 | DEBUG    | __main__:trials:29 - Trial = 1016/30000 | Total reward = 31.89
2022-01-26 14:16:28.460 | DEBUG    | __main__:trials:24 - Trial = 1017/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.462 | DEBUG    | __main__:trials:29 - Trial = 1017/30000 | Total reward = 48.44
2022-01-26 14:16:28.465 | DEBUG    | __main__:trials:24 - Trial = 1018/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.466 | DEBUG    | __main__:trials:29 - Trial = 1018/30000 | Total reward = 45.12
2022-01-26 14:16:28.471 | DEBUG    | __main__:trials:24 - Trial = 1019/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.472 | DEBUG    | __main__:trials:29 - Trial = 1019/30000 | Total reward = 43.83
2022-01-26 14:16:28.475 | DEBUG    | __main__:trials:24 - Trial = 1020/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.477 | DEBUG    | __main__:trials:29 - Trial = 1020/30000 | Total reward = 42.37
2022-01-26 14:16:28.480 | DEBUG    | __main__:trials:24 - Trial = 1021/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.481 | DEBUG    | __main__:trials:29 - Trial = 1021/30000 | Total reward = 52.11
2022-01-26 14:16:28.484 | DEBUG    | __main__:trials:24 - Trial = 1022/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.486 | DEBUG    | __main__:trials:29 - Trial = 1022/30000 | Total reward = 39.64
2022-01-26 14:16:28.490 | DEBUG    | __main__:trials:24 - Trial = 1023/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.491 | DEBUG    | __main__:trials:29 - Trial = 1023/30000 | Total reward = 42.54
2022-01-26 14:16:28.495 | DEBUG    | __main__:trials:24 - Trial = 1024/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.496 | DEBUG    | __main__:trials:29 - Trial = 1024/30000 | Total reward = 37.75
2022-01-26 14:16:28.500 | DEBUG    | __main__:trials:24 - Trial = 1025/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.501 | DEBUG    | __main__:trials:29 - Trial = 1025/30000 | Total reward = 50.10
2022-01-26 14:16:28.505 | DEBUG    | __main__:trials:24 - Trial = 1026/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.507 | DEBUG    | __main__:trials:29 - Trial = 1026/30000 | Total reward = 52.83
2022-01-26 14:16:28.511 | DEBUG    | __main__:trials:24 - Trial = 1027/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.513 | DEBUG    | __main__:trials:29 - Trial = 1027/30000 | Total reward = 44.28
2022-01-26 14:16:28.517 | DEBUG    | __main__:trials:24 - Trial = 1028/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.518 | DEBUG    | __main__:trials:29 - Trial = 1028/30000 | Total reward = 40.63
2022-01-26 14:16:28.521 | DEBUG    | __main__:trials:26 - Trial = 1029/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.522 | DEBUG    | __main__:trials:29 - Trial = 1029/30000 | Total reward = 11.40
2022-01-26 14:16:28.526 | DEBUG    | __main__:trials:24 - Trial = 1030/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.527 | DEBUG    | __main__:trials:29 - Trial = 1030/30000 | Total reward = 41.84
2022-01-26 14:16:28.530 | DEBUG    | __main__:trials:24 - Trial = 1031/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.532 | DEBUG    | __main__:trials:29 - Trial = 1031/30000 | Total reward = 46.99
2022-01-26 14:16:28.536 | DEBUG    | __main__:trials:24 - Trial = 1032/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.537 | DEBUG    | __main__:trials:29 - Trial = 1032/30000 | Total reward = 44.72
2022-01-26 14:16:28.541 | DEBUG    | __main__:trials:26 - Trial = 1033/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.542 | DEBUG    | __main__:trials:29 - Trial = 1033/30000 | Total reward = 25.18
2022-01-26 14:16:28.546 | DEBUG    | __main__:trials:24 - Trial = 1034/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.547 | DEBUG    | __main__:trials:29 - Trial = 1034/30000 | Total reward = 46.71
2022-01-26 14:16:28.551 | DEBUG    | __main__:trials:24 - Trial = 1035/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.553 | DEBUG    | __main__:trials:29 - Trial = 1035/30000 | Total reward = 47.04
2022-01-26 14:16:28.556 | DEBUG    | __main__:trials:24 - Trial = 1036/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.557 | DEBUG    | __main__:trials:29 - Trial = 1036/30000 | Total reward = 44.47
2022-01-26 14:16:28.561 | DEBUG    | __main__:trials:24 - Trial = 1037/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.562 | DEBUG    | __main__:trials:29 - Trial = 1037/30000 | Total reward = 43.62
2022-01-26 14:16:28.567 | DEBUG    | __main__:trials:24 - Trial = 1038/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.567 | DEBUG    | __main__:trials:29 - Trial = 1038/30000 | Total reward = 43.17
2022-01-26 14:16:28.571 | DEBUG    | __main__:trials:24 - Trial = 1039/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.572 | DEBUG    | __main__:trials:29 - Trial = 1039/30000 | Total reward = 52.08
2022-01-26 14:16:28.576 | DEBUG    | __main__:trials:24 - Trial = 1040/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.578 | DEBUG    | __main__:trials:29 - Trial = 1040/30000 | Total reward = 42.44
2022-01-26 14:16:28.581 | DEBUG    | __main__:trials:24 - Trial = 1041/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.582 | DEBUG    | __main__:trials:29 - Trial = 1041/30000 | Total reward = 39.24
2022-01-26 14:16:28.585 | DEBUG    | __main__:trials:24 - Trial = 1042/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.586 | DEBUG    | __main__:trials:29 - Trial = 1042/30000 | Total reward = 43.86
2022-01-26 14:16:28.589 | DEBUG    | __main__:trials:24 - Trial = 1043/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.591 | DEBUG    | __main__:trials:29 - Trial = 1043/30000 | Total reward = 43.81
2022-01-26 14:16:28.595 | DEBUG    | __main__:trials:24 - Trial = 1044/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.596 | DEBUG    | __main__:trials:29 - Trial = 1044/30000 | Total reward = 44.29
2022-01-26 14:16:28.599 | DEBUG    | __main__:trials:26 - Trial = 1045/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.600 | DEBUG    | __main__:trials:29 - Trial = 1045/30000 | Total reward = 14.67
2022-01-26 14:16:28.604 | DEBUG    | __main__:trials:24 - Trial = 1046/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.605 | DEBUG    | __main__:trials:29 - Trial = 1046/30000 | Total reward = 52.46
2022-01-26 14:16:28.609 | DEBUG    | __main__:trials:24 - Trial = 1047/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.610 | DEBUG    | __main__:trials:29 - Trial = 1047/30000 | Total reward = 43.96
2022-01-26 14:16:28.614 | DEBUG    | __main__:trials:24 - Trial = 1048/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.614 | DEBUG    | __main__:trials:29 - Trial = 1048/30000 | Total reward = 42.86
2022-01-26 14:16:28.618 | DEBUG    | __main__:trials:24 - Trial = 1049/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.620 | DEBUG    | __main__:trials:29 - Trial = 1049/30000 | Total reward = 47.37
2022-01-26 14:16:28.623 | DEBUG    | __main__:trials:24 - Trial = 1050/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.625 | DEBUG    | __main__:trials:29 - Trial = 1050/30000 | Total reward = 47.04
2022-01-26 14:16:28.629 | DEBUG    | __main__:trials:24 - Trial = 1051/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.629 | DEBUG    | __main__:trials:29 - Trial = 1051/30000 | Total reward = 45.95
2022-01-26 14:16:28.633 | DEBUG    | __main__:trials:24 - Trial = 1052/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.634 | DEBUG    | __main__:trials:29 - Trial = 1052/30000 | Total reward = 47.63
2022-01-26 14:16:28.638 | DEBUG    | __main__:trials:24 - Trial = 1053/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.639 | DEBUG    | __main__:trials:29 - Trial = 1053/30000 | Total reward = 43.56
2022-01-26 14:16:28.643 | DEBUG    | __main__:trials:24 - Trial = 1054/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.644 | DEBUG    | __main__:trials:29 - Trial = 1054/30000 | Total reward = 42.80
2022-01-26 14:16:28.648 | DEBUG    | __main__:trials:24 - Trial = 1055/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.650 | DEBUG    | __main__:trials:29 - Trial = 1055/30000 | Total reward = 44.47
2022-01-26 14:16:28.654 | DEBUG    | __main__:trials:24 - Trial = 1056/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.655 | DEBUG    | __main__:trials:29 - Trial = 1056/30000 | Total reward = 45.59
2022-01-26 14:16:28.658 | DEBUG    | __main__:trials:26 - Trial = 1057/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.660 | DEBUG    | __main__:trials:29 - Trial = 1057/30000 | Total reward = 9.23
2022-01-26 14:16:28.663 | DEBUG    | __main__:trials:24 - Trial = 1058/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.664 | DEBUG    | __main__:trials:29 - Trial = 1058/30000 | Total reward = 44.27
2022-01-26 14:16:28.668 | DEBUG    | __main__:trials:24 - Trial = 1059/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.670 | DEBUG    | __main__:trials:29 - Trial = 1059/30000 | Total reward = 41.65
2022-01-26 14:16:28.674 | DEBUG    | __main__:trials:24 - Trial = 1060/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.675 | DEBUG    | __main__:trials:29 - Trial = 1060/30000 | Total reward = 45.00
2022-01-26 14:16:28.679 | DEBUG    | __main__:trials:24 - Trial = 1061/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.680 | DEBUG    | __main__:trials:29 - Trial = 1061/30000 | Total reward = 45.61
2022-01-26 14:16:28.684 | DEBUG    | __main__:trials:24 - Trial = 1062/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.685 | DEBUG    | __main__:trials:29 - Trial = 1062/30000 | Total reward = 45.94
2022-01-26 14:16:28.689 | DEBUG    | __main__:trials:24 - Trial = 1063/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.691 | DEBUG    | __main__:trials:29 - Trial = 1063/30000 | Total reward = 51.24
2022-01-26 14:16:28.695 | DEBUG    | __main__:trials:24 - Trial = 1064/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.696 | DEBUG    | __main__:trials:29 - Trial = 1064/30000 | Total reward = 52.92
2022-01-26 14:16:28.700 | DEBUG    | __main__:trials:24 - Trial = 1065/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.702 | DEBUG    | __main__:trials:29 - Trial = 1065/30000 | Total reward = 46.63
2022-01-26 14:16:28.705 | DEBUG    | __main__:trials:24 - Trial = 1066/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.706 | DEBUG    | __main__:trials:29 - Trial = 1066/30000 | Total reward = 45.55
2022-01-26 14:16:28.711 | DEBUG    | __main__:trials:24 - Trial = 1067/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.712 | DEBUG    | __main__:trials:29 - Trial = 1067/30000 | Total reward = 45.90
2022-01-26 14:16:28.715 | DEBUG    | __main__:trials:26 - Trial = 1068/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.716 | DEBUG    | __main__:trials:29 - Trial = 1068/30000 | Total reward = 16.00
2022-01-26 14:16:28.721 | DEBUG    | __main__:trials:24 - Trial = 1069/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.722 | DEBUG    | __main__:trials:29 - Trial = 1069/30000 | Total reward = 50.17
2022-01-26 14:16:28.726 | DEBUG    | __main__:trials:24 - Trial = 1070/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.726 | DEBUG    | __main__:trials:29 - Trial = 1070/30000 | Total reward = 46.42
2022-01-26 14:16:28.731 | DEBUG    | __main__:trials:24 - Trial = 1071/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.732 | DEBUG    | __main__:trials:29 - Trial = 1071/30000 | Total reward = 48.68
2022-01-26 14:16:28.735 | DEBUG    | __main__:trials:24 - Trial = 1072/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.737 | DEBUG    | __main__:trials:29 - Trial = 1072/30000 | Total reward = 31.79
2022-01-26 14:16:28.740 | DEBUG    | __main__:trials:24 - Trial = 1073/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.741 | DEBUG    | __main__:trials:29 - Trial = 1073/30000 | Total reward = 26.28
2022-01-26 14:16:28.746 | DEBUG    | __main__:trials:24 - Trial = 1074/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.748 | DEBUG    | __main__:trials:29 - Trial = 1074/30000 | Total reward = 40.82
2022-01-26 14:16:28.751 | DEBUG    | __main__:trials:24 - Trial = 1075/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.752 | DEBUG    | __main__:trials:29 - Trial = 1075/30000 | Total reward = 27.74
2022-01-26 14:16:28.756 | DEBUG    | __main__:trials:24 - Trial = 1076/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.757 | DEBUG    | __main__:trials:29 - Trial = 1076/30000 | Total reward = 45.94
2022-01-26 14:16:28.760 | DEBUG    | __main__:trials:24 - Trial = 1077/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.762 | DEBUG    | __main__:trials:29 - Trial = 1077/30000 | Total reward = 47.04
2022-01-26 14:16:28.766 | DEBUG    | __main__:trials:24 - Trial = 1078/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.766 | DEBUG    | __main__:trials:29 - Trial = 1078/30000 | Total reward = 49.58
2022-01-26 14:16:28.770 | DEBUG    | __main__:trials:26 - Trial = 1079/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.772 | DEBUG    | __main__:trials:29 - Trial = 1079/30000 | Total reward = 19.19
2022-01-26 14:16:28.774 | DEBUG    | __main__:trials:24 - Trial = 1080/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.776 | DEBUG    | __main__:trials:29 - Trial = 1080/30000 | Total reward = 37.95
2022-01-26 14:16:28.779 | DEBUG    | __main__:trials:24 - Trial = 1081/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.781 | DEBUG    | __main__:trials:29 - Trial = 1081/30000 | Total reward = 41.21
2022-01-26 14:16:28.784 | DEBUG    | __main__:trials:24 - Trial = 1082/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.785 | DEBUG    | __main__:trials:29 - Trial = 1082/30000 | Total reward = 44.97
2022-01-26 14:16:28.788 | DEBUG    | __main__:trials:24 - Trial = 1083/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.790 | DEBUG    | __main__:trials:29 - Trial = 1083/30000 | Total reward = 46.18
2022-01-26 14:16:28.794 | DEBUG    | __main__:trials:24 - Trial = 1084/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.796 | DEBUG    | __main__:trials:29 - Trial = 1084/30000 | Total reward = 46.69
2022-01-26 14:16:28.799 | DEBUG    | __main__:trials:24 - Trial = 1085/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.800 | DEBUG    | __main__:trials:29 - Trial = 1085/30000 | Total reward = 46.86
2022-01-26 14:16:28.804 | DEBUG    | __main__:trials:24 - Trial = 1086/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.806 | DEBUG    | __main__:trials:29 - Trial = 1086/30000 | Total reward = 46.93
2022-01-26 14:16:28.809 | DEBUG    | __main__:trials:24 - Trial = 1087/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.811 | DEBUG    | __main__:trials:29 - Trial = 1087/30000 | Total reward = 42.91
2022-01-26 14:16:28.814 | DEBUG    | __main__:trials:24 - Trial = 1088/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.815 | DEBUG    | __main__:trials:29 - Trial = 1088/30000 | Total reward = 42.69
2022-01-26 14:16:28.817 | DEBUG    | __main__:trials:26 - Trial = 1089/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.819 | DEBUG    | __main__:trials:29 - Trial = 1089/30000 | Total reward = 15.99
2022-01-26 14:16:28.822 | DEBUG    | __main__:trials:26 - Trial = 1090/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.823 | DEBUG    | __main__:trials:29 - Trial = 1090/30000 | Total reward = 16.32
2022-01-26 14:16:28.828 | DEBUG    | __main__:trials:24 - Trial = 1091/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.829 | DEBUG    | __main__:trials:29 - Trial = 1091/30000 | Total reward = 47.76
2022-01-26 14:16:28.833 | DEBUG    | __main__:trials:24 - Trial = 1092/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.833 | DEBUG    | __main__:trials:29 - Trial = 1092/30000 | Total reward = 44.02
2022-01-26 14:16:28.838 | DEBUG    | __main__:trials:24 - Trial = 1093/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.838 | DEBUG    | __main__:trials:29 - Trial = 1093/30000 | Total reward = 47.62
2022-01-26 14:16:28.842 | DEBUG    | __main__:trials:24 - Trial = 1094/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.844 | DEBUG    | __main__:trials:29 - Trial = 1094/30000 | Total reward = 43.27
2022-01-26 14:16:28.848 | DEBUG    | __main__:trials:24 - Trial = 1095/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.850 | DEBUG    | __main__:trials:29 - Trial = 1095/30000 | Total reward = 58.86
2022-01-26 14:16:28.853 | DEBUG    | __main__:trials:24 - Trial = 1096/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.854 | DEBUG    | __main__:trials:29 - Trial = 1096/30000 | Total reward = 53.26
2022-01-26 14:16:28.857 | DEBUG    | __main__:trials:24 - Trial = 1097/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.859 | DEBUG    | __main__:trials:29 - Trial = 1097/30000 | Total reward = 45.34
2022-01-26 14:16:28.862 | DEBUG    | __main__:trials:24 - Trial = 1098/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.863 | DEBUG    | __main__:trials:29 - Trial = 1098/30000 | Total reward = 45.07
2022-01-26 14:16:28.867 | DEBUG    | __main__:trials:24 - Trial = 1099/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.869 | DEBUG    | __main__:trials:29 - Trial = 1099/30000 | Total reward = 50.49
2022-01-26 14:16:28.872 | DEBUG    | __main__:trials:24 - Trial = 1100/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.873 | DEBUG    | __main__:trials:29 - Trial = 1100/30000 | Total reward = 47.18
2022-01-26 14:16:28.877 | DEBUG    | __main__:trials:24 - Trial = 1101/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.879 | DEBUG    | __main__:trials:29 - Trial = 1101/30000 | Total reward = 33.05
2022-01-26 14:16:28.882 | DEBUG    | __main__:trials:24 - Trial = 1102/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.883 | DEBUG    | __main__:trials:29 - Trial = 1102/30000 | Total reward = 43.89
2022-01-26 14:16:28.885 | DEBUG    | __main__:trials:26 - Trial = 1103/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.887 | DEBUG    | __main__:trials:29 - Trial = 1103/30000 | Total reward = 10.51
2022-01-26 14:16:28.889 | DEBUG    | __main__:trials:26 - Trial = 1104/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.891 | DEBUG    | __main__:trials:29 - Trial = 1104/30000 | Total reward = 13.72
2022-01-26 14:16:28.895 | DEBUG    | __main__:trials:24 - Trial = 1105/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.895 | DEBUG    | __main__:trials:29 - Trial = 1105/30000 | Total reward = 39.68
2022-01-26 14:16:28.899 | DEBUG    | __main__:trials:26 - Trial = 1106/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.900 | DEBUG    | __main__:trials:29 - Trial = 1106/30000 | Total reward = 17.78
2022-01-26 14:16:28.904 | DEBUG    | __main__:trials:24 - Trial = 1107/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.905 | DEBUG    | __main__:trials:29 - Trial = 1107/30000 | Total reward = 45.51
2022-01-26 14:16:28.909 | DEBUG    | __main__:trials:24 - Trial = 1108/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.911 | DEBUG    | __main__:trials:29 - Trial = 1108/30000 | Total reward = 41.28
2022-01-26 14:16:28.914 | DEBUG    | __main__:trials:24 - Trial = 1109/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.915 | DEBUG    | __main__:trials:29 - Trial = 1109/30000 | Total reward = 52.23
2022-01-26 14:16:28.919 | DEBUG    | __main__:trials:24 - Trial = 1110/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.921 | DEBUG    | __main__:trials:29 - Trial = 1110/30000 | Total reward = 44.85
2022-01-26 14:16:28.924 | DEBUG    | __main__:trials:24 - Trial = 1111/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.925 | DEBUG    | __main__:trials:29 - Trial = 1111/30000 | Total reward = 47.54
2022-01-26 14:16:28.928 | DEBUG    | __main__:trials:26 - Trial = 1112/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.929 | DEBUG    | __main__:trials:29 - Trial = 1112/30000 | Total reward = 18.75
2022-01-26 14:16:28.932 | DEBUG    | __main__:trials:24 - Trial = 1113/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.933 | DEBUG    | __main__:trials:29 - Trial = 1113/30000 | Total reward = 53.75
2022-01-26 14:16:28.937 | DEBUG    | __main__:trials:24 - Trial = 1114/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.938 | DEBUG    | __main__:trials:29 - Trial = 1114/30000 | Total reward = 46.71
2022-01-26 14:16:28.942 | DEBUG    | __main__:trials:24 - Trial = 1115/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.943 | DEBUG    | __main__:trials:29 - Trial = 1115/30000 | Total reward = 53.66
2022-01-26 14:16:28.946 | DEBUG    | __main__:trials:24 - Trial = 1116/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.947 | DEBUG    | __main__:trials:29 - Trial = 1116/30000 | Total reward = 54.96
2022-01-26 14:16:28.950 | DEBUG    | __main__:trials:26 - Trial = 1117/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:28.951 | DEBUG    | __main__:trials:29 - Trial = 1117/30000 | Total reward = 18.35
2022-01-26 14:16:28.955 | DEBUG    | __main__:trials:24 - Trial = 1118/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.956 | DEBUG    | __main__:trials:29 - Trial = 1118/30000 | Total reward = 21.09
2022-01-26 14:16:28.959 | DEBUG    | __main__:trials:24 - Trial = 1119/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.960 | DEBUG    | __main__:trials:29 - Trial = 1119/30000 | Total reward = 39.35
2022-01-26 14:16:28.963 | DEBUG    | __main__:trials:24 - Trial = 1120/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.965 | DEBUG    | __main__:trials:29 - Trial = 1120/30000 | Total reward = 60.71
2022-01-26 14:16:28.968 | DEBUG    | __main__:trials:24 - Trial = 1121/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.970 | DEBUG    | __main__:trials:29 - Trial = 1121/30000 | Total reward = 43.67
2022-01-26 14:16:28.973 | DEBUG    | __main__:trials:24 - Trial = 1122/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.975 | DEBUG    | __main__:trials:29 - Trial = 1122/30000 | Total reward = 45.50
2022-01-26 14:16:28.978 | DEBUG    | __main__:trials:24 - Trial = 1123/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.979 | DEBUG    | __main__:trials:29 - Trial = 1123/30000 | Total reward = 53.87
2022-01-26 14:16:28.983 | DEBUG    | __main__:trials:24 - Trial = 1124/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.985 | DEBUG    | __main__:trials:29 - Trial = 1124/30000 | Total reward = 47.63
2022-01-26 14:16:28.988 | DEBUG    | __main__:trials:24 - Trial = 1125/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.990 | DEBUG    | __main__:trials:29 - Trial = 1125/30000 | Total reward = 43.96
2022-01-26 14:16:28.992 | DEBUG    | __main__:trials:24 - Trial = 1126/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.994 | DEBUG    | __main__:trials:29 - Trial = 1126/30000 | Total reward = 41.88
2022-01-26 14:16:28.998 | DEBUG    | __main__:trials:24 - Trial = 1127/30000 | Max number of steps (20) reached
2022-01-26 14:16:28.998 | DEBUG    | __main__:trials:29 - Trial = 1127/30000 | Total reward = 42.49
2022-01-26 14:16:29.002 | DEBUG    | __main__:trials:26 - Trial = 1128/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.004 | DEBUG    | __main__:trials:29 - Trial = 1128/30000 | Total reward = 20.14
2022-01-26 14:16:29.008 | DEBUG    | __main__:trials:24 - Trial = 1129/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.009 | DEBUG    | __main__:trials:29 - Trial = 1129/30000 | Total reward = 60.35
2022-01-26 14:16:29.013 | DEBUG    | __main__:trials:24 - Trial = 1130/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.014 | DEBUG    | __main__:trials:29 - Trial = 1130/30000 | Total reward = 42.29
2022-01-26 14:16:29.018 | DEBUG    | __main__:trials:24 - Trial = 1131/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.019 | DEBUG    | __main__:trials:29 - Trial = 1131/30000 | Total reward = 47.63
2022-01-26 14:16:29.022 | DEBUG    | __main__:trials:26 - Trial = 1132/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.023 | DEBUG    | __main__:trials:29 - Trial = 1132/30000 | Total reward = 21.79
2022-01-26 14:16:29.027 | DEBUG    | __main__:trials:24 - Trial = 1133/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.029 | DEBUG    | __main__:trials:29 - Trial = 1133/30000 | Total reward = 44.99
2022-01-26 14:16:29.031 | DEBUG    | __main__:trials:26 - Trial = 1134/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.032 | DEBUG    | __main__:trials:29 - Trial = 1134/30000 | Total reward = 10.51
2022-01-26 14:16:29.036 | DEBUG    | __main__:trials:24 - Trial = 1135/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.037 | DEBUG    | __main__:trials:29 - Trial = 1135/30000 | Total reward = 38.63
2022-01-26 14:16:29.039 | DEBUG    | __main__:trials:26 - Trial = 1136/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.041 | DEBUG    | __main__:trials:29 - Trial = 1136/30000 | Total reward = 11.80
2022-01-26 14:16:29.042 | DEBUG    | __main__:trials:26 - Trial = 1137/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.044 | DEBUG    | __main__:trials:29 - Trial = 1137/30000 | Total reward = 13.40
2022-01-26 14:16:29.047 | DEBUG    | __main__:trials:26 - Trial = 1138/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.048 | DEBUG    | __main__:trials:29 - Trial = 1138/30000 | Total reward = 31.70
2022-01-26 14:16:29.052 | DEBUG    | __main__:trials:24 - Trial = 1139/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.054 | DEBUG    | __main__:trials:29 - Trial = 1139/30000 | Total reward = 45.95
2022-01-26 14:16:29.057 | DEBUG    | __main__:trials:26 - Trial = 1140/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.058 | DEBUG    | __main__:trials:29 - Trial = 1140/30000 | Total reward = 24.79
2022-01-26 14:16:29.062 | DEBUG    | __main__:trials:24 - Trial = 1141/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.062 | DEBUG    | __main__:trials:29 - Trial = 1141/30000 | Total reward = 41.50
2022-01-26 14:16:29.067 | DEBUG    | __main__:trials:24 - Trial = 1142/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.068 | DEBUG    | __main__:trials:29 - Trial = 1142/30000 | Total reward = 29.91
2022-01-26 14:16:29.072 | DEBUG    | __main__:trials:24 - Trial = 1143/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.074 | DEBUG    | __main__:trials:29 - Trial = 1143/30000 | Total reward = 51.24
2022-01-26 14:16:29.077 | DEBUG    | __main__:trials:24 - Trial = 1144/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.079 | DEBUG    | __main__:trials:29 - Trial = 1144/30000 | Total reward = 52.07
2022-01-26 14:16:29.083 | DEBUG    | __main__:trials:24 - Trial = 1145/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.084 | DEBUG    | __main__:trials:29 - Trial = 1145/30000 | Total reward = 45.51
2022-01-26 14:16:29.087 | DEBUG    | __main__:trials:26 - Trial = 1146/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.088 | DEBUG    | __main__:trials:29 - Trial = 1146/30000 | Total reward = 23.18
2022-01-26 14:16:29.092 | DEBUG    | __main__:trials:24 - Trial = 1147/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.093 | DEBUG    | __main__:trials:29 - Trial = 1147/30000 | Total reward = 51.34
2022-01-26 14:16:29.097 | DEBUG    | __main__:trials:26 - Trial = 1148/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.098 | DEBUG    | __main__:trials:29 - Trial = 1148/30000 | Total reward = 8.51
2022-01-26 14:16:29.102 | DEBUG    | __main__:trials:24 - Trial = 1149/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.103 | DEBUG    | __main__:trials:29 - Trial = 1149/30000 | Total reward = 43.76
2022-01-26 14:16:29.107 | DEBUG    | __main__:trials:24 - Trial = 1150/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.109 | DEBUG    | __main__:trials:29 - Trial = 1150/30000 | Total reward = 41.68
2022-01-26 14:16:29.111 | DEBUG    | __main__:trials:24 - Trial = 1151/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.113 | DEBUG    | __main__:trials:29 - Trial = 1151/30000 | Total reward = 41.98
2022-01-26 14:16:29.117 | DEBUG    | __main__:trials:24 - Trial = 1152/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.118 | DEBUG    | __main__:trials:29 - Trial = 1152/30000 | Total reward = 14.80
2022-01-26 14:16:29.122 | DEBUG    | __main__:trials:24 - Trial = 1153/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.123 | DEBUG    | __main__:trials:29 - Trial = 1153/30000 | Total reward = 44.40
2022-01-26 14:16:29.126 | DEBUG    | __main__:trials:24 - Trial = 1154/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.128 | DEBUG    | __main__:trials:29 - Trial = 1154/30000 | Total reward = 47.64
2022-01-26 14:16:29.130 | DEBUG    | __main__:trials:26 - Trial = 1155/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.132 | DEBUG    | __main__:trials:29 - Trial = 1155/30000 | Total reward = 15.42
2022-01-26 14:16:29.136 | DEBUG    | __main__:trials:24 - Trial = 1156/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.137 | DEBUG    | __main__:trials:29 - Trial = 1156/30000 | Total reward = 48.43
2022-01-26 14:16:29.141 | DEBUG    | __main__:trials:24 - Trial = 1157/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.142 | DEBUG    | __main__:trials:29 - Trial = 1157/30000 | Total reward = 52.38
2022-01-26 14:16:29.145 | DEBUG    | __main__:trials:24 - Trial = 1158/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.146 | DEBUG    | __main__:trials:29 - Trial = 1158/30000 | Total reward = 42.42
2022-01-26 14:16:29.150 | DEBUG    | __main__:trials:24 - Trial = 1159/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.152 | DEBUG    | __main__:trials:29 - Trial = 1159/30000 | Total reward = 48.80
2022-01-26 14:16:29.155 | DEBUG    | __main__:trials:24 - Trial = 1160/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.157 | DEBUG    | __main__:trials:29 - Trial = 1160/30000 | Total reward = 51.60
2022-01-26 14:16:29.160 | DEBUG    | __main__:trials:24 - Trial = 1161/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.160 | DEBUG    | __main__:trials:29 - Trial = 1161/30000 | Total reward = 38.24
2022-01-26 14:16:29.164 | DEBUG    | __main__:trials:24 - Trial = 1162/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.165 | DEBUG    | __main__:trials:29 - Trial = 1162/30000 | Total reward = 44.71
2022-01-26 14:16:29.168 | DEBUG    | __main__:trials:24 - Trial = 1163/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.169 | DEBUG    | __main__:trials:29 - Trial = 1163/30000 | Total reward = 50.81
2022-01-26 14:16:29.172 | DEBUG    | __main__:trials:24 - Trial = 1164/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.174 | DEBUG    | __main__:trials:29 - Trial = 1164/30000 | Total reward = 55.08
2022-01-26 14:16:29.177 | DEBUG    | __main__:trials:24 - Trial = 1165/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.178 | DEBUG    | __main__:trials:29 - Trial = 1165/30000 | Total reward = 49.73
2022-01-26 14:16:29.182 | DEBUG    | __main__:trials:24 - Trial = 1166/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.183 | DEBUG    | __main__:trials:29 - Trial = 1166/30000 | Total reward = 53.72
2022-01-26 14:16:29.186 | DEBUG    | __main__:trials:24 - Trial = 1167/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.188 | DEBUG    | __main__:trials:29 - Trial = 1167/30000 | Total reward = 58.62
2022-01-26 14:16:29.191 | DEBUG    | __main__:trials:24 - Trial = 1168/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.193 | DEBUG    | __main__:trials:29 - Trial = 1168/30000 | Total reward = 50.24
2022-01-26 14:16:29.196 | DEBUG    | __main__:trials:24 - Trial = 1169/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.198 | DEBUG    | __main__:trials:29 - Trial = 1169/30000 | Total reward = 51.26
2022-01-26 14:16:29.200 | DEBUG    | __main__:trials:24 - Trial = 1170/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.201 | DEBUG    | __main__:trials:29 - Trial = 1170/30000 | Total reward = 51.89
2022-01-26 14:16:29.205 | DEBUG    | __main__:trials:24 - Trial = 1171/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.207 | DEBUG    | __main__:trials:29 - Trial = 1171/30000 | Total reward = 42.31
2022-01-26 14:16:29.209 | DEBUG    | __main__:trials:24 - Trial = 1172/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.211 | DEBUG    | __main__:trials:29 - Trial = 1172/30000 | Total reward = 45.52
2022-01-26 14:16:29.213 | DEBUG    | __main__:trials:24 - Trial = 1173/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.214 | DEBUG    | __main__:trials:29 - Trial = 1173/30000 | Total reward = 47.26
2022-01-26 14:16:29.217 | DEBUG    | __main__:trials:24 - Trial = 1174/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.218 | DEBUG    | __main__:trials:29 - Trial = 1174/30000 | Total reward = 33.89
2022-01-26 14:16:29.221 | DEBUG    | __main__:trials:24 - Trial = 1175/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.223 | DEBUG    | __main__:trials:29 - Trial = 1175/30000 | Total reward = 47.94
2022-01-26 14:16:29.226 | DEBUG    | __main__:trials:24 - Trial = 1176/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.227 | DEBUG    | __main__:trials:29 - Trial = 1176/30000 | Total reward = 50.06
2022-01-26 14:16:29.230 | DEBUG    | __main__:trials:24 - Trial = 1177/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.230 | DEBUG    | __main__:trials:29 - Trial = 1177/30000 | Total reward = 45.65
2022-01-26 14:16:29.234 | DEBUG    | __main__:trials:24 - Trial = 1178/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.235 | DEBUG    | __main__:trials:29 - Trial = 1178/30000 | Total reward = 45.98
2022-01-26 14:16:29.238 | DEBUG    | __main__:trials:24 - Trial = 1179/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.240 | DEBUG    | __main__:trials:29 - Trial = 1179/30000 | Total reward = 55.06
2022-01-26 14:16:29.243 | DEBUG    | __main__:trials:24 - Trial = 1180/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.243 | DEBUG    | __main__:trials:29 - Trial = 1180/30000 | Total reward = 52.53
2022-01-26 14:16:29.246 | DEBUG    | __main__:trials:26 - Trial = 1181/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.248 | DEBUG    | __main__:trials:29 - Trial = 1181/30000 | Total reward = 28.72
2022-01-26 14:16:29.252 | DEBUG    | __main__:trials:24 - Trial = 1182/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.252 | DEBUG    | __main__:trials:29 - Trial = 1182/30000 | Total reward = 47.37
2022-01-26 14:16:29.256 | DEBUG    | __main__:trials:24 - Trial = 1183/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.256 | DEBUG    | __main__:trials:29 - Trial = 1183/30000 | Total reward = 48.48
2022-01-26 14:16:29.260 | DEBUG    | __main__:trials:24 - Trial = 1184/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.262 | DEBUG    | __main__:trials:29 - Trial = 1184/30000 | Total reward = 56.41
2022-01-26 14:16:29.265 | DEBUG    | __main__:trials:24 - Trial = 1185/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.266 | DEBUG    | __main__:trials:29 - Trial = 1185/30000 | Total reward = 51.40
2022-01-26 14:16:29.269 | DEBUG    | __main__:trials:24 - Trial = 1186/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.270 | DEBUG    | __main__:trials:29 - Trial = 1186/30000 | Total reward = 45.35
2022-01-26 14:16:29.274 | DEBUG    | __main__:trials:24 - Trial = 1187/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.275 | DEBUG    | __main__:trials:29 - Trial = 1187/30000 | Total reward = 43.79
2022-01-26 14:16:29.278 | DEBUG    | __main__:trials:24 - Trial = 1188/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.279 | DEBUG    | __main__:trials:29 - Trial = 1188/30000 | Total reward = 46.67
2022-01-26 14:16:29.282 | DEBUG    | __main__:trials:24 - Trial = 1189/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.283 | DEBUG    | __main__:trials:29 - Trial = 1189/30000 | Total reward = 45.58
2022-01-26 14:16:29.287 | DEBUG    | __main__:trials:24 - Trial = 1190/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.287 | DEBUG    | __main__:trials:29 - Trial = 1190/30000 | Total reward = 46.76
2022-01-26 14:16:29.291 | DEBUG    | __main__:trials:24 - Trial = 1191/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.292 | DEBUG    | __main__:trials:29 - Trial = 1191/30000 | Total reward = 47.47
2022-01-26 14:16:29.295 | DEBUG    | __main__:trials:24 - Trial = 1192/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.296 | DEBUG    | __main__:trials:29 - Trial = 1192/30000 | Total reward = 48.22
2022-01-26 14:16:29.299 | DEBUG    | __main__:trials:24 - Trial = 1193/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.300 | DEBUG    | __main__:trials:29 - Trial = 1193/30000 | Total reward = 54.83
2022-01-26 14:16:29.304 | DEBUG    | __main__:trials:24 - Trial = 1194/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.304 | DEBUG    | __main__:trials:29 - Trial = 1194/30000 | Total reward = 46.95
2022-01-26 14:16:29.308 | DEBUG    | __main__:trials:24 - Trial = 1195/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.308 | DEBUG    | __main__:trials:29 - Trial = 1195/30000 | Total reward = 51.41
2022-01-26 14:16:29.312 | DEBUG    | __main__:trials:24 - Trial = 1196/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.312 | DEBUG    | __main__:trials:29 - Trial = 1196/30000 | Total reward = 48.15
2022-01-26 14:16:29.316 | DEBUG    | __main__:trials:24 - Trial = 1197/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.317 | DEBUG    | __main__:trials:29 - Trial = 1197/30000 | Total reward = 43.44
2022-01-26 14:16:29.320 | DEBUG    | __main__:trials:26 - Trial = 1198/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.321 | DEBUG    | __main__:trials:29 - Trial = 1198/30000 | Total reward = 14.28
2022-01-26 14:16:29.324 | DEBUG    | __main__:trials:24 - Trial = 1199/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.326 | DEBUG    | __main__:trials:29 - Trial = 1199/30000 | Total reward = 49.86
2022-01-26 14:16:29.329 | DEBUG    | __main__:trials:24 - Trial = 1200/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.331 | DEBUG    | __main__:trials:29 - Trial = 1200/30000 | Total reward = 48.47
2022-01-26 14:16:29.335 | DEBUG    | __main__:trials:24 - Trial = 1201/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.335 | DEBUG    | __main__:trials:29 - Trial = 1201/30000 | Total reward = 49.81
2022-01-26 14:16:29.340 | DEBUG    | __main__:trials:24 - Trial = 1202/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.340 | DEBUG    | __main__:trials:29 - Trial = 1202/30000 | Total reward = 51.83
2022-01-26 14:16:29.345 | DEBUG    | __main__:trials:24 - Trial = 1203/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.347 | DEBUG    | __main__:trials:29 - Trial = 1203/30000 | Total reward = 49.81
2022-01-26 14:16:29.350 | DEBUG    | __main__:trials:24 - Trial = 1204/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.352 | DEBUG    | __main__:trials:29 - Trial = 1204/30000 | Total reward = 52.63
2022-01-26 14:16:29.355 | DEBUG    | __main__:trials:24 - Trial = 1205/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.356 | DEBUG    | __main__:trials:29 - Trial = 1205/30000 | Total reward = 44.91
2022-01-26 14:16:29.360 | DEBUG    | __main__:trials:24 - Trial = 1206/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.360 | DEBUG    | __main__:trials:29 - Trial = 1206/30000 | Total reward = 31.76
2022-01-26 14:16:29.365 | DEBUG    | __main__:trials:24 - Trial = 1207/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.365 | DEBUG    | __main__:trials:29 - Trial = 1207/30000 | Total reward = 51.34
2022-01-26 14:16:29.369 | DEBUG    | __main__:trials:26 - Trial = 1208/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.371 | DEBUG    | __main__:trials:29 - Trial = 1208/30000 | Total reward = 20.67
2022-01-26 14:16:29.374 | DEBUG    | __main__:trials:24 - Trial = 1209/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.376 | DEBUG    | __main__:trials:29 - Trial = 1209/30000 | Total reward = 50.82
2022-01-26 14:16:29.379 | DEBUG    | __main__:trials:24 - Trial = 1210/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.380 | DEBUG    | __main__:trials:29 - Trial = 1210/30000 | Total reward = 51.54
2022-01-26 14:16:29.383 | DEBUG    | __main__:trials:24 - Trial = 1211/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.385 | DEBUG    | __main__:trials:29 - Trial = 1211/30000 | Total reward = 51.24
2022-01-26 14:16:29.388 | DEBUG    | __main__:trials:24 - Trial = 1212/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.389 | DEBUG    | __main__:trials:29 - Trial = 1212/30000 | Total reward = 50.56
2022-01-26 14:16:29.392 | DEBUG    | __main__:trials:24 - Trial = 1213/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.394 | DEBUG    | __main__:trials:29 - Trial = 1213/30000 | Total reward = 52.39
2022-01-26 14:16:29.397 | DEBUG    | __main__:trials:24 - Trial = 1214/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.397 | DEBUG    | __main__:trials:29 - Trial = 1214/30000 | Total reward = 50.50
2022-01-26 14:16:29.402 | DEBUG    | __main__:trials:24 - Trial = 1215/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.403 | DEBUG    | __main__:trials:29 - Trial = 1215/30000 | Total reward = 45.23
2022-01-26 14:16:29.407 | DEBUG    | __main__:trials:24 - Trial = 1216/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.409 | DEBUG    | __main__:trials:29 - Trial = 1216/30000 | Total reward = 54.15
2022-01-26 14:16:29.412 | DEBUG    | __main__:trials:24 - Trial = 1217/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.414 | DEBUG    | __main__:trials:29 - Trial = 1217/30000 | Total reward = 53.63
2022-01-26 14:16:29.417 | DEBUG    | __main__:trials:24 - Trial = 1218/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.418 | DEBUG    | __main__:trials:29 - Trial = 1218/30000 | Total reward = 46.74
2022-01-26 14:16:29.422 | DEBUG    | __main__:trials:24 - Trial = 1219/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.424 | DEBUG    | __main__:trials:29 - Trial = 1219/30000 | Total reward = 50.18
2022-01-26 14:16:29.428 | DEBUG    | __main__:trials:24 - Trial = 1220/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.429 | DEBUG    | __main__:trials:29 - Trial = 1220/30000 | Total reward = 47.11
2022-01-26 14:16:29.433 | DEBUG    | __main__:trials:24 - Trial = 1221/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.434 | DEBUG    | __main__:trials:29 - Trial = 1221/30000 | Total reward = 47.03
2022-01-26 14:16:29.438 | DEBUG    | __main__:trials:24 - Trial = 1222/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.439 | DEBUG    | __main__:trials:29 - Trial = 1222/30000 | Total reward = 49.13
2022-01-26 14:16:29.443 | DEBUG    | __main__:trials:24 - Trial = 1223/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.444 | DEBUG    | __main__:trials:29 - Trial = 1223/30000 | Total reward = 49.60
2022-01-26 14:16:29.448 | DEBUG    | __main__:trials:24 - Trial = 1224/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.450 | DEBUG    | __main__:trials:29 - Trial = 1224/30000 | Total reward = 44.80
2022-01-26 14:16:29.453 | DEBUG    | __main__:trials:24 - Trial = 1225/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.454 | DEBUG    | __main__:trials:29 - Trial = 1225/30000 | Total reward = 48.16
2022-01-26 14:16:29.458 | DEBUG    | __main__:trials:26 - Trial = 1226/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.459 | DEBUG    | __main__:trials:29 - Trial = 1226/30000 | Total reward = 24.85
2022-01-26 14:16:29.463 | DEBUG    | __main__:trials:24 - Trial = 1227/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.464 | DEBUG    | __main__:trials:29 - Trial = 1227/30000 | Total reward = 50.83
2022-01-26 14:16:29.467 | DEBUG    | __main__:trials:26 - Trial = 1228/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.468 | DEBUG    | __main__:trials:29 - Trial = 1228/30000 | Total reward = 17.44
2022-01-26 14:16:29.473 | DEBUG    | __main__:trials:24 - Trial = 1229/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.474 | DEBUG    | __main__:trials:29 - Trial = 1229/30000 | Total reward = 29.32
2022-01-26 14:16:29.478 | DEBUG    | __main__:trials:24 - Trial = 1230/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.479 | DEBUG    | __main__:trials:29 - Trial = 1230/30000 | Total reward = 44.57
2022-01-26 14:16:29.483 | DEBUG    | __main__:trials:24 - Trial = 1231/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.483 | DEBUG    | __main__:trials:29 - Trial = 1231/30000 | Total reward = 59.07
2022-01-26 14:16:29.488 | DEBUG    | __main__:trials:24 - Trial = 1232/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.489 | DEBUG    | __main__:trials:29 - Trial = 1232/30000 | Total reward = 32.81
2022-01-26 14:16:29.493 | DEBUG    | __main__:trials:24 - Trial = 1233/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.494 | DEBUG    | __main__:trials:29 - Trial = 1233/30000 | Total reward = 25.59
2022-01-26 14:16:29.497 | DEBUG    | __main__:trials:24 - Trial = 1234/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.499 | DEBUG    | __main__:trials:29 - Trial = 1234/30000 | Total reward = 45.07
2022-01-26 14:16:29.502 | DEBUG    | __main__:trials:26 - Trial = 1235/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.504 | DEBUG    | __main__:trials:29 - Trial = 1235/30000 | Total reward = 20.83
2022-01-26 14:16:29.507 | DEBUG    | __main__:trials:24 - Trial = 1236/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.508 | DEBUG    | __main__:trials:29 - Trial = 1236/30000 | Total reward = 37.88
2022-01-26 14:16:29.511 | DEBUG    | __main__:trials:24 - Trial = 1237/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.513 | DEBUG    | __main__:trials:29 - Trial = 1237/30000 | Total reward = 43.51
2022-01-26 14:16:29.516 | DEBUG    | __main__:trials:26 - Trial = 1238/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.517 | DEBUG    | __main__:trials:29 - Trial = 1238/30000 | Total reward = 37.59
2022-01-26 14:16:29.520 | DEBUG    | __main__:trials:24 - Trial = 1239/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.521 | DEBUG    | __main__:trials:29 - Trial = 1239/30000 | Total reward = 44.05
2022-01-26 14:16:29.524 | DEBUG    | __main__:trials:24 - Trial = 1240/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.525 | DEBUG    | __main__:trials:29 - Trial = 1240/30000 | Total reward = 45.52
2022-01-26 14:16:29.528 | DEBUG    | __main__:trials:24 - Trial = 1241/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.530 | DEBUG    | __main__:trials:29 - Trial = 1241/30000 | Total reward = 54.74
2022-01-26 14:16:29.534 | DEBUG    | __main__:trials:24 - Trial = 1242/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.535 | DEBUG    | __main__:trials:29 - Trial = 1242/30000 | Total reward = 47.29
2022-01-26 14:16:29.539 | DEBUG    | __main__:trials:24 - Trial = 1243/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.539 | DEBUG    | __main__:trials:29 - Trial = 1243/30000 | Total reward = 44.00
2022-01-26 14:16:29.544 | DEBUG    | __main__:trials:24 - Trial = 1244/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.545 | DEBUG    | __main__:trials:29 - Trial = 1244/30000 | Total reward = 53.69
2022-01-26 14:16:29.549 | DEBUG    | __main__:trials:24 - Trial = 1245/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.551 | DEBUG    | __main__:trials:29 - Trial = 1245/30000 | Total reward = 48.99
2022-01-26 14:16:29.554 | DEBUG    | __main__:trials:24 - Trial = 1246/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.556 | DEBUG    | __main__:trials:29 - Trial = 1246/30000 | Total reward = 38.33
2022-01-26 14:16:29.559 | DEBUG    | __main__:trials:24 - Trial = 1247/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.560 | DEBUG    | __main__:trials:29 - Trial = 1247/30000 | Total reward = 44.60
2022-01-26 14:16:29.564 | DEBUG    | __main__:trials:24 - Trial = 1248/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.566 | DEBUG    | __main__:trials:29 - Trial = 1248/30000 | Total reward = 50.29
2022-01-26 14:16:29.569 | DEBUG    | __main__:trials:26 - Trial = 1249/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.570 | DEBUG    | __main__:trials:29 - Trial = 1249/30000 | Total reward = 18.19
2022-01-26 14:16:29.573 | DEBUG    | __main__:trials:24 - Trial = 1250/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.575 | DEBUG    | __main__:trials:29 - Trial = 1250/30000 | Total reward = 47.94
2022-01-26 14:16:29.577 | DEBUG    | __main__:trials:26 - Trial = 1251/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.578 | DEBUG    | __main__:trials:29 - Trial = 1251/30000 | Total reward = 10.14
2022-01-26 14:16:29.582 | DEBUG    | __main__:trials:26 - Trial = 1252/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.583 | DEBUG    | __main__:trials:29 - Trial = 1252/30000 | Total reward = 32.48
2022-01-26 14:16:29.587 | DEBUG    | __main__:trials:24 - Trial = 1253/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.588 | DEBUG    | __main__:trials:29 - Trial = 1253/30000 | Total reward = 55.57
2022-01-26 14:16:29.592 | DEBUG    | __main__:trials:24 - Trial = 1254/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.593 | DEBUG    | __main__:trials:29 - Trial = 1254/30000 | Total reward = 47.61
2022-01-26 14:16:29.597 | DEBUG    | __main__:trials:24 - Trial = 1255/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.598 | DEBUG    | __main__:trials:29 - Trial = 1255/30000 | Total reward = 40.20
2022-01-26 14:16:29.602 | DEBUG    | __main__:trials:24 - Trial = 1256/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.603 | DEBUG    | __main__:trials:29 - Trial = 1256/30000 | Total reward = 53.52
2022-01-26 14:16:29.606 | DEBUG    | __main__:trials:24 - Trial = 1257/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.608 | DEBUG    | __main__:trials:29 - Trial = 1257/30000 | Total reward = 57.22
2022-01-26 14:16:29.612 | DEBUG    | __main__:trials:24 - Trial = 1258/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.612 | DEBUG    | __main__:trials:29 - Trial = 1258/30000 | Total reward = 52.17
2022-01-26 14:16:29.617 | DEBUG    | __main__:trials:24 - Trial = 1259/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.617 | DEBUG    | __main__:trials:29 - Trial = 1259/30000 | Total reward = 45.14
2022-01-26 14:16:29.622 | DEBUG    | __main__:trials:24 - Trial = 1260/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.622 | DEBUG    | __main__:trials:29 - Trial = 1260/30000 | Total reward = 57.90
2022-01-26 14:16:29.626 | DEBUG    | __main__:trials:24 - Trial = 1261/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.628 | DEBUG    | __main__:trials:29 - Trial = 1261/30000 | Total reward = 42.95
2022-01-26 14:16:29.631 | DEBUG    | __main__:trials:24 - Trial = 1262/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.633 | DEBUG    | __main__:trials:29 - Trial = 1262/30000 | Total reward = 47.69
2022-01-26 14:16:29.636 | DEBUG    | __main__:trials:24 - Trial = 1263/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.637 | DEBUG    | __main__:trials:29 - Trial = 1263/30000 | Total reward = 51.44
2022-01-26 14:16:29.640 | DEBUG    | __main__:trials:26 - Trial = 1264/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.641 | DEBUG    | __main__:trials:29 - Trial = 1264/30000 | Total reward = 20.67
2022-01-26 14:16:29.644 | DEBUG    | __main__:trials:24 - Trial = 1265/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.646 | DEBUG    | __main__:trials:29 - Trial = 1265/30000 | Total reward = 47.24
2022-01-26 14:16:29.649 | DEBUG    | __main__:trials:24 - Trial = 1266/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.651 | DEBUG    | __main__:trials:29 - Trial = 1266/30000 | Total reward = 49.80
2022-01-26 14:16:29.654 | DEBUG    | __main__:trials:24 - Trial = 1267/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.656 | DEBUG    | __main__:trials:29 - Trial = 1267/30000 | Total reward = 30.50
2022-01-26 14:16:29.659 | DEBUG    | __main__:trials:24 - Trial = 1268/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.661 | DEBUG    | __main__:trials:29 - Trial = 1268/30000 | Total reward = 52.87
2022-01-26 14:16:29.664 | DEBUG    | __main__:trials:24 - Trial = 1269/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.666 | DEBUG    | __main__:trials:29 - Trial = 1269/30000 | Total reward = 49.85
2022-01-26 14:16:29.668 | DEBUG    | __main__:trials:26 - Trial = 1270/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.670 | DEBUG    | __main__:trials:29 - Trial = 1270/30000 | Total reward = 9.34
2022-01-26 14:16:29.673 | DEBUG    | __main__:trials:24 - Trial = 1271/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.675 | DEBUG    | __main__:trials:29 - Trial = 1271/30000 | Total reward = 45.82
2022-01-26 14:16:29.678 | DEBUG    | __main__:trials:24 - Trial = 1272/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.680 | DEBUG    | __main__:trials:29 - Trial = 1272/30000 | Total reward = 33.03
2022-01-26 14:16:29.683 | DEBUG    | __main__:trials:24 - Trial = 1273/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.684 | DEBUG    | __main__:trials:29 - Trial = 1273/30000 | Total reward = 44.96
2022-01-26 14:16:29.688 | DEBUG    | __main__:trials:24 - Trial = 1274/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.689 | DEBUG    | __main__:trials:29 - Trial = 1274/30000 | Total reward = 55.67
2022-01-26 14:16:29.692 | DEBUG    | __main__:trials:24 - Trial = 1275/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.694 | DEBUG    | __main__:trials:29 - Trial = 1275/30000 | Total reward = 38.44
2022-01-26 14:16:29.698 | DEBUG    | __main__:trials:24 - Trial = 1276/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.698 | DEBUG    | __main__:trials:29 - Trial = 1276/30000 | Total reward = 38.03
2022-01-26 14:16:29.703 | DEBUG    | __main__:trials:24 - Trial = 1277/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.704 | DEBUG    | __main__:trials:29 - Trial = 1277/30000 | Total reward = 45.85
2022-01-26 14:16:29.708 | DEBUG    | __main__:trials:24 - Trial = 1278/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.708 | DEBUG    | __main__:trials:29 - Trial = 1278/30000 | Total reward = 45.14
2022-01-26 14:16:29.712 | DEBUG    | __main__:trials:24 - Trial = 1279/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.714 | DEBUG    | __main__:trials:29 - Trial = 1279/30000 | Total reward = 46.27
2022-01-26 14:16:29.717 | DEBUG    | __main__:trials:24 - Trial = 1280/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.718 | DEBUG    | __main__:trials:29 - Trial = 1280/30000 | Total reward = 42.17
2022-01-26 14:16:29.723 | DEBUG    | __main__:trials:24 - Trial = 1281/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.724 | DEBUG    | __main__:trials:29 - Trial = 1281/30000 | Total reward = 52.28
2022-01-26 14:16:29.728 | DEBUG    | __main__:trials:24 - Trial = 1282/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.729 | DEBUG    | __main__:trials:29 - Trial = 1282/30000 | Total reward = 37.91
2022-01-26 14:16:29.733 | DEBUG    | __main__:trials:24 - Trial = 1283/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.735 | DEBUG    | __main__:trials:29 - Trial = 1283/30000 | Total reward = 50.26
2022-01-26 14:16:29.738 | DEBUG    | __main__:trials:24 - Trial = 1284/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.739 | DEBUG    | __main__:trials:29 - Trial = 1284/30000 | Total reward = 38.40
2022-01-26 14:16:29.743 | DEBUG    | __main__:trials:24 - Trial = 1285/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.745 | DEBUG    | __main__:trials:29 - Trial = 1285/30000 | Total reward = 45.06
2022-01-26 14:16:29.748 | DEBUG    | __main__:trials:24 - Trial = 1286/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.750 | DEBUG    | __main__:trials:29 - Trial = 1286/30000 | Total reward = 47.26
2022-01-26 14:16:29.754 | DEBUG    | __main__:trials:24 - Trial = 1287/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.755 | DEBUG    | __main__:trials:29 - Trial = 1287/30000 | Total reward = 35.18
2022-01-26 14:16:29.758 | DEBUG    | __main__:trials:24 - Trial = 1288/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.760 | DEBUG    | __main__:trials:29 - Trial = 1288/30000 | Total reward = 48.27
2022-01-26 14:16:29.763 | DEBUG    | __main__:trials:24 - Trial = 1289/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.765 | DEBUG    | __main__:trials:29 - Trial = 1289/30000 | Total reward = 52.10
2022-01-26 14:16:29.768 | DEBUG    | __main__:trials:26 - Trial = 1290/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.770 | DEBUG    | __main__:trials:29 - Trial = 1290/30000 | Total reward = 32.82
2022-01-26 14:16:29.773 | DEBUG    | __main__:trials:24 - Trial = 1291/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.774 | DEBUG    | __main__:trials:29 - Trial = 1291/30000 | Total reward = 39.08
2022-01-26 14:16:29.779 | DEBUG    | __main__:trials:24 - Trial = 1292/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.780 | DEBUG    | __main__:trials:29 - Trial = 1292/30000 | Total reward = 50.57
2022-01-26 14:16:29.783 | DEBUG    | __main__:trials:24 - Trial = 1293/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.785 | DEBUG    | __main__:trials:29 - Trial = 1293/30000 | Total reward = 14.64
2022-01-26 14:16:29.787 | DEBUG    | __main__:trials:24 - Trial = 1294/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.789 | DEBUG    | __main__:trials:29 - Trial = 1294/30000 | Total reward = 44.56
2022-01-26 14:16:29.793 | DEBUG    | __main__:trials:24 - Trial = 1295/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.794 | DEBUG    | __main__:trials:29 - Trial = 1295/30000 | Total reward = 37.83
2022-01-26 14:16:29.796 | DEBUG    | __main__:trials:26 - Trial = 1296/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.798 | DEBUG    | __main__:trials:29 - Trial = 1296/30000 | Total reward = 16.57
2022-01-26 14:16:29.801 | DEBUG    | __main__:trials:24 - Trial = 1297/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.803 | DEBUG    | __main__:trials:29 - Trial = 1297/30000 | Total reward = 24.08
2022-01-26 14:16:29.805 | DEBUG    | __main__:trials:26 - Trial = 1298/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.806 | DEBUG    | __main__:trials:29 - Trial = 1298/30000 | Total reward = 19.61
2022-01-26 14:16:29.809 | DEBUG    | __main__:trials:24 - Trial = 1299/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.811 | DEBUG    | __main__:trials:29 - Trial = 1299/30000 | Total reward = 52.45
2022-01-26 14:16:29.815 | DEBUG    | __main__:trials:24 - Trial = 1300/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.816 | DEBUG    | __main__:trials:29 - Trial = 1300/30000 | Total reward = 53.94
2022-01-26 14:16:29.819 | DEBUG    | __main__:trials:24 - Trial = 1301/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.821 | DEBUG    | __main__:trials:29 - Trial = 1301/30000 | Total reward = 50.52
2022-01-26 14:16:29.824 | DEBUG    | __main__:trials:24 - Trial = 1302/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.825 | DEBUG    | __main__:trials:29 - Trial = 1302/30000 | Total reward = 45.92
2022-01-26 14:16:29.829 | DEBUG    | __main__:trials:24 - Trial = 1303/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.836 | DEBUG    | __main__:trials:29 - Trial = 1303/30000 | Total reward = 50.86
2022-01-26 14:16:29.839 | DEBUG    | __main__:trials:24 - Trial = 1304/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.840 | DEBUG    | __main__:trials:29 - Trial = 1304/30000 | Total reward = 48.26
2022-01-26 14:16:29.844 | DEBUG    | __main__:trials:24 - Trial = 1305/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.846 | DEBUG    | __main__:trials:29 - Trial = 1305/30000 | Total reward = 52.47
2022-01-26 14:16:29.849 | DEBUG    | __main__:trials:24 - Trial = 1306/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.851 | DEBUG    | __main__:trials:29 - Trial = 1306/30000 | Total reward = 53.46
2022-01-26 14:16:29.854 | DEBUG    | __main__:trials:24 - Trial = 1307/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.856 | DEBUG    | __main__:trials:29 - Trial = 1307/30000 | Total reward = 49.40
2022-01-26 14:16:29.859 | DEBUG    | __main__:trials:24 - Trial = 1308/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.861 | DEBUG    | __main__:trials:29 - Trial = 1308/30000 | Total reward = 43.21
2022-01-26 14:16:29.864 | DEBUG    | __main__:trials:24 - Trial = 1309/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.866 | DEBUG    | __main__:trials:29 - Trial = 1309/30000 | Total reward = 49.42
2022-01-26 14:16:29.869 | DEBUG    | __main__:trials:24 - Trial = 1310/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.870 | DEBUG    | __main__:trials:29 - Trial = 1310/30000 | Total reward = 53.96
2022-01-26 14:16:29.875 | DEBUG    | __main__:trials:24 - Trial = 1311/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.876 | DEBUG    | __main__:trials:29 - Trial = 1311/30000 | Total reward = 61.75
2022-01-26 14:16:29.880 | DEBUG    | __main__:trials:26 - Trial = 1312/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.881 | DEBUG    | __main__:trials:29 - Trial = 1312/30000 | Total reward = 28.53
2022-01-26 14:16:29.885 | DEBUG    | __main__:trials:24 - Trial = 1313/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.887 | DEBUG    | __main__:trials:29 - Trial = 1313/30000 | Total reward = 55.80
2022-01-26 14:16:29.891 | DEBUG    | __main__:trials:24 - Trial = 1314/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.893 | DEBUG    | __main__:trials:29 - Trial = 1314/30000 | Total reward = 59.37
2022-01-26 14:16:29.896 | DEBUG    | __main__:trials:26 - Trial = 1315/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:29.898 | DEBUG    | __main__:trials:29 - Trial = 1315/30000 | Total reward = 43.02
2022-01-26 14:16:29.902 | DEBUG    | __main__:trials:24 - Trial = 1316/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.903 | DEBUG    | __main__:trials:29 - Trial = 1316/30000 | Total reward = 49.83
2022-01-26 14:16:29.907 | DEBUG    | __main__:trials:24 - Trial = 1317/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.908 | DEBUG    | __main__:trials:29 - Trial = 1317/30000 | Total reward = 42.20
2022-01-26 14:16:29.912 | DEBUG    | __main__:trials:24 - Trial = 1318/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.912 | DEBUG    | __main__:trials:29 - Trial = 1318/30000 | Total reward = 44.85
2022-01-26 14:16:29.916 | DEBUG    | __main__:trials:24 - Trial = 1319/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.918 | DEBUG    | __main__:trials:29 - Trial = 1319/30000 | Total reward = 48.51
2022-01-26 14:16:29.921 | DEBUG    | __main__:trials:24 - Trial = 1320/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.921 | DEBUG    | __main__:trials:29 - Trial = 1320/30000 | Total reward = 47.30
2022-01-26 14:16:29.926 | DEBUG    | __main__:trials:24 - Trial = 1321/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.927 | DEBUG    | __main__:trials:29 - Trial = 1321/30000 | Total reward = 46.50
2022-01-26 14:16:29.930 | DEBUG    | __main__:trials:24 - Trial = 1322/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.932 | DEBUG    | __main__:trials:29 - Trial = 1322/30000 | Total reward = 47.52
2022-01-26 14:16:29.936 | DEBUG    | __main__:trials:24 - Trial = 1323/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.937 | DEBUG    | __main__:trials:29 - Trial = 1323/30000 | Total reward = 43.24
2022-01-26 14:16:29.940 | DEBUG    | __main__:trials:24 - Trial = 1324/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.942 | DEBUG    | __main__:trials:29 - Trial = 1324/30000 | Total reward = 42.22
2022-01-26 14:16:29.945 | DEBUG    | __main__:trials:24 - Trial = 1325/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.946 | DEBUG    | __main__:trials:29 - Trial = 1325/30000 | Total reward = 56.93
2022-01-26 14:16:29.949 | DEBUG    | __main__:trials:24 - Trial = 1326/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.950 | DEBUG    | __main__:trials:29 - Trial = 1326/30000 | Total reward = 44.30
2022-01-26 14:16:29.954 | DEBUG    | __main__:trials:24 - Trial = 1327/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.955 | DEBUG    | __main__:trials:29 - Trial = 1327/30000 | Total reward = 50.70
2022-01-26 14:16:29.959 | DEBUG    | __main__:trials:24 - Trial = 1328/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.961 | DEBUG    | __main__:trials:29 - Trial = 1328/30000 | Total reward = 59.64
2022-01-26 14:16:29.964 | DEBUG    | __main__:trials:24 - Trial = 1329/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.966 | DEBUG    | __main__:trials:29 - Trial = 1329/30000 | Total reward = 55.77
2022-01-26 14:16:29.969 | DEBUG    | __main__:trials:24 - Trial = 1330/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.970 | DEBUG    | __main__:trials:29 - Trial = 1330/30000 | Total reward = 57.45
2022-01-26 14:16:29.974 | DEBUG    | __main__:trials:24 - Trial = 1331/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.975 | DEBUG    | __main__:trials:29 - Trial = 1331/30000 | Total reward = 43.86
2022-01-26 14:16:29.979 | DEBUG    | __main__:trials:24 - Trial = 1332/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.980 | DEBUG    | __main__:trials:29 - Trial = 1332/30000 | Total reward = 51.30
2022-01-26 14:16:29.983 | DEBUG    | __main__:trials:24 - Trial = 1333/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.985 | DEBUG    | __main__:trials:29 - Trial = 1333/30000 | Total reward = 48.13
2022-01-26 14:16:29.989 | DEBUG    | __main__:trials:24 - Trial = 1334/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.990 | DEBUG    | __main__:trials:29 - Trial = 1334/30000 | Total reward = 49.21
2022-01-26 14:16:29.993 | DEBUG    | __main__:trials:24 - Trial = 1335/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.994 | DEBUG    | __main__:trials:29 - Trial = 1335/30000 | Total reward = 54.44
2022-01-26 14:16:29.997 | DEBUG    | __main__:trials:24 - Trial = 1336/30000 | Max number of steps (20) reached
2022-01-26 14:16:29.999 | DEBUG    | __main__:trials:29 - Trial = 1336/30000 | Total reward = 53.48
2022-01-26 14:16:30.001 | DEBUG    | __main__:trials:24 - Trial = 1337/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.003 | DEBUG    | __main__:trials:29 - Trial = 1337/30000 | Total reward = 60.51
2022-01-26 14:16:30.006 | DEBUG    | __main__:trials:24 - Trial = 1338/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.007 | DEBUG    | __main__:trials:29 - Trial = 1338/30000 | Total reward = 49.25
2022-01-26 14:16:30.010 | DEBUG    | __main__:trials:24 - Trial = 1339/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.012 | DEBUG    | __main__:trials:29 - Trial = 1339/30000 | Total reward = 53.84
2022-01-26 14:16:30.014 | DEBUG    | __main__:trials:26 - Trial = 1340/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.015 | DEBUG    | __main__:trials:29 - Trial = 1340/30000 | Total reward = 13.86
2022-01-26 14:16:30.019 | DEBUG    | __main__:trials:24 - Trial = 1341/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.020 | DEBUG    | __main__:trials:29 - Trial = 1341/30000 | Total reward = 26.07
2022-01-26 14:16:30.023 | DEBUG    | __main__:trials:24 - Trial = 1342/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.025 | DEBUG    | __main__:trials:29 - Trial = 1342/30000 | Total reward = 52.73
2022-01-26 14:16:30.029 | DEBUG    | __main__:trials:24 - Trial = 1343/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.029 | DEBUG    | __main__:trials:29 - Trial = 1343/30000 | Total reward = 60.10
2022-01-26 14:16:30.033 | DEBUG    | __main__:trials:26 - Trial = 1344/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.033 | DEBUG    | __main__:trials:29 - Trial = 1344/30000 | Total reward = 30.86
2022-01-26 14:16:30.038 | DEBUG    | __main__:trials:24 - Trial = 1345/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.039 | DEBUG    | __main__:trials:29 - Trial = 1345/30000 | Total reward = 37.32
2022-01-26 14:16:30.042 | DEBUG    | __main__:trials:24 - Trial = 1346/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.044 | DEBUG    | __main__:trials:29 - Trial = 1346/30000 | Total reward = 36.05
2022-01-26 14:16:30.047 | DEBUG    | __main__:trials:26 - Trial = 1347/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.048 | DEBUG    | __main__:trials:29 - Trial = 1347/30000 | Total reward = 35.13
2022-01-26 14:16:30.052 | DEBUG    | __main__:trials:24 - Trial = 1348/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.053 | DEBUG    | __main__:trials:29 - Trial = 1348/30000 | Total reward = 57.21
2022-01-26 14:16:30.056 | DEBUG    | __main__:trials:24 - Trial = 1349/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.058 | DEBUG    | __main__:trials:29 - Trial = 1349/30000 | Total reward = 53.61
2022-01-26 14:16:30.062 | DEBUG    | __main__:trials:24 - Trial = 1350/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.063 | DEBUG    | __main__:trials:29 - Trial = 1350/30000 | Total reward = 59.02
2022-01-26 14:16:30.067 | DEBUG    | __main__:trials:24 - Trial = 1351/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.068 | DEBUG    | __main__:trials:29 - Trial = 1351/30000 | Total reward = 54.44
2022-01-26 14:16:30.071 | DEBUG    | __main__:trials:24 - Trial = 1352/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.073 | DEBUG    | __main__:trials:29 - Trial = 1352/30000 | Total reward = 63.92
2022-01-26 14:16:30.076 | DEBUG    | __main__:trials:24 - Trial = 1353/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.077 | DEBUG    | __main__:trials:29 - Trial = 1353/30000 | Total reward = 56.15
2022-01-26 14:16:30.081 | DEBUG    | __main__:trials:24 - Trial = 1354/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.083 | DEBUG    | __main__:trials:29 - Trial = 1354/30000 | Total reward = 57.52
2022-01-26 14:16:30.087 | DEBUG    | __main__:trials:24 - Trial = 1355/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.087 | DEBUG    | __main__:trials:29 - Trial = 1355/30000 | Total reward = 56.81
2022-01-26 14:16:30.091 | DEBUG    | __main__:trials:24 - Trial = 1356/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.093 | DEBUG    | __main__:trials:29 - Trial = 1356/30000 | Total reward = 5.52
2022-01-26 14:16:30.096 | DEBUG    | __main__:trials:24 - Trial = 1357/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.097 | DEBUG    | __main__:trials:29 - Trial = 1357/30000 | Total reward = 51.01
2022-01-26 14:16:30.101 | DEBUG    | __main__:trials:24 - Trial = 1358/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.103 | DEBUG    | __main__:trials:29 - Trial = 1358/30000 | Total reward = 50.80
2022-01-26 14:16:30.107 | DEBUG    | __main__:trials:24 - Trial = 1359/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.107 | DEBUG    | __main__:trials:29 - Trial = 1359/30000 | Total reward = 54.44
2022-01-26 14:16:30.112 | DEBUG    | __main__:trials:24 - Trial = 1360/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.112 | DEBUG    | __main__:trials:29 - Trial = 1360/30000 | Total reward = 66.04
2022-01-26 14:16:30.116 | DEBUG    | __main__:trials:24 - Trial = 1361/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.117 | DEBUG    | __main__:trials:29 - Trial = 1361/30000 | Total reward = 45.86
2022-01-26 14:16:30.121 | DEBUG    | __main__:trials:24 - Trial = 1362/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.121 | DEBUG    | __main__:trials:29 - Trial = 1362/30000 | Total reward = 52.64
2022-01-26 14:16:30.125 | DEBUG    | __main__:trials:24 - Trial = 1363/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.126 | DEBUG    | __main__:trials:29 - Trial = 1363/30000 | Total reward = 50.26
2022-01-26 14:16:30.130 | DEBUG    | __main__:trials:24 - Trial = 1364/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.131 | DEBUG    | __main__:trials:29 - Trial = 1364/30000 | Total reward = 68.86
2022-01-26 14:16:30.135 | DEBUG    | __main__:trials:24 - Trial = 1365/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.135 | DEBUG    | __main__:trials:29 - Trial = 1365/30000 | Total reward = 55.31
2022-01-26 14:16:30.139 | DEBUG    | __main__:trials:26 - Trial = 1366/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.141 | DEBUG    | __main__:trials:29 - Trial = 1366/30000 | Total reward = 30.19
2022-01-26 14:16:30.145 | DEBUG    | __main__:trials:24 - Trial = 1367/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.146 | DEBUG    | __main__:trials:29 - Trial = 1367/30000 | Total reward = 45.89
2022-01-26 14:16:30.149 | DEBUG    | __main__:trials:24 - Trial = 1368/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.150 | DEBUG    | __main__:trials:29 - Trial = 1368/30000 | Total reward = 43.77
2022-01-26 14:16:30.153 | DEBUG    | __main__:trials:24 - Trial = 1369/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.154 | DEBUG    | __main__:trials:29 - Trial = 1369/30000 | Total reward = 40.13
2022-01-26 14:16:30.158 | DEBUG    | __main__:trials:24 - Trial = 1370/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.159 | DEBUG    | __main__:trials:29 - Trial = 1370/30000 | Total reward = 54.79
2022-01-26 14:16:30.162 | DEBUG    | __main__:trials:24 - Trial = 1371/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.163 | DEBUG    | __main__:trials:29 - Trial = 1371/30000 | Total reward = 54.57
2022-01-26 14:16:30.166 | DEBUG    | __main__:trials:24 - Trial = 1372/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.168 | DEBUG    | __main__:trials:29 - Trial = 1372/30000 | Total reward = 49.99
2022-01-26 14:16:30.171 | DEBUG    | __main__:trials:24 - Trial = 1373/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.172 | DEBUG    | __main__:trials:29 - Trial = 1373/30000 | Total reward = 55.95
2022-01-26 14:16:30.176 | DEBUG    | __main__:trials:24 - Trial = 1374/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.177 | DEBUG    | __main__:trials:29 - Trial = 1374/30000 | Total reward = 35.66
2022-01-26 14:16:30.180 | DEBUG    | __main__:trials:24 - Trial = 1375/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.182 | DEBUG    | __main__:trials:29 - Trial = 1375/30000 | Total reward = 21.56
2022-01-26 14:16:30.186 | DEBUG    | __main__:trials:24 - Trial = 1376/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.186 | DEBUG    | __main__:trials:29 - Trial = 1376/30000 | Total reward = 37.33
2022-01-26 14:16:30.189 | DEBUG    | __main__:trials:26 - Trial = 1377/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.190 | DEBUG    | __main__:trials:29 - Trial = 1377/30000 | Total reward = 24.86
2022-01-26 14:16:30.193 | DEBUG    | __main__:trials:24 - Trial = 1378/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.194 | DEBUG    | __main__:trials:29 - Trial = 1378/30000 | Total reward = 54.44
2022-01-26 14:16:30.197 | DEBUG    | __main__:trials:24 - Trial = 1379/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.197 | DEBUG    | __main__:trials:29 - Trial = 1379/30000 | Total reward = 56.25
2022-01-26 14:16:30.202 | DEBUG    | __main__:trials:24 - Trial = 1380/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.203 | DEBUG    | __main__:trials:29 - Trial = 1380/30000 | Total reward = 54.44
2022-01-26 14:16:30.206 | DEBUG    | __main__:trials:26 - Trial = 1381/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.207 | DEBUG    | __main__:trials:29 - Trial = 1381/30000 | Total reward = 24.09
2022-01-26 14:16:30.211 | DEBUG    | __main__:trials:24 - Trial = 1382/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.212 | DEBUG    | __main__:trials:29 - Trial = 1382/30000 | Total reward = 27.58
2022-01-26 14:16:30.215 | DEBUG    | __main__:trials:24 - Trial = 1383/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.217 | DEBUG    | __main__:trials:29 - Trial = 1383/30000 | Total reward = 58.39
2022-01-26 14:16:30.220 | DEBUG    | __main__:trials:24 - Trial = 1384/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.222 | DEBUG    | __main__:trials:29 - Trial = 1384/30000 | Total reward = 54.47
2022-01-26 14:16:30.225 | DEBUG    | __main__:trials:24 - Trial = 1385/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.226 | DEBUG    | __main__:trials:29 - Trial = 1385/30000 | Total reward = 54.17
2022-01-26 14:16:30.230 | DEBUG    | __main__:trials:24 - Trial = 1386/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.232 | DEBUG    | __main__:trials:29 - Trial = 1386/30000 | Total reward = 53.06
2022-01-26 14:16:30.236 | DEBUG    | __main__:trials:24 - Trial = 1387/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.236 | DEBUG    | __main__:trials:29 - Trial = 1387/30000 | Total reward = 52.75
2022-01-26 14:16:30.241 | DEBUG    | __main__:trials:24 - Trial = 1388/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.242 | DEBUG    | __main__:trials:29 - Trial = 1388/30000 | Total reward = 53.17
2022-01-26 14:16:30.245 | DEBUG    | __main__:trials:26 - Trial = 1389/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.246 | DEBUG    | __main__:trials:29 - Trial = 1389/30000 | Total reward = 29.99
2022-01-26 14:16:30.249 | DEBUG    | __main__:trials:24 - Trial = 1390/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.251 | DEBUG    | __main__:trials:29 - Trial = 1390/30000 | Total reward = 46.09
2022-01-26 14:16:30.254 | DEBUG    | __main__:trials:24 - Trial = 1391/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.256 | DEBUG    | __main__:trials:29 - Trial = 1391/30000 | Total reward = 56.27
2022-01-26 14:16:30.259 | DEBUG    | __main__:trials:24 - Trial = 1392/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.261 | DEBUG    | __main__:trials:29 - Trial = 1392/30000 | Total reward = 54.44
2022-01-26 14:16:30.264 | DEBUG    | __main__:trials:24 - Trial = 1393/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.265 | DEBUG    | __main__:trials:29 - Trial = 1393/30000 | Total reward = 50.80
2022-01-26 14:16:30.268 | DEBUG    | __main__:trials:24 - Trial = 1394/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.270 | DEBUG    | __main__:trials:29 - Trial = 1394/30000 | Total reward = 47.52
2022-01-26 14:16:30.273 | DEBUG    | __main__:trials:24 - Trial = 1395/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.274 | DEBUG    | __main__:trials:29 - Trial = 1395/30000 | Total reward = 59.79
2022-01-26 14:16:30.277 | DEBUG    | __main__:trials:24 - Trial = 1396/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.279 | DEBUG    | __main__:trials:29 - Trial = 1396/30000 | Total reward = 66.11
2022-01-26 14:16:30.281 | DEBUG    | __main__:trials:24 - Trial = 1397/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.283 | DEBUG    | __main__:trials:29 - Trial = 1397/30000 | Total reward = 56.15
2022-01-26 14:16:30.287 | DEBUG    | __main__:trials:24 - Trial = 1398/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.288 | DEBUG    | __main__:trials:29 - Trial = 1398/30000 | Total reward = 55.62
2022-01-26 14:16:30.292 | DEBUG    | __main__:trials:24 - Trial = 1399/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.293 | DEBUG    | __main__:trials:29 - Trial = 1399/30000 | Total reward = 47.10
2022-01-26 14:16:30.297 | DEBUG    | __main__:trials:24 - Trial = 1400/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.298 | DEBUG    | __main__:trials:29 - Trial = 1400/30000 | Total reward = 33.83
2022-01-26 14:16:30.302 | DEBUG    | __main__:trials:24 - Trial = 1401/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.303 | DEBUG    | __main__:trials:29 - Trial = 1401/30000 | Total reward = 32.64
2022-01-26 14:16:30.306 | DEBUG    | __main__:trials:24 - Trial = 1402/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.308 | DEBUG    | __main__:trials:29 - Trial = 1402/30000 | Total reward = 57.28
2022-01-26 14:16:30.312 | DEBUG    | __main__:trials:24 - Trial = 1403/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.313 | DEBUG    | __main__:trials:29 - Trial = 1403/30000 | Total reward = 56.99
2022-01-26 14:16:30.317 | DEBUG    | __main__:trials:24 - Trial = 1404/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.317 | DEBUG    | __main__:trials:29 - Trial = 1404/30000 | Total reward = 52.21
2022-01-26 14:16:30.322 | DEBUG    | __main__:trials:24 - Trial = 1405/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.322 | DEBUG    | __main__:trials:29 - Trial = 1405/30000 | Total reward = 56.44
2022-01-26 14:16:30.327 | DEBUG    | __main__:trials:24 - Trial = 1406/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.328 | DEBUG    | __main__:trials:29 - Trial = 1406/30000 | Total reward = 51.66
2022-01-26 14:16:30.331 | DEBUG    | __main__:trials:24 - Trial = 1407/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.333 | DEBUG    | __main__:trials:29 - Trial = 1407/30000 | Total reward = 52.19
2022-01-26 14:16:30.336 | DEBUG    | __main__:trials:24 - Trial = 1408/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.338 | DEBUG    | __main__:trials:29 - Trial = 1408/30000 | Total reward = 49.59
2022-01-26 14:16:30.341 | DEBUG    | __main__:trials:24 - Trial = 1409/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.342 | DEBUG    | __main__:trials:29 - Trial = 1409/30000 | Total reward = 47.96
2022-01-26 14:16:30.346 | DEBUG    | __main__:trials:24 - Trial = 1410/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.346 | DEBUG    | __main__:trials:29 - Trial = 1410/30000 | Total reward = 62.21
2022-01-26 14:16:30.350 | DEBUG    | __main__:trials:24 - Trial = 1411/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.352 | DEBUG    | __main__:trials:29 - Trial = 1411/30000 | Total reward = 50.41
2022-01-26 14:16:30.355 | DEBUG    | __main__:trials:24 - Trial = 1412/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.356 | DEBUG    | __main__:trials:29 - Trial = 1412/30000 | Total reward = 41.94
2022-01-26 14:16:30.360 | DEBUG    | __main__:trials:24 - Trial = 1413/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.361 | DEBUG    | __main__:trials:29 - Trial = 1413/30000 | Total reward = 52.40
2022-01-26 14:16:30.365 | DEBUG    | __main__:trials:26 - Trial = 1414/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.366 | DEBUG    | __main__:trials:29 - Trial = 1414/30000 | Total reward = 30.46
2022-01-26 14:16:30.369 | DEBUG    | __main__:trials:24 - Trial = 1415/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.370 | DEBUG    | __main__:trials:29 - Trial = 1415/30000 | Total reward = 27.35
2022-01-26 14:16:30.373 | DEBUG    | __main__:trials:24 - Trial = 1416/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.374 | DEBUG    | __main__:trials:29 - Trial = 1416/30000 | Total reward = 53.65
2022-01-26 14:16:30.377 | DEBUG    | __main__:trials:24 - Trial = 1417/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.379 | DEBUG    | __main__:trials:29 - Trial = 1417/30000 | Total reward = 51.81
2022-01-26 14:16:30.382 | DEBUG    | __main__:trials:24 - Trial = 1418/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.384 | DEBUG    | __main__:trials:29 - Trial = 1418/30000 | Total reward = 57.17
2022-01-26 14:16:30.387 | DEBUG    | __main__:trials:24 - Trial = 1419/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.389 | DEBUG    | __main__:trials:29 - Trial = 1419/30000 | Total reward = 50.49
2022-01-26 14:16:30.392 | DEBUG    | __main__:trials:24 - Trial = 1420/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.393 | DEBUG    | __main__:trials:29 - Trial = 1420/30000 | Total reward = 57.67
2022-01-26 14:16:30.397 | DEBUG    | __main__:trials:24 - Trial = 1421/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.398 | DEBUG    | __main__:trials:29 - Trial = 1421/30000 | Total reward = 53.33
2022-01-26 14:16:30.401 | DEBUG    | __main__:trials:24 - Trial = 1422/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.402 | DEBUG    | __main__:trials:29 - Trial = 1422/30000 | Total reward = 54.02
2022-01-26 14:16:30.406 | DEBUG    | __main__:trials:24 - Trial = 1423/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.407 | DEBUG    | __main__:trials:29 - Trial = 1423/30000 | Total reward = 51.16
2022-01-26 14:16:30.411 | DEBUG    | __main__:trials:24 - Trial = 1424/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.412 | DEBUG    | __main__:trials:29 - Trial = 1424/30000 | Total reward = 48.92
2022-01-26 14:16:30.415 | DEBUG    | __main__:trials:24 - Trial = 1425/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.417 | DEBUG    | __main__:trials:29 - Trial = 1425/30000 | Total reward = 50.56
2022-01-26 14:16:30.420 | DEBUG    | __main__:trials:24 - Trial = 1426/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.422 | DEBUG    | __main__:trials:29 - Trial = 1426/30000 | Total reward = 56.08
2022-01-26 14:16:30.425 | DEBUG    | __main__:trials:24 - Trial = 1427/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.426 | DEBUG    | __main__:trials:29 - Trial = 1427/30000 | Total reward = 46.17
2022-01-26 14:16:30.430 | DEBUG    | __main__:trials:24 - Trial = 1428/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.430 | DEBUG    | __main__:trials:29 - Trial = 1428/30000 | Total reward = 50.89
2022-01-26 14:16:30.435 | DEBUG    | __main__:trials:24 - Trial = 1429/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.436 | DEBUG    | __main__:trials:29 - Trial = 1429/30000 | Total reward = 40.78
2022-01-26 14:16:30.440 | DEBUG    | __main__:trials:24 - Trial = 1430/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.441 | DEBUG    | __main__:trials:29 - Trial = 1430/30000 | Total reward = 39.45
2022-01-26 14:16:30.445 | DEBUG    | __main__:trials:24 - Trial = 1431/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.446 | DEBUG    | __main__:trials:29 - Trial = 1431/30000 | Total reward = 58.49
2022-01-26 14:16:30.450 | DEBUG    | __main__:trials:24 - Trial = 1432/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.451 | DEBUG    | __main__:trials:29 - Trial = 1432/30000 | Total reward = 47.13
2022-01-26 14:16:30.455 | DEBUG    | __main__:trials:24 - Trial = 1433/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.456 | DEBUG    | __main__:trials:29 - Trial = 1433/30000 | Total reward = 53.26
2022-01-26 14:16:30.460 | DEBUG    | __main__:trials:24 - Trial = 1434/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.462 | DEBUG    | __main__:trials:29 - Trial = 1434/30000 | Total reward = 54.48
2022-01-26 14:16:30.465 | DEBUG    | __main__:trials:24 - Trial = 1435/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.466 | DEBUG    | __main__:trials:29 - Trial = 1435/30000 | Total reward = 54.89
2022-01-26 14:16:30.470 | DEBUG    | __main__:trials:24 - Trial = 1436/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.471 | DEBUG    | __main__:trials:29 - Trial = 1436/30000 | Total reward = 47.38
2022-01-26 14:16:30.474 | DEBUG    | __main__:trials:24 - Trial = 1437/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.476 | DEBUG    | __main__:trials:29 - Trial = 1437/30000 | Total reward = 49.94
2022-01-26 14:16:30.479 | DEBUG    | __main__:trials:24 - Trial = 1438/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.481 | DEBUG    | __main__:trials:29 - Trial = 1438/30000 | Total reward = 51.31
2022-01-26 14:16:30.485 | DEBUG    | __main__:trials:24 - Trial = 1439/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.485 | DEBUG    | __main__:trials:29 - Trial = 1439/30000 | Total reward = 38.59
2022-01-26 14:16:30.489 | DEBUG    | __main__:trials:24 - Trial = 1440/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.490 | DEBUG    | __main__:trials:29 - Trial = 1440/30000 | Total reward = 54.38
2022-01-26 14:16:30.493 | DEBUG    | __main__:trials:24 - Trial = 1441/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.494 | DEBUG    | __main__:trials:29 - Trial = 1441/30000 | Total reward = 48.69
2022-01-26 14:16:30.497 | DEBUG    | __main__:trials:24 - Trial = 1442/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.498 | DEBUG    | __main__:trials:29 - Trial = 1442/30000 | Total reward = 52.22
2022-01-26 14:16:30.501 | DEBUG    | __main__:trials:24 - Trial = 1443/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.502 | DEBUG    | __main__:trials:29 - Trial = 1443/30000 | Total reward = 50.87
2022-01-26 14:16:30.505 | DEBUG    | __main__:trials:24 - Trial = 1444/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.508 | DEBUG    | __main__:trials:29 - Trial = 1444/30000 | Total reward = 34.30
2022-01-26 14:16:30.511 | DEBUG    | __main__:trials:24 - Trial = 1445/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.512 | DEBUG    | __main__:trials:29 - Trial = 1445/30000 | Total reward = 54.28
2022-01-26 14:16:30.516 | DEBUG    | __main__:trials:24 - Trial = 1446/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.517 | DEBUG    | __main__:trials:29 - Trial = 1446/30000 | Total reward = 42.10
2022-01-26 14:16:30.521 | DEBUG    | __main__:trials:24 - Trial = 1447/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.523 | DEBUG    | __main__:trials:29 - Trial = 1447/30000 | Total reward = 45.70
2022-01-26 14:16:30.526 | DEBUG    | __main__:trials:24 - Trial = 1448/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.527 | DEBUG    | __main__:trials:29 - Trial = 1448/30000 | Total reward = 49.72
2022-01-26 14:16:30.531 | DEBUG    | __main__:trials:24 - Trial = 1449/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.532 | DEBUG    | __main__:trials:29 - Trial = 1449/30000 | Total reward = 47.15
2022-01-26 14:16:30.536 | DEBUG    | __main__:trials:24 - Trial = 1450/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.538 | DEBUG    | __main__:trials:29 - Trial = 1450/30000 | Total reward = 51.96
2022-01-26 14:16:30.541 | DEBUG    | __main__:trials:24 - Trial = 1451/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.542 | DEBUG    | __main__:trials:29 - Trial = 1451/30000 | Total reward = 45.87
2022-01-26 14:16:30.546 | DEBUG    | __main__:trials:24 - Trial = 1452/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.547 | DEBUG    | __main__:trials:29 - Trial = 1452/30000 | Total reward = 51.23
2022-01-26 14:16:30.552 | DEBUG    | __main__:trials:24 - Trial = 1453/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.553 | DEBUG    | __main__:trials:29 - Trial = 1453/30000 | Total reward = 51.98
2022-01-26 14:16:30.557 | DEBUG    | __main__:trials:24 - Trial = 1454/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.558 | DEBUG    | __main__:trials:29 - Trial = 1454/30000 | Total reward = 47.96
2022-01-26 14:16:30.562 | DEBUG    | __main__:trials:24 - Trial = 1455/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.563 | DEBUG    | __main__:trials:29 - Trial = 1455/30000 | Total reward = 52.90
2022-01-26 14:16:30.567 | DEBUG    | __main__:trials:24 - Trial = 1456/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.569 | DEBUG    | __main__:trials:29 - Trial = 1456/30000 | Total reward = 43.13
2022-01-26 14:16:30.572 | DEBUG    | __main__:trials:24 - Trial = 1457/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.574 | DEBUG    | __main__:trials:29 - Trial = 1457/30000 | Total reward = 47.92
2022-01-26 14:16:30.577 | DEBUG    | __main__:trials:24 - Trial = 1458/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.579 | DEBUG    | __main__:trials:29 - Trial = 1458/30000 | Total reward = 39.95
2022-01-26 14:16:30.582 | DEBUG    | __main__:trials:24 - Trial = 1459/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.584 | DEBUG    | __main__:trials:29 - Trial = 1459/30000 | Total reward = 55.70
2022-01-26 14:16:30.588 | DEBUG    | __main__:trials:24 - Trial = 1460/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.589 | DEBUG    | __main__:trials:29 - Trial = 1460/30000 | Total reward = 58.90
2022-01-26 14:16:30.592 | DEBUG    | __main__:trials:24 - Trial = 1461/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.593 | DEBUG    | __main__:trials:29 - Trial = 1461/30000 | Total reward = 59.00
2022-01-26 14:16:30.596 | DEBUG    | __main__:trials:24 - Trial = 1462/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.598 | DEBUG    | __main__:trials:29 - Trial = 1462/30000 | Total reward = 50.84
2022-01-26 14:16:30.602 | DEBUG    | __main__:trials:24 - Trial = 1463/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.602 | DEBUG    | __main__:trials:29 - Trial = 1463/30000 | Total reward = 46.57
2022-01-26 14:16:30.607 | DEBUG    | __main__:trials:24 - Trial = 1464/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.608 | DEBUG    | __main__:trials:29 - Trial = 1464/30000 | Total reward = 42.12
2022-01-26 14:16:30.612 | DEBUG    | __main__:trials:24 - Trial = 1465/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.613 | DEBUG    | __main__:trials:29 - Trial = 1465/30000 | Total reward = 51.46
2022-01-26 14:16:30.617 | DEBUG    | __main__:trials:24 - Trial = 1466/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.618 | DEBUG    | __main__:trials:29 - Trial = 1466/30000 | Total reward = 38.77
2022-01-26 14:16:30.622 | DEBUG    | __main__:trials:24 - Trial = 1467/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.624 | DEBUG    | __main__:trials:29 - Trial = 1467/30000 | Total reward = 55.93
2022-01-26 14:16:30.627 | DEBUG    | __main__:trials:24 - Trial = 1468/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.629 | DEBUG    | __main__:trials:29 - Trial = 1468/30000 | Total reward = 55.93
2022-01-26 14:16:30.632 | DEBUG    | __main__:trials:24 - Trial = 1469/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.634 | DEBUG    | __main__:trials:29 - Trial = 1469/30000 | Total reward = 55.55
2022-01-26 14:16:30.637 | DEBUG    | __main__:trials:24 - Trial = 1470/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.639 | DEBUG    | __main__:trials:29 - Trial = 1470/30000 | Total reward = 40.40
2022-01-26 14:16:30.643 | DEBUG    | __main__:trials:24 - Trial = 1471/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.644 | DEBUG    | __main__:trials:29 - Trial = 1471/30000 | Total reward = 31.99
2022-01-26 14:16:30.647 | DEBUG    | __main__:trials:24 - Trial = 1472/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.649 | DEBUG    | __main__:trials:29 - Trial = 1472/30000 | Total reward = 53.56
2022-01-26 14:16:30.652 | DEBUG    | __main__:trials:24 - Trial = 1473/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.654 | DEBUG    | __main__:trials:29 - Trial = 1473/30000 | Total reward = 48.64
2022-01-26 14:16:30.657 | DEBUG    | __main__:trials:24 - Trial = 1474/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.658 | DEBUG    | __main__:trials:29 - Trial = 1474/30000 | Total reward = 51.02
2022-01-26 14:16:30.663 | DEBUG    | __main__:trials:24 - Trial = 1475/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.664 | DEBUG    | __main__:trials:29 - Trial = 1475/30000 | Total reward = 44.54
2022-01-26 14:16:30.667 | DEBUG    | __main__:trials:24 - Trial = 1476/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.669 | DEBUG    | __main__:trials:29 - Trial = 1476/30000 | Total reward = 48.52
2022-01-26 14:16:30.671 | DEBUG    | __main__:trials:26 - Trial = 1477/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.672 | DEBUG    | __main__:trials:29 - Trial = 1477/30000 | Total reward = 14.72
2022-01-26 14:16:30.676 | DEBUG    | __main__:trials:24 - Trial = 1478/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.677 | DEBUG    | __main__:trials:29 - Trial = 1478/30000 | Total reward = 48.27
2022-01-26 14:16:30.682 | DEBUG    | __main__:trials:24 - Trial = 1479/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.683 | DEBUG    | __main__:trials:29 - Trial = 1479/30000 | Total reward = 42.76
2022-01-26 14:16:30.687 | DEBUG    | __main__:trials:24 - Trial = 1480/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.688 | DEBUG    | __main__:trials:29 - Trial = 1480/30000 | Total reward = 40.31
2022-01-26 14:16:30.692 | DEBUG    | __main__:trials:24 - Trial = 1481/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.693 | DEBUG    | __main__:trials:29 - Trial = 1481/30000 | Total reward = 46.78
2022-01-26 14:16:30.697 | DEBUG    | __main__:trials:24 - Trial = 1482/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.698 | DEBUG    | __main__:trials:29 - Trial = 1482/30000 | Total reward = 46.27
2022-01-26 14:16:30.701 | DEBUG    | __main__:trials:26 - Trial = 1483/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.702 | DEBUG    | __main__:trials:29 - Trial = 1483/30000 | Total reward = 21.55
2022-01-26 14:16:30.706 | DEBUG    | __main__:trials:24 - Trial = 1484/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.706 | DEBUG    | __main__:trials:29 - Trial = 1484/30000 | Total reward = 46.15
2022-01-26 14:16:30.710 | DEBUG    | __main__:trials:24 - Trial = 1485/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.712 | DEBUG    | __main__:trials:29 - Trial = 1485/30000 | Total reward = 46.78
2022-01-26 14:16:30.715 | DEBUG    | __main__:trials:24 - Trial = 1486/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.716 | DEBUG    | __main__:trials:29 - Trial = 1486/30000 | Total reward = 46.80
2022-01-26 14:16:30.720 | DEBUG    | __main__:trials:24 - Trial = 1487/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.721 | DEBUG    | __main__:trials:29 - Trial = 1487/30000 | Total reward = 46.78
2022-01-26 14:16:30.724 | DEBUG    | __main__:trials:24 - Trial = 1488/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.726 | DEBUG    | __main__:trials:29 - Trial = 1488/30000 | Total reward = 55.57
2022-01-26 14:16:30.729 | DEBUG    | __main__:trials:24 - Trial = 1489/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.730 | DEBUG    | __main__:trials:29 - Trial = 1489/30000 | Total reward = 36.16
2022-01-26 14:16:30.733 | DEBUG    | __main__:trials:24 - Trial = 1490/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.735 | DEBUG    | __main__:trials:29 - Trial = 1490/30000 | Total reward = 48.43
2022-01-26 14:16:30.738 | DEBUG    | __main__:trials:26 - Trial = 1491/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.739 | DEBUG    | __main__:trials:29 - Trial = 1491/30000 | Total reward = 9.23
2022-01-26 14:16:30.742 | DEBUG    | __main__:trials:24 - Trial = 1492/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.744 | DEBUG    | __main__:trials:29 - Trial = 1492/30000 | Total reward = 39.34
2022-01-26 14:16:30.747 | DEBUG    | __main__:trials:24 - Trial = 1493/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.749 | DEBUG    | __main__:trials:29 - Trial = 1493/30000 | Total reward = 49.52
2022-01-26 14:16:30.752 | DEBUG    | __main__:trials:24 - Trial = 1494/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.754 | DEBUG    | __main__:trials:29 - Trial = 1494/30000 | Total reward = 46.86
2022-01-26 14:16:30.757 | DEBUG    | __main__:trials:24 - Trial = 1495/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.759 | DEBUG    | __main__:trials:29 - Trial = 1495/30000 | Total reward = 52.82
2022-01-26 14:16:30.762 | DEBUG    | __main__:trials:24 - Trial = 1496/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.763 | DEBUG    | __main__:trials:29 - Trial = 1496/30000 | Total reward = 34.64
2022-01-26 14:16:30.767 | DEBUG    | __main__:trials:24 - Trial = 1497/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.769 | DEBUG    | __main__:trials:29 - Trial = 1497/30000 | Total reward = 36.07
2022-01-26 14:16:30.772 | DEBUG    | __main__:trials:24 - Trial = 1498/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.774 | DEBUG    | __main__:trials:29 - Trial = 1498/30000 | Total reward = 48.27
2022-01-26 14:16:30.777 | DEBUG    | __main__:trials:24 - Trial = 1499/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.779 | DEBUG    | __main__:trials:29 - Trial = 1499/30000 | Total reward = 46.61
2022-01-26 14:16:30.780 | DEBUG    | __main__:trials:26 - Trial = 1500/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.782 | DEBUG    | __main__:trials:29 - Trial = 1500/30000 | Total reward = 11.23
2022-01-26 14:16:30.786 | DEBUG    | __main__:trials:24 - Trial = 1501/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.787 | DEBUG    | __main__:trials:29 - Trial = 1501/30000 | Total reward = 41.51
2022-01-26 14:16:30.790 | DEBUG    | __main__:trials:24 - Trial = 1502/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.792 | DEBUG    | __main__:trials:29 - Trial = 1502/30000 | Total reward = 32.51
2022-01-26 14:16:30.795 | DEBUG    | __main__:trials:24 - Trial = 1503/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.796 | DEBUG    | __main__:trials:29 - Trial = 1503/30000 | Total reward = 44.92
2022-01-26 14:16:30.800 | DEBUG    | __main__:trials:26 - Trial = 1504/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.801 | DEBUG    | __main__:trials:29 - Trial = 1504/30000 | Total reward = 15.74
2022-01-26 14:16:30.805 | DEBUG    | __main__:trials:24 - Trial = 1505/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.806 | DEBUG    | __main__:trials:29 - Trial = 1505/30000 | Total reward = 45.38
2022-01-26 14:16:30.810 | DEBUG    | __main__:trials:24 - Trial = 1506/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.812 | DEBUG    | __main__:trials:29 - Trial = 1506/30000 | Total reward = 49.98
2022-01-26 14:16:30.814 | DEBUG    | __main__:trials:24 - Trial = 1507/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.816 | DEBUG    | __main__:trials:29 - Trial = 1507/30000 | Total reward = 39.61
2022-01-26 14:16:30.820 | DEBUG    | __main__:trials:24 - Trial = 1508/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.821 | DEBUG    | __main__:trials:29 - Trial = 1508/30000 | Total reward = 45.57
2022-01-26 14:16:30.825 | DEBUG    | __main__:trials:24 - Trial = 1509/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.826 | DEBUG    | __main__:trials:29 - Trial = 1509/30000 | Total reward = 47.70
2022-01-26 14:16:30.829 | DEBUG    | __main__:trials:24 - Trial = 1510/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.831 | DEBUG    | __main__:trials:29 - Trial = 1510/30000 | Total reward = 50.37
2022-01-26 14:16:30.835 | DEBUG    | __main__:trials:24 - Trial = 1511/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.836 | DEBUG    | __main__:trials:29 - Trial = 1511/30000 | Total reward = 28.39
2022-01-26 14:16:30.840 | DEBUG    | __main__:trials:24 - Trial = 1512/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.840 | DEBUG    | __main__:trials:29 - Trial = 1512/30000 | Total reward = 30.46
2022-01-26 14:16:30.845 | DEBUG    | __main__:trials:24 - Trial = 1513/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.846 | DEBUG    | __main__:trials:29 - Trial = 1513/30000 | Total reward = 30.53
2022-01-26 14:16:30.849 | DEBUG    | __main__:trials:24 - Trial = 1514/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.850 | DEBUG    | __main__:trials:29 - Trial = 1514/30000 | Total reward = 39.53
2022-01-26 14:16:30.853 | DEBUG    | __main__:trials:26 - Trial = 1515/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.854 | DEBUG    | __main__:trials:29 - Trial = 1515/30000 | Total reward = 13.47
2022-01-26 14:16:30.858 | DEBUG    | __main__:trials:24 - Trial = 1516/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.859 | DEBUG    | __main__:trials:29 - Trial = 1516/30000 | Total reward = 46.51
2022-01-26 14:16:30.862 | DEBUG    | __main__:trials:24 - Trial = 1517/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.863 | DEBUG    | __main__:trials:29 - Trial = 1517/30000 | Total reward = 26.69
2022-01-26 14:16:30.866 | DEBUG    | __main__:trials:24 - Trial = 1518/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.868 | DEBUG    | __main__:trials:29 - Trial = 1518/30000 | Total reward = 51.60
2022-01-26 14:16:30.871 | DEBUG    | __main__:trials:24 - Trial = 1519/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.872 | DEBUG    | __main__:trials:29 - Trial = 1519/30000 | Total reward = 48.82
2022-01-26 14:16:30.876 | DEBUG    | __main__:trials:26 - Trial = 1520/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.876 | DEBUG    | __main__:trials:29 - Trial = 1520/30000 | Total reward = 31.46
2022-01-26 14:16:30.881 | DEBUG    | __main__:trials:24 - Trial = 1521/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.882 | DEBUG    | __main__:trials:29 - Trial = 1521/30000 | Total reward = 45.12
2022-01-26 14:16:30.886 | DEBUG    | __main__:trials:24 - Trial = 1522/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.887 | DEBUG    | __main__:trials:29 - Trial = 1522/30000 | Total reward = 48.80
2022-01-26 14:16:30.891 | DEBUG    | __main__:trials:26 - Trial = 1523/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.892 | DEBUG    | __main__:trials:29 - Trial = 1523/30000 | Total reward = 41.29
2022-01-26 14:16:30.896 | DEBUG    | __main__:trials:24 - Trial = 1524/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.898 | DEBUG    | __main__:trials:29 - Trial = 1524/30000 | Total reward = 46.49
2022-01-26 14:16:30.901 | DEBUG    | __main__:trials:24 - Trial = 1525/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.902 | DEBUG    | __main__:trials:29 - Trial = 1525/30000 | Total reward = 48.02
2022-01-26 14:16:30.905 | DEBUG    | __main__:trials:24 - Trial = 1526/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.907 | DEBUG    | __main__:trials:29 - Trial = 1526/30000 | Total reward = 41.64
2022-01-26 14:16:30.910 | DEBUG    | __main__:trials:24 - Trial = 1527/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.911 | DEBUG    | __main__:trials:29 - Trial = 1527/30000 | Total reward = 46.78
2022-01-26 14:16:30.915 | DEBUG    | __main__:trials:24 - Trial = 1528/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.915 | DEBUG    | __main__:trials:29 - Trial = 1528/30000 | Total reward = 44.36
2022-01-26 14:16:30.920 | DEBUG    | __main__:trials:24 - Trial = 1529/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.922 | DEBUG    | __main__:trials:29 - Trial = 1529/30000 | Total reward = 42.50
2022-01-26 14:16:30.926 | DEBUG    | __main__:trials:24 - Trial = 1530/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.927 | DEBUG    | __main__:trials:29 - Trial = 1530/30000 | Total reward = 42.12
2022-01-26 14:16:30.931 | DEBUG    | __main__:trials:26 - Trial = 1531/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.932 | DEBUG    | __main__:trials:29 - Trial = 1531/30000 | Total reward = 22.41
2022-01-26 14:16:30.936 | DEBUG    | __main__:trials:24 - Trial = 1532/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.938 | DEBUG    | __main__:trials:29 - Trial = 1532/30000 | Total reward = 47.24
2022-01-26 14:16:30.941 | DEBUG    | __main__:trials:26 - Trial = 1533/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:30.943 | DEBUG    | __main__:trials:29 - Trial = 1533/30000 | Total reward = 22.09
2022-01-26 14:16:30.946 | DEBUG    | __main__:trials:24 - Trial = 1534/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.947 | DEBUG    | __main__:trials:29 - Trial = 1534/30000 | Total reward = 49.45
2022-01-26 14:16:30.951 | DEBUG    | __main__:trials:24 - Trial = 1535/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.952 | DEBUG    | __main__:trials:29 - Trial = 1535/30000 | Total reward = 39.43
2022-01-26 14:16:30.956 | DEBUG    | __main__:trials:24 - Trial = 1536/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.957 | DEBUG    | __main__:trials:29 - Trial = 1536/30000 | Total reward = 49.42
2022-01-26 14:16:30.960 | DEBUG    | __main__:trials:24 - Trial = 1537/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.962 | DEBUG    | __main__:trials:29 - Trial = 1537/30000 | Total reward = 58.48
2022-01-26 14:16:30.965 | DEBUG    | __main__:trials:24 - Trial = 1538/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.966 | DEBUG    | __main__:trials:29 - Trial = 1538/30000 | Total reward = 49.80
2022-01-26 14:16:30.969 | DEBUG    | __main__:trials:24 - Trial = 1539/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.970 | DEBUG    | __main__:trials:29 - Trial = 1539/30000 | Total reward = 57.46
2022-01-26 14:16:30.974 | DEBUG    | __main__:trials:24 - Trial = 1540/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.974 | DEBUG    | __main__:trials:29 - Trial = 1540/30000 | Total reward = 44.21
2022-01-26 14:16:30.980 | DEBUG    | __main__:trials:24 - Trial = 1541/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.980 | DEBUG    | __main__:trials:29 - Trial = 1541/30000 | Total reward = 57.55
2022-01-26 14:16:30.990 | DEBUG    | __main__:trials:24 - Trial = 1542/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.991 | DEBUG    | __main__:trials:29 - Trial = 1542/30000 | Total reward = 26.25
2022-01-26 14:16:30.995 | DEBUG    | __main__:trials:24 - Trial = 1543/30000 | Max number of steps (20) reached
2022-01-26 14:16:30.997 | DEBUG    | __main__:trials:29 - Trial = 1543/30000 | Total reward = 57.39
2022-01-26 14:16:31.002 | DEBUG    | __main__:trials:24 - Trial = 1544/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.002 | DEBUG    | __main__:trials:29 - Trial = 1544/30000 | Total reward = 31.42
2022-01-26 14:16:31.007 | DEBUG    | __main__:trials:24 - Trial = 1545/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.008 | DEBUG    | __main__:trials:29 - Trial = 1545/30000 | Total reward = 34.48
2022-01-26 14:16:31.012 | DEBUG    | __main__:trials:24 - Trial = 1546/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.013 | DEBUG    | __main__:trials:29 - Trial = 1546/30000 | Total reward = 25.68
2022-01-26 14:16:31.016 | DEBUG    | __main__:trials:24 - Trial = 1547/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.018 | DEBUG    | __main__:trials:29 - Trial = 1547/30000 | Total reward = 35.72
2022-01-26 14:16:31.022 | DEBUG    | __main__:trials:24 - Trial = 1548/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.022 | DEBUG    | __main__:trials:29 - Trial = 1548/30000 | Total reward = 50.11
2022-01-26 14:16:31.027 | DEBUG    | __main__:trials:24 - Trial = 1549/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.028 | DEBUG    | __main__:trials:29 - Trial = 1549/30000 | Total reward = 38.59
2022-01-26 14:16:31.032 | DEBUG    | __main__:trials:24 - Trial = 1550/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.034 | DEBUG    | __main__:trials:29 - Trial = 1550/30000 | Total reward = 49.43
2022-01-26 14:16:31.037 | DEBUG    | __main__:trials:24 - Trial = 1551/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.039 | DEBUG    | __main__:trials:29 - Trial = 1551/30000 | Total reward = 37.73
2022-01-26 14:16:31.042 | DEBUG    | __main__:trials:26 - Trial = 1552/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.044 | DEBUG    | __main__:trials:29 - Trial = 1552/30000 | Total reward = 20.63
2022-01-26 14:16:31.048 | DEBUG    | __main__:trials:24 - Trial = 1553/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.049 | DEBUG    | __main__:trials:29 - Trial = 1553/30000 | Total reward = 44.97
2022-01-26 14:16:31.053 | DEBUG    | __main__:trials:24 - Trial = 1554/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.053 | DEBUG    | __main__:trials:29 - Trial = 1554/30000 | Total reward = 46.45
2022-01-26 14:16:31.057 | DEBUG    | __main__:trials:24 - Trial = 1555/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.058 | DEBUG    | __main__:trials:29 - Trial = 1555/30000 | Total reward = 41.57
2022-01-26 14:16:31.063 | DEBUG    | __main__:trials:24 - Trial = 1556/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.064 | DEBUG    | __main__:trials:29 - Trial = 1556/30000 | Total reward = 44.37
2022-01-26 14:16:31.067 | DEBUG    | __main__:trials:24 - Trial = 1557/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.069 | DEBUG    | __main__:trials:29 - Trial = 1557/30000 | Total reward = 49.74
2022-01-26 14:16:31.071 | DEBUG    | __main__:trials:26 - Trial = 1558/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.073 | DEBUG    | __main__:trials:29 - Trial = 1558/30000 | Total reward = 15.56
2022-01-26 14:16:31.077 | DEBUG    | __main__:trials:24 - Trial = 1559/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.078 | DEBUG    | __main__:trials:29 - Trial = 1559/30000 | Total reward = 46.96
2022-01-26 14:16:31.081 | DEBUG    | __main__:trials:24 - Trial = 1560/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.083 | DEBUG    | __main__:trials:29 - Trial = 1560/30000 | Total reward = 48.08
2022-01-26 14:16:31.085 | DEBUG    | __main__:trials:26 - Trial = 1561/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.086 | DEBUG    | __main__:trials:29 - Trial = 1561/30000 | Total reward = 10.51
2022-01-26 14:16:31.090 | DEBUG    | __main__:trials:24 - Trial = 1562/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.091 | DEBUG    | __main__:trials:29 - Trial = 1562/30000 | Total reward = 46.86
2022-01-26 14:16:31.095 | DEBUG    | __main__:trials:24 - Trial = 1563/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.097 | DEBUG    | __main__:trials:29 - Trial = 1563/30000 | Total reward = 36.11
2022-01-26 14:16:31.100 | DEBUG    | __main__:trials:24 - Trial = 1564/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.101 | DEBUG    | __main__:trials:29 - Trial = 1564/30000 | Total reward = 45.68
2022-01-26 14:16:31.105 | DEBUG    | __main__:trials:24 - Trial = 1565/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.107 | DEBUG    | __main__:trials:29 - Trial = 1565/30000 | Total reward = 43.00
2022-01-26 14:16:31.110 | DEBUG    | __main__:trials:24 - Trial = 1566/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.112 | DEBUG    | __main__:trials:29 - Trial = 1566/30000 | Total reward = 46.47
2022-01-26 14:16:31.115 | DEBUG    | __main__:trials:26 - Trial = 1567/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.116 | DEBUG    | __main__:trials:29 - Trial = 1567/30000 | Total reward = 30.35
2022-01-26 14:16:31.120 | DEBUG    | __main__:trials:24 - Trial = 1568/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.122 | DEBUG    | __main__:trials:29 - Trial = 1568/30000 | Total reward = 50.12
2022-01-26 14:16:31.126 | DEBUG    | __main__:trials:24 - Trial = 1569/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.126 | DEBUG    | __main__:trials:29 - Trial = 1569/30000 | Total reward = 40.86
2022-01-26 14:16:31.131 | DEBUG    | __main__:trials:24 - Trial = 1570/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.132 | DEBUG    | __main__:trials:29 - Trial = 1570/30000 | Total reward = 54.74
2022-01-26 14:16:31.136 | DEBUG    | __main__:trials:24 - Trial = 1571/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.137 | DEBUG    | __main__:trials:29 - Trial = 1571/30000 | Total reward = 39.76
2022-01-26 14:16:31.141 | DEBUG    | __main__:trials:24 - Trial = 1572/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.142 | DEBUG    | __main__:trials:29 - Trial = 1572/30000 | Total reward = 44.49
2022-01-26 14:16:31.146 | DEBUG    | __main__:trials:24 - Trial = 1573/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.147 | DEBUG    | __main__:trials:29 - Trial = 1573/30000 | Total reward = 48.62
2022-01-26 14:16:31.151 | DEBUG    | __main__:trials:24 - Trial = 1574/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.152 | DEBUG    | __main__:trials:29 - Trial = 1574/30000 | Total reward = 51.92
2022-01-26 14:16:31.156 | DEBUG    | __main__:trials:24 - Trial = 1575/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.158 | DEBUG    | __main__:trials:29 - Trial = 1575/30000 | Total reward = 48.62
2022-01-26 14:16:31.162 | DEBUG    | __main__:trials:24 - Trial = 1576/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.163 | DEBUG    | __main__:trials:29 - Trial = 1576/30000 | Total reward = 49.13
2022-01-26 14:16:31.167 | DEBUG    | __main__:trials:24 - Trial = 1577/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.168 | DEBUG    | __main__:trials:29 - Trial = 1577/30000 | Total reward = 43.35
2022-01-26 14:16:31.172 | DEBUG    | __main__:trials:24 - Trial = 1578/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.174 | DEBUG    | __main__:trials:29 - Trial = 1578/30000 | Total reward = 46.74
2022-01-26 14:16:31.178 | DEBUG    | __main__:trials:24 - Trial = 1579/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.179 | DEBUG    | __main__:trials:29 - Trial = 1579/30000 | Total reward = 40.68
2022-01-26 14:16:31.183 | DEBUG    | __main__:trials:24 - Trial = 1580/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.184 | DEBUG    | __main__:trials:29 - Trial = 1580/30000 | Total reward = 52.48
2022-01-26 14:16:31.187 | DEBUG    | __main__:trials:24 - Trial = 1581/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.188 | DEBUG    | __main__:trials:29 - Trial = 1581/30000 | Total reward = 48.62
2022-01-26 14:16:31.192 | DEBUG    | __main__:trials:24 - Trial = 1582/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.193 | DEBUG    | __main__:trials:29 - Trial = 1582/30000 | Total reward = 39.35
2022-01-26 14:16:31.197 | DEBUG    | __main__:trials:24 - Trial = 1583/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.198 | DEBUG    | __main__:trials:29 - Trial = 1583/30000 | Total reward = 49.69
2022-01-26 14:16:31.201 | DEBUG    | __main__:trials:24 - Trial = 1584/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.202 | DEBUG    | __main__:trials:29 - Trial = 1584/30000 | Total reward = 37.73
2022-01-26 14:16:31.205 | DEBUG    | __main__:trials:24 - Trial = 1585/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.206 | DEBUG    | __main__:trials:29 - Trial = 1585/30000 | Total reward = 37.62
2022-01-26 14:16:31.209 | DEBUG    | __main__:trials:24 - Trial = 1586/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.210 | DEBUG    | __main__:trials:29 - Trial = 1586/30000 | Total reward = 53.08
2022-01-26 14:16:31.213 | DEBUG    | __main__:trials:24 - Trial = 1587/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.214 | DEBUG    | __main__:trials:29 - Trial = 1587/30000 | Total reward = 46.05
2022-01-26 14:16:31.217 | DEBUG    | __main__:trials:24 - Trial = 1588/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.217 | DEBUG    | __main__:trials:29 - Trial = 1588/30000 | Total reward = 46.38
2022-01-26 14:16:31.221 | DEBUG    | __main__:trials:26 - Trial = 1589/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.222 | DEBUG    | __main__:trials:29 - Trial = 1589/30000 | Total reward = 27.77
2022-01-26 14:16:31.227 | DEBUG    | __main__:trials:24 - Trial = 1590/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.227 | DEBUG    | __main__:trials:29 - Trial = 1590/30000 | Total reward = 48.13
2022-01-26 14:16:31.231 | DEBUG    | __main__:trials:24 - Trial = 1591/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.233 | DEBUG    | __main__:trials:29 - Trial = 1591/30000 | Total reward = 29.63
2022-01-26 14:16:31.235 | DEBUG    | __main__:trials:26 - Trial = 1592/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.236 | DEBUG    | __main__:trials:29 - Trial = 1592/30000 | Total reward = 19.17
2022-01-26 14:16:31.240 | DEBUG    | __main__:trials:24 - Trial = 1593/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.241 | DEBUG    | __main__:trials:29 - Trial = 1593/30000 | Total reward = 46.89
2022-01-26 14:16:31.246 | DEBUG    | __main__:trials:24 - Trial = 1594/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.246 | DEBUG    | __main__:trials:29 - Trial = 1594/30000 | Total reward = 32.44
2022-01-26 14:16:31.252 | DEBUG    | __main__:trials:24 - Trial = 1595/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.253 | DEBUG    | __main__:trials:29 - Trial = 1595/30000 | Total reward = 46.78
2022-01-26 14:16:31.257 | DEBUG    | __main__:trials:24 - Trial = 1596/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.258 | DEBUG    | __main__:trials:29 - Trial = 1596/30000 | Total reward = 49.65
2022-01-26 14:16:31.262 | DEBUG    | __main__:trials:24 - Trial = 1597/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.263 | DEBUG    | __main__:trials:29 - Trial = 1597/30000 | Total reward = 58.71
2022-01-26 14:16:31.267 | DEBUG    | __main__:trials:24 - Trial = 1598/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.268 | DEBUG    | __main__:trials:29 - Trial = 1598/30000 | Total reward = 41.17
2022-01-26 14:16:31.272 | DEBUG    | __main__:trials:24 - Trial = 1599/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.274 | DEBUG    | __main__:trials:29 - Trial = 1599/30000 | Total reward = 40.57
2022-01-26 14:16:31.277 | DEBUG    | __main__:trials:24 - Trial = 1600/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.278 | DEBUG    | __main__:trials:29 - Trial = 1600/30000 | Total reward = 49.45
2022-01-26 14:16:31.282 | DEBUG    | __main__:trials:24 - Trial = 1601/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.284 | DEBUG    | __main__:trials:29 - Trial = 1601/30000 | Total reward = 50.92
2022-01-26 14:16:31.287 | DEBUG    | __main__:trials:24 - Trial = 1602/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.288 | DEBUG    | __main__:trials:29 - Trial = 1602/30000 | Total reward = 51.64
2022-01-26 14:16:31.292 | DEBUG    | __main__:trials:24 - Trial = 1603/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.294 | DEBUG    | __main__:trials:29 - Trial = 1603/30000 | Total reward = 43.95
2022-01-26 14:16:31.297 | DEBUG    | __main__:trials:24 - Trial = 1604/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.299 | DEBUG    | __main__:trials:29 - Trial = 1604/30000 | Total reward = 46.45
2022-01-26 14:16:31.302 | DEBUG    | __main__:trials:24 - Trial = 1605/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.304 | DEBUG    | __main__:trials:29 - Trial = 1605/30000 | Total reward = 46.54
2022-01-26 14:16:31.307 | DEBUG    | __main__:trials:26 - Trial = 1606/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.307 | DEBUG    | __main__:trials:29 - Trial = 1606/30000 | Total reward = 9.23
2022-01-26 14:16:31.312 | DEBUG    | __main__:trials:24 - Trial = 1607/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.313 | DEBUG    | __main__:trials:29 - Trial = 1607/30000 | Total reward = 55.44
2022-01-26 14:16:31.317 | DEBUG    | __main__:trials:24 - Trial = 1608/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.318 | DEBUG    | __main__:trials:29 - Trial = 1608/30000 | Total reward = 49.86
2022-01-26 14:16:31.322 | DEBUG    | __main__:trials:24 - Trial = 1609/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.324 | DEBUG    | __main__:trials:29 - Trial = 1609/30000 | Total reward = 48.76
2022-01-26 14:16:31.327 | DEBUG    | __main__:trials:24 - Trial = 1610/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.328 | DEBUG    | __main__:trials:29 - Trial = 1610/30000 | Total reward = 53.08
2022-01-26 14:16:31.332 | DEBUG    | __main__:trials:24 - Trial = 1611/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.334 | DEBUG    | __main__:trials:29 - Trial = 1611/30000 | Total reward = 49.55
2022-01-26 14:16:31.337 | DEBUG    | __main__:trials:24 - Trial = 1612/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.339 | DEBUG    | __main__:trials:29 - Trial = 1612/30000 | Total reward = 41.19
2022-01-26 14:16:31.342 | DEBUG    | __main__:trials:24 - Trial = 1613/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.343 | DEBUG    | __main__:trials:29 - Trial = 1613/30000 | Total reward = 40.33
2022-01-26 14:16:31.346 | DEBUG    | __main__:trials:24 - Trial = 1614/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.348 | DEBUG    | __main__:trials:29 - Trial = 1614/30000 | Total reward = 55.17
2022-01-26 14:16:31.352 | DEBUG    | __main__:trials:24 - Trial = 1615/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.352 | DEBUG    | __main__:trials:29 - Trial = 1615/30000 | Total reward = 61.75
2022-01-26 14:16:31.357 | DEBUG    | __main__:trials:24 - Trial = 1616/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.358 | DEBUG    | __main__:trials:29 - Trial = 1616/30000 | Total reward = 40.57
2022-01-26 14:16:31.362 | DEBUG    | __main__:trials:24 - Trial = 1617/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.364 | DEBUG    | __main__:trials:29 - Trial = 1617/30000 | Total reward = 55.47
2022-01-26 14:16:31.367 | DEBUG    | __main__:trials:24 - Trial = 1618/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.368 | DEBUG    | __main__:trials:29 - Trial = 1618/30000 | Total reward = 58.28
2022-01-26 14:16:31.372 | DEBUG    | __main__:trials:24 - Trial = 1619/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.373 | DEBUG    | __main__:trials:29 - Trial = 1619/30000 | Total reward = 59.31
2022-01-26 14:16:31.376 | DEBUG    | __main__:trials:24 - Trial = 1620/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.378 | DEBUG    | __main__:trials:29 - Trial = 1620/30000 | Total reward = 56.43
2022-01-26 14:16:31.381 | DEBUG    | __main__:trials:24 - Trial = 1621/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.382 | DEBUG    | __main__:trials:29 - Trial = 1621/30000 | Total reward = 53.75
2022-01-26 14:16:31.385 | DEBUG    | __main__:trials:24 - Trial = 1622/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.386 | DEBUG    | __main__:trials:29 - Trial = 1622/30000 | Total reward = 62.33
2022-01-26 14:16:31.389 | DEBUG    | __main__:trials:24 - Trial = 1623/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.390 | DEBUG    | __main__:trials:29 - Trial = 1623/30000 | Total reward = 54.35
2022-01-26 14:16:31.393 | DEBUG    | __main__:trials:24 - Trial = 1624/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.394 | DEBUG    | __main__:trials:29 - Trial = 1624/30000 | Total reward = 45.90
2022-01-26 14:16:31.397 | DEBUG    | __main__:trials:24 - Trial = 1625/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.399 | DEBUG    | __main__:trials:29 - Trial = 1625/30000 | Total reward = 44.63
2022-01-26 14:16:31.403 | DEBUG    | __main__:trials:24 - Trial = 1626/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.405 | DEBUG    | __main__:trials:29 - Trial = 1626/30000 | Total reward = 48.77
2022-01-26 14:16:31.408 | DEBUG    | __main__:trials:24 - Trial = 1627/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.409 | DEBUG    | __main__:trials:29 - Trial = 1627/30000 | Total reward = 36.97
2022-01-26 14:16:31.413 | DEBUG    | __main__:trials:24 - Trial = 1628/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.414 | DEBUG    | __main__:trials:29 - Trial = 1628/30000 | Total reward = 54.34
2022-01-26 14:16:31.418 | DEBUG    | __main__:trials:24 - Trial = 1629/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.419 | DEBUG    | __main__:trials:29 - Trial = 1629/30000 | Total reward = 48.47
2022-01-26 14:16:31.422 | DEBUG    | __main__:trials:24 - Trial = 1630/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.423 | DEBUG    | __main__:trials:29 - Trial = 1630/30000 | Total reward = 60.85
2022-01-26 14:16:31.426 | DEBUG    | __main__:trials:24 - Trial = 1631/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.428 | DEBUG    | __main__:trials:29 - Trial = 1631/30000 | Total reward = 54.45
2022-01-26 14:16:31.431 | DEBUG    | __main__:trials:24 - Trial = 1632/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.431 | DEBUG    | __main__:trials:29 - Trial = 1632/30000 | Total reward = 46.89
2022-01-26 14:16:31.435 | DEBUG    | __main__:trials:24 - Trial = 1633/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.437 | DEBUG    | __main__:trials:29 - Trial = 1633/30000 | Total reward = 56.34
2022-01-26 14:16:31.440 | DEBUG    | __main__:trials:24 - Trial = 1634/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.442 | DEBUG    | __main__:trials:29 - Trial = 1634/30000 | Total reward = 37.90
2022-01-26 14:16:31.445 | DEBUG    | __main__:trials:24 - Trial = 1635/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.446 | DEBUG    | __main__:trials:29 - Trial = 1635/30000 | Total reward = 54.72
2022-01-26 14:16:31.451 | DEBUG    | __main__:trials:24 - Trial = 1636/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.452 | DEBUG    | __main__:trials:29 - Trial = 1636/30000 | Total reward = 47.21
2022-01-26 14:16:31.456 | DEBUG    | __main__:trials:24 - Trial = 1637/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.458 | DEBUG    | __main__:trials:29 - Trial = 1637/30000 | Total reward = 37.08
2022-01-26 14:16:31.461 | DEBUG    | __main__:trials:24 - Trial = 1638/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.462 | DEBUG    | __main__:trials:29 - Trial = 1638/30000 | Total reward = 40.85
2022-01-26 14:16:31.467 | DEBUG    | __main__:trials:24 - Trial = 1639/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.467 | DEBUG    | __main__:trials:29 - Trial = 1639/30000 | Total reward = 43.11
2022-01-26 14:16:31.471 | DEBUG    | __main__:trials:24 - Trial = 1640/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.473 | DEBUG    | __main__:trials:29 - Trial = 1640/30000 | Total reward = 42.12
2022-01-26 14:16:31.477 | DEBUG    | __main__:trials:24 - Trial = 1641/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.478 | DEBUG    | __main__:trials:29 - Trial = 1641/30000 | Total reward = 34.64
2022-01-26 14:16:31.481 | DEBUG    | __main__:trials:24 - Trial = 1642/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.482 | DEBUG    | __main__:trials:29 - Trial = 1642/30000 | Total reward = 48.76
2022-01-26 14:16:31.486 | DEBUG    | __main__:trials:24 - Trial = 1643/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.488 | DEBUG    | __main__:trials:29 - Trial = 1643/30000 | Total reward = 54.45
2022-01-26 14:16:31.491 | DEBUG    | __main__:trials:24 - Trial = 1644/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.492 | DEBUG    | __main__:trials:29 - Trial = 1644/30000 | Total reward = 48.79
2022-01-26 14:16:31.496 | DEBUG    | __main__:trials:24 - Trial = 1645/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.498 | DEBUG    | __main__:trials:29 - Trial = 1645/30000 | Total reward = 39.49
2022-01-26 14:16:31.501 | DEBUG    | __main__:trials:24 - Trial = 1646/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.503 | DEBUG    | __main__:trials:29 - Trial = 1646/30000 | Total reward = 53.54
2022-01-26 14:16:31.507 | DEBUG    | __main__:trials:24 - Trial = 1647/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.507 | DEBUG    | __main__:trials:29 - Trial = 1647/30000 | Total reward = 55.27
2022-01-26 14:16:31.512 | DEBUG    | __main__:trials:24 - Trial = 1648/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.513 | DEBUG    | __main__:trials:29 - Trial = 1648/30000 | Total reward = 54.45
2022-01-26 14:16:31.516 | DEBUG    | __main__:trials:24 - Trial = 1649/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.517 | DEBUG    | __main__:trials:29 - Trial = 1649/30000 | Total reward = 49.77
2022-01-26 14:16:31.520 | DEBUG    | __main__:trials:24 - Trial = 1650/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.521 | DEBUG    | __main__:trials:29 - Trial = 1650/30000 | Total reward = 42.12
2022-01-26 14:16:31.525 | DEBUG    | __main__:trials:24 - Trial = 1651/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.526 | DEBUG    | __main__:trials:29 - Trial = 1651/30000 | Total reward = 55.06
2022-01-26 14:16:31.529 | DEBUG    | __main__:trials:24 - Trial = 1652/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.531 | DEBUG    | __main__:trials:29 - Trial = 1652/30000 | Total reward = 62.25
2022-01-26 14:16:31.534 | DEBUG    | __main__:trials:24 - Trial = 1653/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.536 | DEBUG    | __main__:trials:29 - Trial = 1653/30000 | Total reward = 65.75
2022-01-26 14:16:31.540 | DEBUG    | __main__:trials:24 - Trial = 1654/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.541 | DEBUG    | __main__:trials:29 - Trial = 1654/30000 | Total reward = 48.64
2022-01-26 14:16:31.545 | DEBUG    | __main__:trials:24 - Trial = 1655/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.546 | DEBUG    | __main__:trials:29 - Trial = 1655/30000 | Total reward = 53.76
2022-01-26 14:16:31.550 | DEBUG    | __main__:trials:24 - Trial = 1656/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.551 | DEBUG    | __main__:trials:29 - Trial = 1656/30000 | Total reward = 53.00
2022-01-26 14:16:31.556 | DEBUG    | __main__:trials:24 - Trial = 1657/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.557 | DEBUG    | __main__:trials:29 - Trial = 1657/30000 | Total reward = 53.77
2022-01-26 14:16:31.561 | DEBUG    | __main__:trials:24 - Trial = 1658/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.563 | DEBUG    | __main__:trials:29 - Trial = 1658/30000 | Total reward = 53.28
2022-01-26 14:16:31.566 | DEBUG    | __main__:trials:24 - Trial = 1659/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.567 | DEBUG    | __main__:trials:29 - Trial = 1659/30000 | Total reward = 47.11
2022-01-26 14:16:31.571 | DEBUG    | __main__:trials:24 - Trial = 1660/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.572 | DEBUG    | __main__:trials:29 - Trial = 1660/30000 | Total reward = 53.01
2022-01-26 14:16:31.576 | DEBUG    | __main__:trials:24 - Trial = 1661/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.577 | DEBUG    | __main__:trials:29 - Trial = 1661/30000 | Total reward = 40.72
2022-01-26 14:16:31.581 | DEBUG    | __main__:trials:24 - Trial = 1662/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.582 | DEBUG    | __main__:trials:29 - Trial = 1662/30000 | Total reward = 34.06
2022-01-26 14:16:31.586 | DEBUG    | __main__:trials:24 - Trial = 1663/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.588 | DEBUG    | __main__:trials:29 - Trial = 1663/30000 | Total reward = 53.62
2022-01-26 14:16:31.591 | DEBUG    | __main__:trials:26 - Trial = 1664/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:31.592 | DEBUG    | __main__:trials:29 - Trial = 1664/30000 | Total reward = 12.26
2022-01-26 14:16:31.596 | DEBUG    | __main__:trials:24 - Trial = 1665/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.597 | DEBUG    | __main__:trials:29 - Trial = 1665/30000 | Total reward = 61.45
2022-01-26 14:16:31.601 | DEBUG    | __main__:trials:24 - Trial = 1666/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.602 | DEBUG    | __main__:trials:29 - Trial = 1666/30000 | Total reward = 54.04
2022-01-26 14:16:31.606 | DEBUG    | __main__:trials:24 - Trial = 1667/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.607 | DEBUG    | __main__:trials:29 - Trial = 1667/30000 | Total reward = 51.96
2022-01-26 14:16:31.612 | DEBUG    | __main__:trials:24 - Trial = 1668/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.613 | DEBUG    | __main__:trials:29 - Trial = 1668/30000 | Total reward = 50.36
2022-01-26 14:16:31.617 | DEBUG    | __main__:trials:24 - Trial = 1669/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.618 | DEBUG    | __main__:trials:29 - Trial = 1669/30000 | Total reward = 58.49
2022-01-26 14:16:31.622 | DEBUG    | __main__:trials:24 - Trial = 1670/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.622 | DEBUG    | __main__:trials:29 - Trial = 1670/30000 | Total reward = 54.24
2022-01-26 14:16:31.627 | DEBUG    | __main__:trials:24 - Trial = 1671/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.628 | DEBUG    | __main__:trials:29 - Trial = 1671/30000 | Total reward = 54.62
2022-01-26 14:16:31.632 | DEBUG    | __main__:trials:24 - Trial = 1672/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.634 | DEBUG    | __main__:trials:29 - Trial = 1672/30000 | Total reward = 55.71
2022-01-26 14:16:31.637 | DEBUG    | __main__:trials:24 - Trial = 1673/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.638 | DEBUG    | __main__:trials:29 - Trial = 1673/30000 | Total reward = 51.57
2022-01-26 14:16:31.643 | DEBUG    | __main__:trials:24 - Trial = 1674/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.644 | DEBUG    | __main__:trials:29 - Trial = 1674/30000 | Total reward = 55.17
2022-01-26 14:16:31.648 | DEBUG    | __main__:trials:24 - Trial = 1675/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.650 | DEBUG    | __main__:trials:29 - Trial = 1675/30000 | Total reward = 55.07
2022-01-26 14:16:31.653 | DEBUG    | __main__:trials:24 - Trial = 1676/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.654 | DEBUG    | __main__:trials:29 - Trial = 1676/30000 | Total reward = 54.53
2022-01-26 14:16:31.657 | DEBUG    | __main__:trials:24 - Trial = 1677/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.658 | DEBUG    | __main__:trials:29 - Trial = 1677/30000 | Total reward = 60.10
2022-01-26 14:16:31.662 | DEBUG    | __main__:trials:24 - Trial = 1678/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.664 | DEBUG    | __main__:trials:29 - Trial = 1678/30000 | Total reward = 36.03
2022-01-26 14:16:31.668 | DEBUG    | __main__:trials:24 - Trial = 1679/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.668 | DEBUG    | __main__:trials:29 - Trial = 1679/30000 | Total reward = 43.76
2022-01-26 14:16:31.673 | DEBUG    | __main__:trials:24 - Trial = 1680/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.674 | DEBUG    | __main__:trials:29 - Trial = 1680/30000 | Total reward = 45.91
2022-01-26 14:16:31.678 | DEBUG    | __main__:trials:24 - Trial = 1681/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.680 | DEBUG    | __main__:trials:29 - Trial = 1681/30000 | Total reward = 54.30
2022-01-26 14:16:31.684 | DEBUG    | __main__:trials:24 - Trial = 1682/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.684 | DEBUG    | __main__:trials:29 - Trial = 1682/30000 | Total reward = 47.37
2022-01-26 14:16:31.689 | DEBUG    | __main__:trials:24 - Trial = 1683/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.690 | DEBUG    | __main__:trials:29 - Trial = 1683/30000 | Total reward = 32.89
2022-01-26 14:16:31.694 | DEBUG    | __main__:trials:24 - Trial = 1684/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.695 | DEBUG    | __main__:trials:29 - Trial = 1684/30000 | Total reward = 42.25
2022-01-26 14:16:31.699 | DEBUG    | __main__:trials:24 - Trial = 1685/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.701 | DEBUG    | __main__:trials:29 - Trial = 1685/30000 | Total reward = 47.43
2022-01-26 14:16:31.704 | DEBUG    | __main__:trials:24 - Trial = 1686/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.706 | DEBUG    | __main__:trials:29 - Trial = 1686/30000 | Total reward = 54.11
2022-01-26 14:16:31.710 | DEBUG    | __main__:trials:24 - Trial = 1687/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.710 | DEBUG    | __main__:trials:29 - Trial = 1687/30000 | Total reward = 51.41
2022-01-26 14:16:31.715 | DEBUG    | __main__:trials:24 - Trial = 1688/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.716 | DEBUG    | __main__:trials:29 - Trial = 1688/30000 | Total reward = 54.24
2022-01-26 14:16:31.720 | DEBUG    | __main__:trials:24 - Trial = 1689/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.722 | DEBUG    | __main__:trials:29 - Trial = 1689/30000 | Total reward = 48.41
2022-01-26 14:16:31.726 | DEBUG    | __main__:trials:24 - Trial = 1690/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.727 | DEBUG    | __main__:trials:29 - Trial = 1690/30000 | Total reward = 50.66
2022-01-26 14:16:31.731 | DEBUG    | __main__:trials:24 - Trial = 1691/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.732 | DEBUG    | __main__:trials:29 - Trial = 1691/30000 | Total reward = 47.98
2022-01-26 14:16:31.735 | DEBUG    | __main__:trials:24 - Trial = 1692/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.737 | DEBUG    | __main__:trials:29 - Trial = 1692/30000 | Total reward = 48.40
2022-01-26 14:16:31.740 | DEBUG    | __main__:trials:24 - Trial = 1693/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.742 | DEBUG    | __main__:trials:29 - Trial = 1693/30000 | Total reward = 44.70
2022-01-26 14:16:31.746 | DEBUG    | __main__:trials:24 - Trial = 1694/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.746 | DEBUG    | __main__:trials:29 - Trial = 1694/30000 | Total reward = 63.11
2022-01-26 14:16:31.751 | DEBUG    | __main__:trials:24 - Trial = 1695/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.752 | DEBUG    | __main__:trials:29 - Trial = 1695/30000 | Total reward = 56.73
2022-01-26 14:16:31.756 | DEBUG    | __main__:trials:24 - Trial = 1696/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.757 | DEBUG    | __main__:trials:29 - Trial = 1696/30000 | Total reward = 46.02
2022-01-26 14:16:31.760 | DEBUG    | __main__:trials:24 - Trial = 1697/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.762 | DEBUG    | __main__:trials:29 - Trial = 1697/30000 | Total reward = 30.94
2022-01-26 14:16:31.766 | DEBUG    | __main__:trials:24 - Trial = 1698/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.767 | DEBUG    | __main__:trials:29 - Trial = 1698/30000 | Total reward = 35.90
2022-01-26 14:16:31.771 | DEBUG    | __main__:trials:24 - Trial = 1699/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.772 | DEBUG    | __main__:trials:29 - Trial = 1699/30000 | Total reward = 51.56
2022-01-26 14:16:31.776 | DEBUG    | __main__:trials:24 - Trial = 1700/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.778 | DEBUG    | __main__:trials:29 - Trial = 1700/30000 | Total reward = 48.47
2022-01-26 14:16:31.781 | DEBUG    | __main__:trials:24 - Trial = 1701/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.783 | DEBUG    | __main__:trials:29 - Trial = 1701/30000 | Total reward = 56.82
2022-01-26 14:16:31.786 | DEBUG    | __main__:trials:24 - Trial = 1702/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.788 | DEBUG    | __main__:trials:29 - Trial = 1702/30000 | Total reward = 48.76
2022-01-26 14:16:31.791 | DEBUG    | __main__:trials:24 - Trial = 1703/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.793 | DEBUG    | __main__:trials:29 - Trial = 1703/30000 | Total reward = 56.72
2022-01-26 14:16:31.796 | DEBUG    | __main__:trials:24 - Trial = 1704/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.797 | DEBUG    | __main__:trials:29 - Trial = 1704/30000 | Total reward = 44.88
2022-01-26 14:16:31.801 | DEBUG    | __main__:trials:24 - Trial = 1705/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.802 | DEBUG    | __main__:trials:29 - Trial = 1705/30000 | Total reward = 51.97
2022-01-26 14:16:31.805 | DEBUG    | __main__:trials:24 - Trial = 1706/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.807 | DEBUG    | __main__:trials:29 - Trial = 1706/30000 | Total reward = 40.12
2022-01-26 14:16:31.810 | DEBUG    | __main__:trials:24 - Trial = 1707/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.811 | DEBUG    | __main__:trials:29 - Trial = 1707/30000 | Total reward = 48.62
2022-01-26 14:16:31.814 | DEBUG    | __main__:trials:24 - Trial = 1708/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.815 | DEBUG    | __main__:trials:29 - Trial = 1708/30000 | Total reward = 55.07
2022-01-26 14:16:31.818 | DEBUG    | __main__:trials:24 - Trial = 1709/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.819 | DEBUG    | __main__:trials:29 - Trial = 1709/30000 | Total reward = 39.28
2022-01-26 14:16:31.822 | DEBUG    | __main__:trials:24 - Trial = 1710/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.825 | DEBUG    | __main__:trials:29 - Trial = 1710/30000 | Total reward = 44.25
2022-01-26 14:16:31.827 | DEBUG    | __main__:trials:24 - Trial = 1711/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.829 | DEBUG    | __main__:trials:29 - Trial = 1711/30000 | Total reward = 33.15
2022-01-26 14:16:31.832 | DEBUG    | __main__:trials:24 - Trial = 1712/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.833 | DEBUG    | __main__:trials:29 - Trial = 1712/30000 | Total reward = 51.70
2022-01-26 14:16:31.838 | DEBUG    | __main__:trials:24 - Trial = 1713/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.839 | DEBUG    | __main__:trials:29 - Trial = 1713/30000 | Total reward = 52.87
2022-01-26 14:16:31.842 | DEBUG    | __main__:trials:24 - Trial = 1714/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.843 | DEBUG    | __main__:trials:29 - Trial = 1714/30000 | Total reward = 53.89
2022-01-26 14:16:31.847 | DEBUG    | __main__:trials:24 - Trial = 1715/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.847 | DEBUG    | __main__:trials:29 - Trial = 1715/30000 | Total reward = 49.88
2022-01-26 14:16:31.851 | DEBUG    | __main__:trials:24 - Trial = 1716/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.851 | DEBUG    | __main__:trials:29 - Trial = 1716/30000 | Total reward = 52.15
2022-01-26 14:16:31.855 | DEBUG    | __main__:trials:24 - Trial = 1717/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.855 | DEBUG    | __main__:trials:29 - Trial = 1717/30000 | Total reward = 43.67
2022-01-26 14:16:31.859 | DEBUG    | __main__:trials:24 - Trial = 1718/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.859 | DEBUG    | __main__:trials:29 - Trial = 1718/30000 | Total reward = 56.66
2022-01-26 14:16:31.863 | DEBUG    | __main__:trials:24 - Trial = 1719/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.865 | DEBUG    | __main__:trials:29 - Trial = 1719/30000 | Total reward = 46.95
2022-01-26 14:16:31.868 | DEBUG    | __main__:trials:24 - Trial = 1720/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.869 | DEBUG    | __main__:trials:29 - Trial = 1720/30000 | Total reward = 47.96
2022-01-26 14:16:31.873 | DEBUG    | __main__:trials:24 - Trial = 1721/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.873 | DEBUG    | __main__:trials:29 - Trial = 1721/30000 | Total reward = 48.77
2022-01-26 14:16:31.877 | DEBUG    | __main__:trials:24 - Trial = 1722/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.878 | DEBUG    | __main__:trials:29 - Trial = 1722/30000 | Total reward = 46.67
2022-01-26 14:16:31.881 | DEBUG    | __main__:trials:24 - Trial = 1723/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.882 | DEBUG    | __main__:trials:29 - Trial = 1723/30000 | Total reward = 47.24
2022-01-26 14:16:31.885 | DEBUG    | __main__:trials:24 - Trial = 1724/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.886 | DEBUG    | __main__:trials:29 - Trial = 1724/30000 | Total reward = 46.84
2022-01-26 14:16:31.889 | DEBUG    | __main__:trials:24 - Trial = 1725/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.890 | DEBUG    | __main__:trials:29 - Trial = 1725/30000 | Total reward = 41.96
2022-01-26 14:16:31.893 | DEBUG    | __main__:trials:24 - Trial = 1726/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.895 | DEBUG    | __main__:trials:29 - Trial = 1726/30000 | Total reward = 56.53
2022-01-26 14:16:31.898 | DEBUG    | __main__:trials:24 - Trial = 1727/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.899 | DEBUG    | __main__:trials:29 - Trial = 1727/30000 | Total reward = 52.74
2022-01-26 14:16:31.903 | DEBUG    | __main__:trials:24 - Trial = 1728/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.904 | DEBUG    | __main__:trials:29 - Trial = 1728/30000 | Total reward = 48.44
2022-01-26 14:16:31.907 | DEBUG    | __main__:trials:24 - Trial = 1729/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.909 | DEBUG    | __main__:trials:29 - Trial = 1729/30000 | Total reward = 52.47
2022-01-26 14:16:31.912 | DEBUG    | __main__:trials:24 - Trial = 1730/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.913 | DEBUG    | __main__:trials:29 - Trial = 1730/30000 | Total reward = 59.37
2022-01-26 14:16:31.917 | DEBUG    | __main__:trials:24 - Trial = 1731/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.919 | DEBUG    | __main__:trials:29 - Trial = 1731/30000 | Total reward = 54.15
2022-01-26 14:16:31.922 | DEBUG    | __main__:trials:24 - Trial = 1732/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.923 | DEBUG    | __main__:trials:29 - Trial = 1732/30000 | Total reward = 53.37
2022-01-26 14:16:31.926 | DEBUG    | __main__:trials:24 - Trial = 1733/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.928 | DEBUG    | __main__:trials:29 - Trial = 1733/30000 | Total reward = 41.41
2022-01-26 14:16:31.931 | DEBUG    | __main__:trials:24 - Trial = 1734/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.933 | DEBUG    | __main__:trials:29 - Trial = 1734/30000 | Total reward = 41.03
2022-01-26 14:16:31.936 | DEBUG    | __main__:trials:24 - Trial = 1735/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.938 | DEBUG    | __main__:trials:29 - Trial = 1735/30000 | Total reward = 13.71
2022-01-26 14:16:31.942 | DEBUG    | __main__:trials:24 - Trial = 1736/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.943 | DEBUG    | __main__:trials:29 - Trial = 1736/30000 | Total reward = 52.14
2022-01-26 14:16:31.947 | DEBUG    | __main__:trials:24 - Trial = 1737/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.948 | DEBUG    | __main__:trials:29 - Trial = 1737/30000 | Total reward = 52.44
2022-01-26 14:16:31.951 | DEBUG    | __main__:trials:24 - Trial = 1738/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.953 | DEBUG    | __main__:trials:29 - Trial = 1738/30000 | Total reward = 48.42
2022-01-26 14:16:31.956 | DEBUG    | __main__:trials:24 - Trial = 1739/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.958 | DEBUG    | __main__:trials:29 - Trial = 1739/30000 | Total reward = 56.93
2022-01-26 14:16:31.962 | DEBUG    | __main__:trials:24 - Trial = 1740/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.963 | DEBUG    | __main__:trials:29 - Trial = 1740/30000 | Total reward = 47.81
2022-01-26 14:16:31.967 | DEBUG    | __main__:trials:24 - Trial = 1741/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.968 | DEBUG    | __main__:trials:29 - Trial = 1741/30000 | Total reward = 48.16
2022-01-26 14:16:31.972 | DEBUG    | __main__:trials:24 - Trial = 1742/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.974 | DEBUG    | __main__:trials:29 - Trial = 1742/30000 | Total reward = 54.24
2022-01-26 14:16:31.977 | DEBUG    | __main__:trials:24 - Trial = 1743/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.979 | DEBUG    | __main__:trials:29 - Trial = 1743/30000 | Total reward = 38.44
2022-01-26 14:16:31.983 | DEBUG    | __main__:trials:24 - Trial = 1744/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.984 | DEBUG    | __main__:trials:29 - Trial = 1744/30000 | Total reward = 48.79
2022-01-26 14:16:31.988 | DEBUG    | __main__:trials:24 - Trial = 1745/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.990 | DEBUG    | __main__:trials:29 - Trial = 1745/30000 | Total reward = 46.58
2022-01-26 14:16:31.993 | DEBUG    | __main__:trials:24 - Trial = 1746/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.995 | DEBUG    | __main__:trials:29 - Trial = 1746/30000 | Total reward = 48.16
2022-01-26 14:16:31.999 | DEBUG    | __main__:trials:24 - Trial = 1747/30000 | Max number of steps (20) reached
2022-01-26 14:16:31.999 | DEBUG    | __main__:trials:29 - Trial = 1747/30000 | Total reward = 58.19
2022-01-26 14:16:32.003 | DEBUG    | __main__:trials:24 - Trial = 1748/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.005 | DEBUG    | __main__:trials:29 - Trial = 1748/30000 | Total reward = 47.69
2022-01-26 14:16:32.008 | DEBUG    | __main__:trials:24 - Trial = 1749/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.010 | DEBUG    | __main__:trials:29 - Trial = 1749/30000 | Total reward = 33.51
2022-01-26 14:16:32.013 | DEBUG    | __main__:trials:24 - Trial = 1750/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.015 | DEBUG    | __main__:trials:29 - Trial = 1750/30000 | Total reward = 48.34
2022-01-26 14:16:32.019 | DEBUG    | __main__:trials:24 - Trial = 1751/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.019 | DEBUG    | __main__:trials:29 - Trial = 1751/30000 | Total reward = 48.34
2022-01-26 14:16:32.024 | DEBUG    | __main__:trials:24 - Trial = 1752/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.024 | DEBUG    | __main__:trials:29 - Trial = 1752/30000 | Total reward = 53.88
2022-01-26 14:16:32.029 | DEBUG    | __main__:trials:24 - Trial = 1753/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.030 | DEBUG    | __main__:trials:29 - Trial = 1753/30000 | Total reward = 46.62
2022-01-26 14:16:32.033 | DEBUG    | __main__:trials:26 - Trial = 1754/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.034 | DEBUG    | __main__:trials:29 - Trial = 1754/30000 | Total reward = 24.54
2022-01-26 14:16:32.037 | DEBUG    | __main__:trials:24 - Trial = 1755/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.038 | DEBUG    | __main__:trials:29 - Trial = 1755/30000 | Total reward = 35.16
2022-01-26 14:16:32.041 | DEBUG    | __main__:trials:24 - Trial = 1756/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.043 | DEBUG    | __main__:trials:29 - Trial = 1756/30000 | Total reward = 49.06
2022-01-26 14:16:32.046 | DEBUG    | __main__:trials:24 - Trial = 1757/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.046 | DEBUG    | __main__:trials:29 - Trial = 1757/30000 | Total reward = 42.00
2022-01-26 14:16:32.049 | DEBUG    | __main__:trials:24 - Trial = 1758/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.051 | DEBUG    | __main__:trials:29 - Trial = 1758/30000 | Total reward = 47.44
2022-01-26 14:16:32.055 | DEBUG    | __main__:trials:24 - Trial = 1759/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.056 | DEBUG    | __main__:trials:29 - Trial = 1759/30000 | Total reward = 35.29
2022-01-26 14:16:32.060 | DEBUG    | __main__:trials:24 - Trial = 1760/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.061 | DEBUG    | __main__:trials:29 - Trial = 1760/30000 | Total reward = 28.66
2022-01-26 14:16:32.065 | DEBUG    | __main__:trials:24 - Trial = 1761/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.066 | DEBUG    | __main__:trials:29 - Trial = 1761/30000 | Total reward = 54.61
2022-01-26 14:16:32.070 | DEBUG    | __main__:trials:24 - Trial = 1762/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.071 | DEBUG    | __main__:trials:29 - Trial = 1762/30000 | Total reward = 47.17
2022-01-26 14:16:32.074 | DEBUG    | __main__:trials:24 - Trial = 1763/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.076 | DEBUG    | __main__:trials:29 - Trial = 1763/30000 | Total reward = 45.36
2022-01-26 14:16:32.079 | DEBUG    | __main__:trials:24 - Trial = 1764/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.080 | DEBUG    | __main__:trials:29 - Trial = 1764/30000 | Total reward = 48.21
2022-01-26 14:16:32.084 | DEBUG    | __main__:trials:24 - Trial = 1765/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.086 | DEBUG    | __main__:trials:29 - Trial = 1765/30000 | Total reward = 43.42
2022-01-26 14:16:32.089 | DEBUG    | __main__:trials:24 - Trial = 1766/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.090 | DEBUG    | __main__:trials:29 - Trial = 1766/30000 | Total reward = 46.82
2022-01-26 14:16:32.094 | DEBUG    | __main__:trials:24 - Trial = 1767/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.096 | DEBUG    | __main__:trials:29 - Trial = 1767/30000 | Total reward = 49.52
2022-01-26 14:16:32.099 | DEBUG    | __main__:trials:24 - Trial = 1768/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.100 | DEBUG    | __main__:trials:29 - Trial = 1768/30000 | Total reward = 58.36
2022-01-26 14:16:32.105 | DEBUG    | __main__:trials:24 - Trial = 1769/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.106 | DEBUG    | __main__:trials:29 - Trial = 1769/30000 | Total reward = 52.30
2022-01-26 14:16:32.110 | DEBUG    | __main__:trials:26 - Trial = 1770/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.111 | DEBUG    | __main__:trials:29 - Trial = 1770/30000 | Total reward = 44.38
2022-01-26 14:16:32.115 | DEBUG    | __main__:trials:24 - Trial = 1771/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.117 | DEBUG    | __main__:trials:29 - Trial = 1771/30000 | Total reward = 51.90
2022-01-26 14:16:32.120 | DEBUG    | __main__:trials:24 - Trial = 1772/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.122 | DEBUG    | __main__:trials:29 - Trial = 1772/30000 | Total reward = 46.97
2022-01-26 14:16:32.125 | DEBUG    | __main__:trials:24 - Trial = 1773/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.127 | DEBUG    | __main__:trials:29 - Trial = 1773/30000 | Total reward = 43.00
2022-01-26 14:16:32.130 | DEBUG    | __main__:trials:24 - Trial = 1774/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.131 | DEBUG    | __main__:trials:29 - Trial = 1774/30000 | Total reward = 50.17
2022-01-26 14:16:32.134 | DEBUG    | __main__:trials:24 - Trial = 1775/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.136 | DEBUG    | __main__:trials:29 - Trial = 1775/30000 | Total reward = 56.01
2022-01-26 14:16:32.140 | DEBUG    | __main__:trials:26 - Trial = 1776/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.140 | DEBUG    | __main__:trials:29 - Trial = 1776/30000 | Total reward = 31.85
2022-01-26 14:16:32.145 | DEBUG    | __main__:trials:24 - Trial = 1777/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.146 | DEBUG    | __main__:trials:29 - Trial = 1777/30000 | Total reward = 49.56
2022-01-26 14:16:32.150 | DEBUG    | __main__:trials:24 - Trial = 1778/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.151 | DEBUG    | __main__:trials:29 - Trial = 1778/30000 | Total reward = 48.70
2022-01-26 14:16:32.155 | DEBUG    | __main__:trials:24 - Trial = 1779/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.157 | DEBUG    | __main__:trials:29 - Trial = 1779/30000 | Total reward = 61.16
2022-01-26 14:16:32.160 | DEBUG    | __main__:trials:24 - Trial = 1780/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.162 | DEBUG    | __main__:trials:29 - Trial = 1780/30000 | Total reward = 47.99
2022-01-26 14:16:32.165 | DEBUG    | __main__:trials:24 - Trial = 1781/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.167 | DEBUG    | __main__:trials:29 - Trial = 1781/30000 | Total reward = 45.94
2022-01-26 14:16:32.170 | DEBUG    | __main__:trials:24 - Trial = 1782/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.172 | DEBUG    | __main__:trials:29 - Trial = 1782/30000 | Total reward = 53.15
2022-01-26 14:16:32.175 | DEBUG    | __main__:trials:24 - Trial = 1783/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.176 | DEBUG    | __main__:trials:29 - Trial = 1783/30000 | Total reward = 51.50
2022-01-26 14:16:32.180 | DEBUG    | __main__:trials:24 - Trial = 1784/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.182 | DEBUG    | __main__:trials:29 - Trial = 1784/30000 | Total reward = 31.38
2022-01-26 14:16:32.184 | DEBUG    | __main__:trials:26 - Trial = 1785/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.185 | DEBUG    | __main__:trials:29 - Trial = 1785/30000 | Total reward = 8.47
2022-01-26 14:16:32.189 | DEBUG    | __main__:trials:24 - Trial = 1786/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.191 | DEBUG    | __main__:trials:29 - Trial = 1786/30000 | Total reward = 45.84
2022-01-26 14:16:32.194 | DEBUG    | __main__:trials:24 - Trial = 1787/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.195 | DEBUG    | __main__:trials:29 - Trial = 1787/30000 | Total reward = 53.43
2022-01-26 14:16:32.200 | DEBUG    | __main__:trials:24 - Trial = 1788/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.201 | DEBUG    | __main__:trials:29 - Trial = 1788/30000 | Total reward = 48.22
2022-01-26 14:16:32.205 | DEBUG    | __main__:trials:24 - Trial = 1789/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.206 | DEBUG    | __main__:trials:29 - Trial = 1789/30000 | Total reward = 46.15
2022-01-26 14:16:32.209 | DEBUG    | __main__:trials:24 - Trial = 1790/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.210 | DEBUG    | __main__:trials:29 - Trial = 1790/30000 | Total reward = 43.61
2022-01-26 14:16:32.213 | DEBUG    | __main__:trials:26 - Trial = 1791/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.214 | DEBUG    | __main__:trials:29 - Trial = 1791/30000 | Total reward = 31.14
2022-01-26 14:16:32.217 | DEBUG    | __main__:trials:24 - Trial = 1792/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.219 | DEBUG    | __main__:trials:29 - Trial = 1792/30000 | Total reward = 28.72
2022-01-26 14:16:32.222 | DEBUG    | __main__:trials:24 - Trial = 1793/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.223 | DEBUG    | __main__:trials:29 - Trial = 1793/30000 | Total reward = 51.30
2022-01-26 14:16:32.226 | DEBUG    | __main__:trials:24 - Trial = 1794/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.228 | DEBUG    | __main__:trials:29 - Trial = 1794/30000 | Total reward = 46.75
2022-01-26 14:16:32.231 | DEBUG    | __main__:trials:24 - Trial = 1795/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.233 | DEBUG    | __main__:trials:29 - Trial = 1795/30000 | Total reward = 42.69
2022-01-26 14:16:32.236 | DEBUG    | __main__:trials:24 - Trial = 1796/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.237 | DEBUG    | __main__:trials:29 - Trial = 1796/30000 | Total reward = 49.62
2022-01-26 14:16:32.241 | DEBUG    | __main__:trials:24 - Trial = 1797/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.243 | DEBUG    | __main__:trials:29 - Trial = 1797/30000 | Total reward = 46.95
2022-01-26 14:16:32.246 | DEBUG    | __main__:trials:24 - Trial = 1798/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.248 | DEBUG    | __main__:trials:29 - Trial = 1798/30000 | Total reward = 47.67
2022-01-26 14:16:32.251 | DEBUG    | __main__:trials:24 - Trial = 1799/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.252 | DEBUG    | __main__:trials:29 - Trial = 1799/30000 | Total reward = 20.80
2022-01-26 14:16:32.255 | DEBUG    | __main__:trials:24 - Trial = 1800/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.257 | DEBUG    | __main__:trials:29 - Trial = 1800/30000 | Total reward = 46.21
2022-01-26 14:16:32.260 | DEBUG    | __main__:trials:24 - Trial = 1801/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.261 | DEBUG    | __main__:trials:29 - Trial = 1801/30000 | Total reward = 52.12
2022-01-26 14:16:32.265 | DEBUG    | __main__:trials:24 - Trial = 1802/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.266 | DEBUG    | __main__:trials:29 - Trial = 1802/30000 | Total reward = 47.14
2022-01-26 14:16:32.270 | DEBUG    | __main__:trials:24 - Trial = 1803/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.271 | DEBUG    | __main__:trials:29 - Trial = 1803/30000 | Total reward = 60.38
2022-01-26 14:16:32.275 | DEBUG    | __main__:trials:24 - Trial = 1804/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.277 | DEBUG    | __main__:trials:29 - Trial = 1804/30000 | Total reward = 38.53
2022-01-26 14:16:32.280 | DEBUG    | __main__:trials:24 - Trial = 1805/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.282 | DEBUG    | __main__:trials:29 - Trial = 1805/30000 | Total reward = 48.73
2022-01-26 14:16:32.285 | DEBUG    | __main__:trials:24 - Trial = 1806/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.286 | DEBUG    | __main__:trials:29 - Trial = 1806/30000 | Total reward = 54.97
2022-01-26 14:16:32.290 | DEBUG    | __main__:trials:24 - Trial = 1807/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.292 | DEBUG    | __main__:trials:29 - Trial = 1807/30000 | Total reward = 61.58
2022-01-26 14:16:32.296 | DEBUG    | __main__:trials:24 - Trial = 1808/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.297 | DEBUG    | __main__:trials:29 - Trial = 1808/30000 | Total reward = 58.25
2022-01-26 14:16:32.300 | DEBUG    | __main__:trials:26 - Trial = 1809/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.302 | DEBUG    | __main__:trials:29 - Trial = 1809/30000 | Total reward = 27.38
2022-01-26 14:16:32.305 | DEBUG    | __main__:trials:24 - Trial = 1810/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.307 | DEBUG    | __main__:trials:29 - Trial = 1810/30000 | Total reward = 53.89
2022-01-26 14:16:32.310 | DEBUG    | __main__:trials:26 - Trial = 1811/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.311 | DEBUG    | __main__:trials:29 - Trial = 1811/30000 | Total reward = 33.26
2022-01-26 14:16:32.315 | DEBUG    | __main__:trials:24 - Trial = 1812/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.316 | DEBUG    | __main__:trials:29 - Trial = 1812/30000 | Total reward = 45.41
2022-01-26 14:16:32.320 | DEBUG    | __main__:trials:24 - Trial = 1813/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.321 | DEBUG    | __main__:trials:29 - Trial = 1813/30000 | Total reward = 51.46
2022-01-26 14:16:32.325 | DEBUG    | __main__:trials:24 - Trial = 1814/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.326 | DEBUG    | __main__:trials:29 - Trial = 1814/30000 | Total reward = 54.44
2022-01-26 14:16:32.329 | DEBUG    | __main__:trials:24 - Trial = 1815/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.330 | DEBUG    | __main__:trials:29 - Trial = 1815/30000 | Total reward = 39.69
2022-01-26 14:16:32.334 | DEBUG    | __main__:trials:24 - Trial = 1816/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.335 | DEBUG    | __main__:trials:29 - Trial = 1816/30000 | Total reward = 52.52
2022-01-26 14:16:32.339 | DEBUG    | __main__:trials:24 - Trial = 1817/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.340 | DEBUG    | __main__:trials:29 - Trial = 1817/30000 | Total reward = 54.23
2022-01-26 14:16:32.344 | DEBUG    | __main__:trials:24 - Trial = 1818/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.345 | DEBUG    | __main__:trials:29 - Trial = 1818/30000 | Total reward = 59.53
2022-01-26 14:16:32.349 | DEBUG    | __main__:trials:24 - Trial = 1819/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.351 | DEBUG    | __main__:trials:29 - Trial = 1819/30000 | Total reward = 51.50
2022-01-26 14:16:32.354 | DEBUG    | __main__:trials:24 - Trial = 1820/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.356 | DEBUG    | __main__:trials:29 - Trial = 1820/30000 | Total reward = 56.90
2022-01-26 14:16:32.359 | DEBUG    | __main__:trials:24 - Trial = 1821/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.360 | DEBUG    | __main__:trials:29 - Trial = 1821/30000 | Total reward = 48.16
2022-01-26 14:16:32.364 | DEBUG    | __main__:trials:24 - Trial = 1822/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.365 | DEBUG    | __main__:trials:29 - Trial = 1822/30000 | Total reward = 55.00
2022-01-26 14:16:32.369 | DEBUG    | __main__:trials:24 - Trial = 1823/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.370 | DEBUG    | __main__:trials:29 - Trial = 1823/30000 | Total reward = 50.19
2022-01-26 14:16:32.373 | DEBUG    | __main__:trials:24 - Trial = 1824/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.375 | DEBUG    | __main__:trials:29 - Trial = 1824/30000 | Total reward = 45.76
2022-01-26 14:16:32.378 | DEBUG    | __main__:trials:24 - Trial = 1825/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.379 | DEBUG    | __main__:trials:29 - Trial = 1825/30000 | Total reward = 52.04
2022-01-26 14:16:32.383 | DEBUG    | __main__:trials:24 - Trial = 1826/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.385 | DEBUG    | __main__:trials:29 - Trial = 1826/30000 | Total reward = 47.65
2022-01-26 14:16:32.388 | DEBUG    | __main__:trials:26 - Trial = 1827/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.390 | DEBUG    | __main__:trials:29 - Trial = 1827/30000 | Total reward = 34.88
2022-01-26 14:16:32.393 | DEBUG    | __main__:trials:24 - Trial = 1828/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.394 | DEBUG    | __main__:trials:29 - Trial = 1828/30000 | Total reward = 51.25
2022-01-26 14:16:32.399 | DEBUG    | __main__:trials:24 - Trial = 1829/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.399 | DEBUG    | __main__:trials:29 - Trial = 1829/30000 | Total reward = 47.07
2022-01-26 14:16:32.404 | DEBUG    | __main__:trials:24 - Trial = 1830/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.405 | DEBUG    | __main__:trials:29 - Trial = 1830/30000 | Total reward = 53.53
2022-01-26 14:16:32.408 | DEBUG    | __main__:trials:24 - Trial = 1831/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.410 | DEBUG    | __main__:trials:29 - Trial = 1831/30000 | Total reward = 45.78
2022-01-26 14:16:32.413 | DEBUG    | __main__:trials:26 - Trial = 1832/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.414 | DEBUG    | __main__:trials:29 - Trial = 1832/30000 | Total reward = 31.99
2022-01-26 14:16:32.418 | DEBUG    | __main__:trials:24 - Trial = 1833/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.419 | DEBUG    | __main__:trials:29 - Trial = 1833/30000 | Total reward = 49.83
2022-01-26 14:16:32.423 | DEBUG    | __main__:trials:24 - Trial = 1834/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.423 | DEBUG    | __main__:trials:29 - Trial = 1834/30000 | Total reward = 51.81
2022-01-26 14:16:32.427 | DEBUG    | __main__:trials:24 - Trial = 1835/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.429 | DEBUG    | __main__:trials:29 - Trial = 1835/30000 | Total reward = 51.81
2022-01-26 14:16:32.432 | DEBUG    | __main__:trials:24 - Trial = 1836/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.433 | DEBUG    | __main__:trials:29 - Trial = 1836/30000 | Total reward = 45.66
2022-01-26 14:16:32.437 | DEBUG    | __main__:trials:24 - Trial = 1837/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.438 | DEBUG    | __main__:trials:29 - Trial = 1837/30000 | Total reward = 53.01
2022-01-26 14:16:32.441 | DEBUG    | __main__:trials:24 - Trial = 1838/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.442 | DEBUG    | __main__:trials:29 - Trial = 1838/30000 | Total reward = 56.75
2022-01-26 14:16:32.446 | DEBUG    | __main__:trials:24 - Trial = 1839/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.447 | DEBUG    | __main__:trials:29 - Trial = 1839/30000 | Total reward = 55.33
2022-01-26 14:16:32.451 | DEBUG    | __main__:trials:24 - Trial = 1840/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.452 | DEBUG    | __main__:trials:29 - Trial = 1840/30000 | Total reward = 38.14
2022-01-26 14:16:32.456 | DEBUG    | __main__:trials:24 - Trial = 1841/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.457 | DEBUG    | __main__:trials:29 - Trial = 1841/30000 | Total reward = 55.95
2022-01-26 14:16:32.460 | DEBUG    | __main__:trials:24 - Trial = 1842/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.462 | DEBUG    | __main__:trials:29 - Trial = 1842/30000 | Total reward = 55.82
2022-01-26 14:16:32.466 | DEBUG    | __main__:trials:24 - Trial = 1843/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.467 | DEBUG    | __main__:trials:29 - Trial = 1843/30000 | Total reward = 59.24
2022-01-26 14:16:32.471 | DEBUG    | __main__:trials:24 - Trial = 1844/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.472 | DEBUG    | __main__:trials:29 - Trial = 1844/30000 | Total reward = 47.57
2022-01-26 14:16:32.475 | DEBUG    | __main__:trials:26 - Trial = 1845/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.476 | DEBUG    | __main__:trials:29 - Trial = 1845/30000 | Total reward = 10.73
2022-01-26 14:16:32.479 | DEBUG    | __main__:trials:26 - Trial = 1846/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.481 | DEBUG    | __main__:trials:29 - Trial = 1846/30000 | Total reward = 38.72
2022-01-26 14:16:32.484 | DEBUG    | __main__:trials:24 - Trial = 1847/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.486 | DEBUG    | __main__:trials:29 - Trial = 1847/30000 | Total reward = 45.58
2022-01-26 14:16:32.489 | DEBUG    | __main__:trials:24 - Trial = 1848/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.491 | DEBUG    | __main__:trials:29 - Trial = 1848/30000 | Total reward = 46.46
2022-01-26 14:16:32.495 | DEBUG    | __main__:trials:24 - Trial = 1849/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.495 | DEBUG    | __main__:trials:29 - Trial = 1849/30000 | Total reward = 52.25
2022-01-26 14:16:32.500 | DEBUG    | __main__:trials:24 - Trial = 1850/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.501 | DEBUG    | __main__:trials:29 - Trial = 1850/30000 | Total reward = 44.90
2022-01-26 14:16:32.505 | DEBUG    | __main__:trials:24 - Trial = 1851/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.505 | DEBUG    | __main__:trials:29 - Trial = 1851/30000 | Total reward = 51.58
2022-01-26 14:16:32.509 | DEBUG    | __main__:trials:24 - Trial = 1852/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.510 | DEBUG    | __main__:trials:29 - Trial = 1852/30000 | Total reward = 36.72
2022-01-26 14:16:32.514 | DEBUG    | __main__:trials:24 - Trial = 1853/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.516 | DEBUG    | __main__:trials:29 - Trial = 1853/30000 | Total reward = 52.53
2022-01-26 14:16:32.519 | DEBUG    | __main__:trials:24 - Trial = 1854/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.519 | DEBUG    | __main__:trials:29 - Trial = 1854/30000 | Total reward = 55.19
2022-01-26 14:16:32.522 | DEBUG    | __main__:trials:26 - Trial = 1855/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.524 | DEBUG    | __main__:trials:29 - Trial = 1855/30000 | Total reward = 18.24
2022-01-26 14:16:32.527 | DEBUG    | __main__:trials:24 - Trial = 1856/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.528 | DEBUG    | __main__:trials:29 - Trial = 1856/30000 | Total reward = 51.75
2022-01-26 14:16:32.532 | DEBUG    | __main__:trials:24 - Trial = 1857/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.533 | DEBUG    | __main__:trials:29 - Trial = 1857/30000 | Total reward = 50.83
2022-01-26 14:16:32.537 | DEBUG    | __main__:trials:24 - Trial = 1858/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.539 | DEBUG    | __main__:trials:29 - Trial = 1858/30000 | Total reward = 50.56
2022-01-26 14:16:32.542 | DEBUG    | __main__:trials:24 - Trial = 1859/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.543 | DEBUG    | __main__:trials:29 - Trial = 1859/30000 | Total reward = 48.33
2022-01-26 14:16:32.547 | DEBUG    | __main__:trials:24 - Trial = 1860/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.548 | DEBUG    | __main__:trials:29 - Trial = 1860/30000 | Total reward = 44.67
2022-01-26 14:16:32.552 | DEBUG    | __main__:trials:24 - Trial = 1861/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.554 | DEBUG    | __main__:trials:29 - Trial = 1861/30000 | Total reward = 51.56
2022-01-26 14:16:32.557 | DEBUG    | __main__:trials:24 - Trial = 1862/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.559 | DEBUG    | __main__:trials:29 - Trial = 1862/30000 | Total reward = 56.01
2022-01-26 14:16:32.562 | DEBUG    | __main__:trials:24 - Trial = 1863/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.564 | DEBUG    | __main__:trials:29 - Trial = 1863/30000 | Total reward = 50.17
2022-01-26 14:16:32.568 | DEBUG    | __main__:trials:24 - Trial = 1864/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.569 | DEBUG    | __main__:trials:29 - Trial = 1864/30000 | Total reward = 44.33
2022-01-26 14:16:32.573 | DEBUG    | __main__:trials:26 - Trial = 1865/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.573 | DEBUG    | __main__:trials:29 - Trial = 1865/30000 | Total reward = 36.33
2022-01-26 14:16:32.577 | DEBUG    | __main__:trials:26 - Trial = 1866/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.577 | DEBUG    | __main__:trials:29 - Trial = 1866/30000 | Total reward = 34.88
2022-01-26 14:16:32.582 | DEBUG    | __main__:trials:24 - Trial = 1867/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.583 | DEBUG    | __main__:trials:29 - Trial = 1867/30000 | Total reward = 49.43
2022-01-26 14:16:32.587 | DEBUG    | __main__:trials:24 - Trial = 1868/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.589 | DEBUG    | __main__:trials:29 - Trial = 1868/30000 | Total reward = 36.36
2022-01-26 14:16:32.592 | DEBUG    | __main__:trials:24 - Trial = 1869/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.594 | DEBUG    | __main__:trials:29 - Trial = 1869/30000 | Total reward = 52.30
2022-01-26 14:16:32.597 | DEBUG    | __main__:trials:26 - Trial = 1870/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.599 | DEBUG    | __main__:trials:29 - Trial = 1870/30000 | Total reward = 38.44
2022-01-26 14:16:32.601 | DEBUG    | __main__:trials:24 - Trial = 1871/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.603 | DEBUG    | __main__:trials:29 - Trial = 1871/30000 | Total reward = 47.98
2022-01-26 14:16:32.607 | DEBUG    | __main__:trials:24 - Trial = 1872/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.608 | DEBUG    | __main__:trials:29 - Trial = 1872/30000 | Total reward = 35.67
2022-01-26 14:16:32.612 | DEBUG    | __main__:trials:24 - Trial = 1873/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.613 | DEBUG    | __main__:trials:29 - Trial = 1873/30000 | Total reward = 49.49
2022-01-26 14:16:32.617 | DEBUG    | __main__:trials:24 - Trial = 1874/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.618 | DEBUG    | __main__:trials:29 - Trial = 1874/30000 | Total reward = 44.69
2022-01-26 14:16:32.621 | DEBUG    | __main__:trials:24 - Trial = 1875/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.622 | DEBUG    | __main__:trials:29 - Trial = 1875/30000 | Total reward = 53.39
2022-01-26 14:16:32.626 | DEBUG    | __main__:trials:24 - Trial = 1876/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.627 | DEBUG    | __main__:trials:29 - Trial = 1876/30000 | Total reward = 47.08
2022-01-26 14:16:32.631 | DEBUG    | __main__:trials:24 - Trial = 1877/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.633 | DEBUG    | __main__:trials:29 - Trial = 1877/30000 | Total reward = 50.17
2022-01-26 14:16:32.636 | DEBUG    | __main__:trials:24 - Trial = 1878/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.637 | DEBUG    | __main__:trials:29 - Trial = 1878/30000 | Total reward = 57.98
2022-01-26 14:16:32.641 | DEBUG    | __main__:trials:24 - Trial = 1879/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.642 | DEBUG    | __main__:trials:29 - Trial = 1879/30000 | Total reward = 37.65
2022-01-26 14:16:32.646 | DEBUG    | __main__:trials:24 - Trial = 1880/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.648 | DEBUG    | __main__:trials:29 - Trial = 1880/30000 | Total reward = 50.28
2022-01-26 14:16:32.651 | DEBUG    | __main__:trials:24 - Trial = 1881/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.652 | DEBUG    | __main__:trials:29 - Trial = 1881/30000 | Total reward = 38.98
2022-01-26 14:16:32.656 | DEBUG    | __main__:trials:24 - Trial = 1882/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.657 | DEBUG    | __main__:trials:29 - Trial = 1882/30000 | Total reward = 56.21
2022-01-26 14:16:32.660 | DEBUG    | __main__:trials:24 - Trial = 1883/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.662 | DEBUG    | __main__:trials:29 - Trial = 1883/30000 | Total reward = 51.00
2022-01-26 14:16:32.665 | DEBUG    | __main__:trials:24 - Trial = 1884/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.666 | DEBUG    | __main__:trials:29 - Trial = 1884/30000 | Total reward = 49.91
2022-01-26 14:16:32.670 | DEBUG    | __main__:trials:24 - Trial = 1885/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.671 | DEBUG    | __main__:trials:29 - Trial = 1885/30000 | Total reward = 47.44
2022-01-26 14:16:32.674 | DEBUG    | __main__:trials:24 - Trial = 1886/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.675 | DEBUG    | __main__:trials:29 - Trial = 1886/30000 | Total reward = 50.03
2022-01-26 14:16:32.678 | DEBUG    | __main__:trials:26 - Trial = 1887/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.679 | DEBUG    | __main__:trials:29 - Trial = 1887/30000 | Total reward = 16.90
2022-01-26 14:16:32.683 | DEBUG    | __main__:trials:24 - Trial = 1888/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.684 | DEBUG    | __main__:trials:29 - Trial = 1888/30000 | Total reward = 48.94
2022-01-26 14:16:32.687 | DEBUG    | __main__:trials:26 - Trial = 1889/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.689 | DEBUG    | __main__:trials:29 - Trial = 1889/30000 | Total reward = 16.07
2022-01-26 14:16:32.692 | DEBUG    | __main__:trials:24 - Trial = 1890/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.694 | DEBUG    | __main__:trials:29 - Trial = 1890/30000 | Total reward = 50.17
2022-01-26 14:16:32.697 | DEBUG    | __main__:trials:24 - Trial = 1891/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.698 | DEBUG    | __main__:trials:29 - Trial = 1891/30000 | Total reward = 49.73
2022-01-26 14:16:32.702 | DEBUG    | __main__:trials:24 - Trial = 1892/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.703 | DEBUG    | __main__:trials:29 - Trial = 1892/30000 | Total reward = 51.53
2022-01-26 14:16:32.706 | DEBUG    | __main__:trials:26 - Trial = 1893/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.708 | DEBUG    | __main__:trials:29 - Trial = 1893/30000 | Total reward = 18.69
2022-01-26 14:16:32.712 | DEBUG    | __main__:trials:24 - Trial = 1894/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.712 | DEBUG    | __main__:trials:29 - Trial = 1894/30000 | Total reward = 22.80
2022-01-26 14:16:32.717 | DEBUG    | __main__:trials:24 - Trial = 1895/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.718 | DEBUG    | __main__:trials:29 - Trial = 1895/30000 | Total reward = 49.62
2022-01-26 14:16:32.722 | DEBUG    | __main__:trials:24 - Trial = 1896/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.723 | DEBUG    | __main__:trials:29 - Trial = 1896/30000 | Total reward = 46.31
2022-01-26 14:16:32.727 | DEBUG    | __main__:trials:24 - Trial = 1897/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.728 | DEBUG    | __main__:trials:29 - Trial = 1897/30000 | Total reward = 51.54
2022-01-26 14:16:32.731 | DEBUG    | __main__:trials:24 - Trial = 1898/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.733 | DEBUG    | __main__:trials:29 - Trial = 1898/30000 | Total reward = 51.04
2022-01-26 14:16:32.736 | DEBUG    | __main__:trials:24 - Trial = 1899/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.737 | DEBUG    | __main__:trials:29 - Trial = 1899/30000 | Total reward = 40.99
2022-01-26 14:16:32.740 | DEBUG    | __main__:trials:24 - Trial = 1900/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.742 | DEBUG    | __main__:trials:29 - Trial = 1900/30000 | Total reward = 50.47
2022-01-26 14:16:32.745 | DEBUG    | __main__:trials:24 - Trial = 1901/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.747 | DEBUG    | __main__:trials:29 - Trial = 1901/30000 | Total reward = 44.39
2022-01-26 14:16:32.749 | DEBUG    | __main__:trials:24 - Trial = 1902/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.750 | DEBUG    | __main__:trials:29 - Trial = 1902/30000 | Total reward = 50.62
2022-01-26 14:16:32.754 | DEBUG    | __main__:trials:24 - Trial = 1903/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.755 | DEBUG    | __main__:trials:29 - Trial = 1903/30000 | Total reward = 54.88
2022-01-26 14:16:32.759 | DEBUG    | __main__:trials:24 - Trial = 1904/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.761 | DEBUG    | __main__:trials:29 - Trial = 1904/30000 | Total reward = 41.76
2022-01-26 14:16:32.764 | DEBUG    | __main__:trials:24 - Trial = 1905/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.766 | DEBUG    | __main__:trials:29 - Trial = 1905/30000 | Total reward = 48.83
2022-01-26 14:16:32.770 | DEBUG    | __main__:trials:24 - Trial = 1906/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.771 | DEBUG    | __main__:trials:29 - Trial = 1906/30000 | Total reward = 45.99
2022-01-26 14:16:32.775 | DEBUG    | __main__:trials:24 - Trial = 1907/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.776 | DEBUG    | __main__:trials:29 - Trial = 1907/30000 | Total reward = 49.04
2022-01-26 14:16:32.779 | DEBUG    | __main__:trials:26 - Trial = 1908/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.781 | DEBUG    | __main__:trials:29 - Trial = 1908/30000 | Total reward = 20.60
2022-01-26 14:16:32.784 | DEBUG    | __main__:trials:26 - Trial = 1909/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.785 | DEBUG    | __main__:trials:29 - Trial = 1909/30000 | Total reward = 22.23
2022-01-26 14:16:32.789 | DEBUG    | __main__:trials:24 - Trial = 1910/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.791 | DEBUG    | __main__:trials:29 - Trial = 1910/30000 | Total reward = 47.85
2022-01-26 14:16:32.795 | DEBUG    | __main__:trials:24 - Trial = 1911/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.795 | DEBUG    | __main__:trials:29 - Trial = 1911/30000 | Total reward = 46.39
2022-01-26 14:16:32.800 | DEBUG    | __main__:trials:24 - Trial = 1912/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.801 | DEBUG    | __main__:trials:29 - Trial = 1912/30000 | Total reward = 50.24
2022-01-26 14:16:32.804 | DEBUG    | __main__:trials:24 - Trial = 1913/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.806 | DEBUG    | __main__:trials:29 - Trial = 1913/30000 | Total reward = 50.17
2022-01-26 14:16:32.810 | DEBUG    | __main__:trials:24 - Trial = 1914/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.810 | DEBUG    | __main__:trials:29 - Trial = 1914/30000 | Total reward = 53.12
2022-01-26 14:16:32.815 | DEBUG    | __main__:trials:24 - Trial = 1915/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.817 | DEBUG    | __main__:trials:29 - Trial = 1915/30000 | Total reward = 42.10
2022-01-26 14:16:32.820 | DEBUG    | __main__:trials:24 - Trial = 1916/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.822 | DEBUG    | __main__:trials:29 - Trial = 1916/30000 | Total reward = 35.80
2022-01-26 14:16:32.826 | DEBUG    | __main__:trials:24 - Trial = 1917/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.827 | DEBUG    | __main__:trials:29 - Trial = 1917/30000 | Total reward = 50.71
2022-01-26 14:16:32.831 | DEBUG    | __main__:trials:24 - Trial = 1918/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.832 | DEBUG    | __main__:trials:29 - Trial = 1918/30000 | Total reward = 48.31
2022-01-26 14:16:32.836 | DEBUG    | __main__:trials:24 - Trial = 1919/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.838 | DEBUG    | __main__:trials:29 - Trial = 1919/30000 | Total reward = 50.17
2022-01-26 14:16:32.841 | DEBUG    | __main__:trials:24 - Trial = 1920/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.842 | DEBUG    | __main__:trials:29 - Trial = 1920/30000 | Total reward = 49.19
2022-01-26 14:16:32.846 | DEBUG    | __main__:trials:24 - Trial = 1921/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.848 | DEBUG    | __main__:trials:29 - Trial = 1921/30000 | Total reward = 47.05
2022-01-26 14:16:32.851 | DEBUG    | __main__:trials:24 - Trial = 1922/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.853 | DEBUG    | __main__:trials:29 - Trial = 1922/30000 | Total reward = 49.64
2022-01-26 14:16:32.856 | DEBUG    | __main__:trials:26 - Trial = 1923/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.857 | DEBUG    | __main__:trials:29 - Trial = 1923/30000 | Total reward = 33.42
2022-01-26 14:16:32.860 | DEBUG    | __main__:trials:24 - Trial = 1924/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.862 | DEBUG    | __main__:trials:29 - Trial = 1924/30000 | Total reward = 49.91
2022-01-26 14:16:32.866 | DEBUG    | __main__:trials:24 - Trial = 1925/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.867 | DEBUG    | __main__:trials:29 - Trial = 1925/30000 | Total reward = 50.31
2022-01-26 14:16:32.871 | DEBUG    | __main__:trials:24 - Trial = 1926/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.872 | DEBUG    | __main__:trials:29 - Trial = 1926/30000 | Total reward = 48.20
2022-01-26 14:16:32.876 | DEBUG    | __main__:trials:26 - Trial = 1927/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:32.877 | DEBUG    | __main__:trials:29 - Trial = 1927/30000 | Total reward = 26.95
2022-01-26 14:16:32.881 | DEBUG    | __main__:trials:24 - Trial = 1928/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.882 | DEBUG    | __main__:trials:29 - Trial = 1928/30000 | Total reward = 52.21
2022-01-26 14:16:32.886 | DEBUG    | __main__:trials:24 - Trial = 1929/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.887 | DEBUG    | __main__:trials:29 - Trial = 1929/30000 | Total reward = 47.52
2022-01-26 14:16:32.892 | DEBUG    | __main__:trials:24 - Trial = 1930/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.893 | DEBUG    | __main__:trials:29 - Trial = 1930/30000 | Total reward = 44.30
2022-01-26 14:16:32.896 | DEBUG    | __main__:trials:24 - Trial = 1931/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.898 | DEBUG    | __main__:trials:29 - Trial = 1931/30000 | Total reward = 51.63
2022-01-26 14:16:32.902 | DEBUG    | __main__:trials:24 - Trial = 1932/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.904 | DEBUG    | __main__:trials:29 - Trial = 1932/30000 | Total reward = 44.11
2022-01-26 14:16:32.907 | DEBUG    | __main__:trials:24 - Trial = 1933/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.908 | DEBUG    | __main__:trials:29 - Trial = 1933/30000 | Total reward = 43.39
2022-01-26 14:16:32.912 | DEBUG    | __main__:trials:24 - Trial = 1934/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.913 | DEBUG    | __main__:trials:29 - Trial = 1934/30000 | Total reward = 53.67
2022-01-26 14:16:32.916 | DEBUG    | __main__:trials:24 - Trial = 1935/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.918 | DEBUG    | __main__:trials:29 - Trial = 1935/30000 | Total reward = 50.40
2022-01-26 14:16:32.921 | DEBUG    | __main__:trials:24 - Trial = 1936/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.922 | DEBUG    | __main__:trials:29 - Trial = 1936/30000 | Total reward = 43.14
2022-01-26 14:16:32.925 | DEBUG    | __main__:trials:24 - Trial = 1937/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.927 | DEBUG    | __main__:trials:29 - Trial = 1937/30000 | Total reward = 46.82
2022-01-26 14:16:32.930 | DEBUG    | __main__:trials:24 - Trial = 1938/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.932 | DEBUG    | __main__:trials:29 - Trial = 1938/30000 | Total reward = 50.28
2022-01-26 14:16:32.935 | DEBUG    | __main__:trials:24 - Trial = 1939/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.937 | DEBUG    | __main__:trials:29 - Trial = 1939/30000 | Total reward = 52.37
2022-01-26 14:16:32.940 | DEBUG    | __main__:trials:24 - Trial = 1940/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.941 | DEBUG    | __main__:trials:29 - Trial = 1940/30000 | Total reward = 44.11
2022-01-26 14:16:32.945 | DEBUG    | __main__:trials:24 - Trial = 1941/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.946 | DEBUG    | __main__:trials:29 - Trial = 1941/30000 | Total reward = 43.57
2022-01-26 14:16:32.950 | DEBUG    | __main__:trials:24 - Trial = 1942/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.951 | DEBUG    | __main__:trials:29 - Trial = 1942/30000 | Total reward = 43.63
2022-01-26 14:16:32.955 | DEBUG    | __main__:trials:24 - Trial = 1943/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.957 | DEBUG    | __main__:trials:29 - Trial = 1943/30000 | Total reward = 32.90
2022-01-26 14:16:32.961 | DEBUG    | __main__:trials:24 - Trial = 1944/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.963 | DEBUG    | __main__:trials:29 - Trial = 1944/30000 | Total reward = 41.89
2022-01-26 14:16:32.967 | DEBUG    | __main__:trials:24 - Trial = 1945/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.968 | DEBUG    | __main__:trials:29 - Trial = 1945/30000 | Total reward = 52.58
2022-01-26 14:16:32.972 | DEBUG    | __main__:trials:24 - Trial = 1946/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.974 | DEBUG    | __main__:trials:29 - Trial = 1946/30000 | Total reward = 32.53
2022-01-26 14:16:32.977 | DEBUG    | __main__:trials:24 - Trial = 1947/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.979 | DEBUG    | __main__:trials:29 - Trial = 1947/30000 | Total reward = 52.46
2022-01-26 14:16:32.982 | DEBUG    | __main__:trials:24 - Trial = 1948/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.984 | DEBUG    | __main__:trials:29 - Trial = 1948/30000 | Total reward = 48.50
2022-01-26 14:16:32.987 | DEBUG    | __main__:trials:24 - Trial = 1949/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.988 | DEBUG    | __main__:trials:29 - Trial = 1949/30000 | Total reward = 23.83
2022-01-26 14:16:32.992 | DEBUG    | __main__:trials:24 - Trial = 1950/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.993 | DEBUG    | __main__:trials:29 - Trial = 1950/30000 | Total reward = 39.99
2022-01-26 14:16:32.998 | DEBUG    | __main__:trials:24 - Trial = 1951/30000 | Max number of steps (20) reached
2022-01-26 14:16:32.999 | DEBUG    | __main__:trials:29 - Trial = 1951/30000 | Total reward = 45.97
2022-01-26 14:16:33.003 | DEBUG    | __main__:trials:24 - Trial = 1952/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.004 | DEBUG    | __main__:trials:29 - Trial = 1952/30000 | Total reward = 52.58
2022-01-26 14:16:33.008 | DEBUG    | __main__:trials:24 - Trial = 1953/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.009 | DEBUG    | __main__:trials:29 - Trial = 1953/30000 | Total reward = 48.74
2022-01-26 14:16:33.014 | DEBUG    | __main__:trials:24 - Trial = 1954/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.015 | DEBUG    | __main__:trials:29 - Trial = 1954/30000 | Total reward = 51.55
2022-01-26 14:16:33.019 | DEBUG    | __main__:trials:24 - Trial = 1955/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.021 | DEBUG    | __main__:trials:29 - Trial = 1955/30000 | Total reward = 48.74
2022-01-26 14:16:33.024 | DEBUG    | __main__:trials:24 - Trial = 1956/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.026 | DEBUG    | __main__:trials:29 - Trial = 1956/30000 | Total reward = 51.73
2022-01-26 14:16:33.030 | DEBUG    | __main__:trials:24 - Trial = 1957/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.031 | DEBUG    | __main__:trials:29 - Trial = 1957/30000 | Total reward = 31.97
2022-01-26 14:16:33.035 | DEBUG    | __main__:trials:24 - Trial = 1958/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.036 | DEBUG    | __main__:trials:29 - Trial = 1958/30000 | Total reward = 29.97
2022-01-26 14:16:33.040 | DEBUG    | __main__:trials:24 - Trial = 1959/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.041 | DEBUG    | __main__:trials:29 - Trial = 1959/30000 | Total reward = 59.30
2022-01-26 14:16:33.045 | DEBUG    | __main__:trials:24 - Trial = 1960/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.047 | DEBUG    | __main__:trials:29 - Trial = 1960/30000 | Total reward = 38.37
2022-01-26 14:16:33.051 | DEBUG    | __main__:trials:24 - Trial = 1961/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.051 | DEBUG    | __main__:trials:29 - Trial = 1961/30000 | Total reward = 39.26
2022-01-26 14:16:33.055 | DEBUG    | __main__:trials:24 - Trial = 1962/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.057 | DEBUG    | __main__:trials:29 - Trial = 1962/30000 | Total reward = 54.32
2022-01-26 14:16:33.060 | DEBUG    | __main__:trials:24 - Trial = 1963/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.061 | DEBUG    | __main__:trials:29 - Trial = 1963/30000 | Total reward = 52.52
2022-01-26 14:16:33.065 | DEBUG    | __main__:trials:24 - Trial = 1964/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.066 | DEBUG    | __main__:trials:29 - Trial = 1964/30000 | Total reward = 51.31
2022-01-26 14:16:33.070 | DEBUG    | __main__:trials:24 - Trial = 1965/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.071 | DEBUG    | __main__:trials:29 - Trial = 1965/30000 | Total reward = 48.17
2022-01-26 14:16:33.075 | DEBUG    | __main__:trials:24 - Trial = 1966/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.077 | DEBUG    | __main__:trials:29 - Trial = 1966/30000 | Total reward = 51.98
2022-01-26 14:16:33.080 | DEBUG    | __main__:trials:24 - Trial = 1967/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.081 | DEBUG    | __main__:trials:29 - Trial = 1967/30000 | Total reward = 55.66
2022-01-26 14:16:33.086 | DEBUG    | __main__:trials:24 - Trial = 1968/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.086 | DEBUG    | __main__:trials:29 - Trial = 1968/30000 | Total reward = 54.65
2022-01-26 14:16:33.090 | DEBUG    | __main__:trials:24 - Trial = 1969/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.092 | DEBUG    | __main__:trials:29 - Trial = 1969/30000 | Total reward = 62.57
2022-01-26 14:16:33.096 | DEBUG    | __main__:trials:24 - Trial = 1970/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.097 | DEBUG    | __main__:trials:29 - Trial = 1970/30000 | Total reward = 51.32
2022-01-26 14:16:33.101 | DEBUG    | __main__:trials:24 - Trial = 1971/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.102 | DEBUG    | __main__:trials:29 - Trial = 1971/30000 | Total reward = 57.14
2022-01-26 14:16:33.105 | DEBUG    | __main__:trials:24 - Trial = 1972/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.106 | DEBUG    | __main__:trials:29 - Trial = 1972/30000 | Total reward = 52.83
2022-01-26 14:16:33.109 | DEBUG    | __main__:trials:24 - Trial = 1973/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.110 | DEBUG    | __main__:trials:29 - Trial = 1973/30000 | Total reward = 40.47
2022-01-26 14:16:33.113 | DEBUG    | __main__:trials:24 - Trial = 1974/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.115 | DEBUG    | __main__:trials:29 - Trial = 1974/30000 | Total reward = 47.78
2022-01-26 14:16:33.118 | DEBUG    | __main__:trials:24 - Trial = 1975/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.119 | DEBUG    | __main__:trials:29 - Trial = 1975/30000 | Total reward = 48.10
2022-01-26 14:16:33.124 | DEBUG    | __main__:trials:24 - Trial = 1976/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.125 | DEBUG    | __main__:trials:29 - Trial = 1976/30000 | Total reward = 54.07
2022-01-26 14:16:33.128 | DEBUG    | __main__:trials:24 - Trial = 1977/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.130 | DEBUG    | __main__:trials:29 - Trial = 1977/30000 | Total reward = 45.19
2022-01-26 14:16:33.134 | DEBUG    | __main__:trials:24 - Trial = 1978/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.136 | DEBUG    | __main__:trials:29 - Trial = 1978/30000 | Total reward = 40.82
2022-01-26 14:16:33.138 | DEBUG    | __main__:trials:24 - Trial = 1979/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.139 | DEBUG    | __main__:trials:29 - Trial = 1979/30000 | Total reward = 48.62
2022-01-26 14:16:33.143 | DEBUG    | __main__:trials:24 - Trial = 1980/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.144 | DEBUG    | __main__:trials:29 - Trial = 1980/30000 | Total reward = 51.66
2022-01-26 14:16:33.148 | DEBUG    | __main__:trials:24 - Trial = 1981/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.149 | DEBUG    | __main__:trials:29 - Trial = 1981/30000 | Total reward = 55.20
2022-01-26 14:16:33.153 | DEBUG    | __main__:trials:24 - Trial = 1982/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.154 | DEBUG    | __main__:trials:29 - Trial = 1982/30000 | Total reward = 53.44
2022-01-26 14:16:33.158 | DEBUG    | __main__:trials:24 - Trial = 1983/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.160 | DEBUG    | __main__:trials:29 - Trial = 1983/30000 | Total reward = 32.47
2022-01-26 14:16:33.164 | DEBUG    | __main__:trials:24 - Trial = 1984/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.165 | DEBUG    | __main__:trials:29 - Trial = 1984/30000 | Total reward = 52.35
2022-01-26 14:16:33.169 | DEBUG    | __main__:trials:24 - Trial = 1985/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.171 | DEBUG    | __main__:trials:29 - Trial = 1985/30000 | Total reward = 27.97
2022-01-26 14:16:33.174 | DEBUG    | __main__:trials:24 - Trial = 1986/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.176 | DEBUG    | __main__:trials:29 - Trial = 1986/30000 | Total reward = 48.95
2022-01-26 14:16:33.179 | DEBUG    | __main__:trials:24 - Trial = 1987/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.181 | DEBUG    | __main__:trials:29 - Trial = 1987/30000 | Total reward = 44.25
2022-01-26 14:16:33.184 | DEBUG    | __main__:trials:24 - Trial = 1988/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.185 | DEBUG    | __main__:trials:29 - Trial = 1988/30000 | Total reward = 55.69
2022-01-26 14:16:33.188 | DEBUG    | __main__:trials:24 - Trial = 1989/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.190 | DEBUG    | __main__:trials:29 - Trial = 1989/30000 | Total reward = 51.23
2022-01-26 14:16:33.193 | DEBUG    | __main__:trials:24 - Trial = 1990/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.194 | DEBUG    | __main__:trials:29 - Trial = 1990/30000 | Total reward = 49.91
2022-01-26 14:16:33.197 | DEBUG    | __main__:trials:24 - Trial = 1991/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.198 | DEBUG    | __main__:trials:29 - Trial = 1991/30000 | Total reward = 54.35
2022-01-26 14:16:33.201 | DEBUG    | __main__:trials:24 - Trial = 1992/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.203 | DEBUG    | __main__:trials:29 - Trial = 1992/30000 | Total reward = 49.87
2022-01-26 14:16:33.207 | DEBUG    | __main__:trials:24 - Trial = 1993/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.208 | DEBUG    | __main__:trials:29 - Trial = 1993/30000 | Total reward = 52.58
2022-01-26 14:16:33.212 | DEBUG    | __main__:trials:24 - Trial = 1994/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.214 | DEBUG    | __main__:trials:29 - Trial = 1994/30000 | Total reward = 62.02
2022-01-26 14:16:33.217 | DEBUG    | __main__:trials:24 - Trial = 1995/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.219 | DEBUG    | __main__:trials:29 - Trial = 1995/30000 | Total reward = 48.74
2022-01-26 14:16:33.223 | DEBUG    | __main__:trials:24 - Trial = 1996/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.224 | DEBUG    | __main__:trials:29 - Trial = 1996/30000 | Total reward = 29.96
2022-01-26 14:16:33.227 | DEBUG    | __main__:trials:24 - Trial = 1997/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.229 | DEBUG    | __main__:trials:29 - Trial = 1997/30000 | Total reward = 51.26
2022-01-26 14:16:33.233 | DEBUG    | __main__:trials:24 - Trial = 1998/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.234 | DEBUG    | __main__:trials:29 - Trial = 1998/30000 | Total reward = 54.88
2022-01-26 14:16:33.238 | DEBUG    | __main__:trials:24 - Trial = 1999/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.240 | DEBUG    | __main__:trials:29 - Trial = 1999/30000 | Total reward = 30.06
2022-01-26 14:16:33.242 | DEBUG    | __main__:trials:26 - Trial = 2000/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.244 | DEBUG    | __main__:trials:29 - Trial = 2000/30000 | Total reward = 30.88
2022-01-26 14:16:33.248 | DEBUG    | __main__:trials:24 - Trial = 2001/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.250 | DEBUG    | __main__:trials:29 - Trial = 2001/30000 | Total reward = 49.08
2022-01-26 14:16:33.252 | DEBUG    | __main__:trials:26 - Trial = 2002/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.254 | DEBUG    | __main__:trials:29 - Trial = 2002/30000 | Total reward = 20.12
2022-01-26 14:16:33.257 | DEBUG    | __main__:trials:26 - Trial = 2003/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.259 | DEBUG    | __main__:trials:29 - Trial = 2003/30000 | Total reward = 33.53
2022-01-26 14:16:33.263 | DEBUG    | __main__:trials:24 - Trial = 2004/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.264 | DEBUG    | __main__:trials:29 - Trial = 2004/30000 | Total reward = 32.89
2022-01-26 14:16:33.267 | DEBUG    | __main__:trials:24 - Trial = 2005/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.269 | DEBUG    | __main__:trials:29 - Trial = 2005/30000 | Total reward = 50.95
2022-01-26 14:16:33.272 | DEBUG    | __main__:trials:24 - Trial = 2006/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.274 | DEBUG    | __main__:trials:29 - Trial = 2006/30000 | Total reward = 45.26
2022-01-26 14:16:33.277 | DEBUG    | __main__:trials:24 - Trial = 2007/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.279 | DEBUG    | __main__:trials:29 - Trial = 2007/30000 | Total reward = 48.36
2022-01-26 14:16:33.282 | DEBUG    | __main__:trials:24 - Trial = 2008/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.284 | DEBUG    | __main__:trials:29 - Trial = 2008/30000 | Total reward = 50.58
2022-01-26 14:16:33.287 | DEBUG    | __main__:trials:24 - Trial = 2009/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.289 | DEBUG    | __main__:trials:29 - Trial = 2009/30000 | Total reward = 36.07
2022-01-26 14:16:33.291 | DEBUG    | __main__:trials:26 - Trial = 2010/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.293 | DEBUG    | __main__:trials:29 - Trial = 2010/30000 | Total reward = 28.57
2022-01-26 14:16:33.296 | DEBUG    | __main__:trials:24 - Trial = 2011/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.297 | DEBUG    | __main__:trials:29 - Trial = 2011/30000 | Total reward = 62.80
2022-01-26 14:16:33.301 | DEBUG    | __main__:trials:24 - Trial = 2012/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.301 | DEBUG    | __main__:trials:29 - Trial = 2012/30000 | Total reward = 51.39
2022-01-26 14:16:33.306 | DEBUG    | __main__:trials:24 - Trial = 2013/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.308 | DEBUG    | __main__:trials:29 - Trial = 2013/30000 | Total reward = 49.97
2022-01-26 14:16:33.311 | DEBUG    | __main__:trials:26 - Trial = 2014/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.313 | DEBUG    | __main__:trials:29 - Trial = 2014/30000 | Total reward = 32.87
2022-01-26 14:16:33.316 | DEBUG    | __main__:trials:24 - Trial = 2015/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.317 | DEBUG    | __main__:trials:29 - Trial = 2015/30000 | Total reward = 51.65
2022-01-26 14:16:33.320 | DEBUG    | __main__:trials:24 - Trial = 2016/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.322 | DEBUG    | __main__:trials:29 - Trial = 2016/30000 | Total reward = 37.28
2022-01-26 14:16:33.326 | DEBUG    | __main__:trials:24 - Trial = 2017/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.327 | DEBUG    | __main__:trials:29 - Trial = 2017/30000 | Total reward = 44.29
2022-01-26 14:16:33.331 | DEBUG    | __main__:trials:24 - Trial = 2018/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.333 | DEBUG    | __main__:trials:29 - Trial = 2018/30000 | Total reward = 44.14
2022-01-26 14:16:33.336 | DEBUG    | __main__:trials:24 - Trial = 2019/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.338 | DEBUG    | __main__:trials:29 - Trial = 2019/30000 | Total reward = 56.29
2022-01-26 14:16:33.341 | DEBUG    | __main__:trials:24 - Trial = 2020/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.343 | DEBUG    | __main__:trials:29 - Trial = 2020/30000 | Total reward = 52.27
2022-01-26 14:16:33.347 | DEBUG    | __main__:trials:24 - Trial = 2021/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.348 | DEBUG    | __main__:trials:29 - Trial = 2021/30000 | Total reward = 48.61
2022-01-26 14:16:33.352 | DEBUG    | __main__:trials:24 - Trial = 2022/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.353 | DEBUG    | __main__:trials:29 - Trial = 2022/30000 | Total reward = 50.60
2022-01-26 14:16:33.357 | DEBUG    | __main__:trials:24 - Trial = 2023/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.357 | DEBUG    | __main__:trials:29 - Trial = 2023/30000 | Total reward = 42.57
2022-01-26 14:16:33.361 | DEBUG    | __main__:trials:24 - Trial = 2024/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.362 | DEBUG    | __main__:trials:29 - Trial = 2024/30000 | Total reward = 32.95
2022-01-26 14:16:33.366 | DEBUG    | __main__:trials:24 - Trial = 2025/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.367 | DEBUG    | __main__:trials:29 - Trial = 2025/30000 | Total reward = 48.96
2022-01-26 14:16:33.370 | DEBUG    | __main__:trials:24 - Trial = 2026/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.372 | DEBUG    | __main__:trials:29 - Trial = 2026/30000 | Total reward = 44.83
2022-01-26 14:16:33.376 | DEBUG    | __main__:trials:24 - Trial = 2027/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.377 | DEBUG    | __main__:trials:29 - Trial = 2027/30000 | Total reward = 51.10
2022-01-26 14:16:33.381 | DEBUG    | __main__:trials:26 - Trial = 2028/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.382 | DEBUG    | __main__:trials:29 - Trial = 2028/30000 | Total reward = 29.69
2022-01-26 14:16:33.385 | DEBUG    | __main__:trials:24 - Trial = 2029/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.387 | DEBUG    | __main__:trials:29 - Trial = 2029/30000 | Total reward = 43.39
2022-01-26 14:16:33.391 | DEBUG    | __main__:trials:24 - Trial = 2030/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.391 | DEBUG    | __main__:trials:29 - Trial = 2030/30000 | Total reward = 48.74
2022-01-26 14:16:33.396 | DEBUG    | __main__:trials:24 - Trial = 2031/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.398 | DEBUG    | __main__:trials:29 - Trial = 2031/30000 | Total reward = 47.77
2022-01-26 14:16:33.401 | DEBUG    | __main__:trials:24 - Trial = 2032/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.402 | DEBUG    | __main__:trials:29 - Trial = 2032/30000 | Total reward = 42.46
2022-01-26 14:16:33.406 | DEBUG    | __main__:trials:24 - Trial = 2033/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.407 | DEBUG    | __main__:trials:29 - Trial = 2033/30000 | Total reward = 51.36
2022-01-26 14:16:33.411 | DEBUG    | __main__:trials:24 - Trial = 2034/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.413 | DEBUG    | __main__:trials:29 - Trial = 2034/30000 | Total reward = 52.07
2022-01-26 14:16:33.417 | DEBUG    | __main__:trials:24 - Trial = 2035/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.418 | DEBUG    | __main__:trials:29 - Trial = 2035/30000 | Total reward = 52.94
2022-01-26 14:16:33.422 | DEBUG    | __main__:trials:24 - Trial = 2036/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.424 | DEBUG    | __main__:trials:29 - Trial = 2036/30000 | Total reward = 50.26
2022-01-26 14:16:33.427 | DEBUG    | __main__:trials:24 - Trial = 2037/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.429 | DEBUG    | __main__:trials:29 - Trial = 2037/30000 | Total reward = 53.02
2022-01-26 14:16:33.432 | DEBUG    | __main__:trials:24 - Trial = 2038/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.433 | DEBUG    | __main__:trials:29 - Trial = 2038/30000 | Total reward = 62.15
2022-01-26 14:16:33.437 | DEBUG    | __main__:trials:24 - Trial = 2039/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.438 | DEBUG    | __main__:trials:29 - Trial = 2039/30000 | Total reward = 55.33
2022-01-26 14:16:33.443 | DEBUG    | __main__:trials:24 - Trial = 2040/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.443 | DEBUG    | __main__:trials:29 - Trial = 2040/30000 | Total reward = 46.05
2022-01-26 14:16:33.448 | DEBUG    | __main__:trials:24 - Trial = 2041/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.449 | DEBUG    | __main__:trials:29 - Trial = 2041/30000 | Total reward = 53.95
2022-01-26 14:16:33.453 | DEBUG    | __main__:trials:24 - Trial = 2042/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.453 | DEBUG    | __main__:trials:29 - Trial = 2042/30000 | Total reward = 53.17
2022-01-26 14:16:33.457 | DEBUG    | __main__:trials:24 - Trial = 2043/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.459 | DEBUG    | __main__:trials:29 - Trial = 2043/30000 | Total reward = 62.80
2022-01-26 14:16:33.462 | DEBUG    | __main__:trials:24 - Trial = 2044/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.464 | DEBUG    | __main__:trials:29 - Trial = 2044/30000 | Total reward = 60.09
2022-01-26 14:16:33.467 | DEBUG    | __main__:trials:26 - Trial = 2045/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.468 | DEBUG    | __main__:trials:29 - Trial = 2045/30000 | Total reward = 40.24
2022-01-26 14:16:33.472 | DEBUG    | __main__:trials:24 - Trial = 2046/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.474 | DEBUG    | __main__:trials:29 - Trial = 2046/30000 | Total reward = 47.74
2022-01-26 14:16:33.478 | DEBUG    | __main__:trials:24 - Trial = 2047/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.479 | DEBUG    | __main__:trials:29 - Trial = 2047/30000 | Total reward = 53.25
2022-01-26 14:16:33.483 | DEBUG    | __main__:trials:24 - Trial = 2048/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.484 | DEBUG    | __main__:trials:29 - Trial = 2048/30000 | Total reward = 51.20
2022-01-26 14:16:33.488 | DEBUG    | __main__:trials:24 - Trial = 2049/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.489 | DEBUG    | __main__:trials:29 - Trial = 2049/30000 | Total reward = 59.86
2022-01-26 14:16:33.493 | DEBUG    | __main__:trials:24 - Trial = 2050/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.495 | DEBUG    | __main__:trials:29 - Trial = 2050/30000 | Total reward = 42.18
2022-01-26 14:16:33.499 | DEBUG    | __main__:trials:24 - Trial = 2051/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.499 | DEBUG    | __main__:trials:29 - Trial = 2051/30000 | Total reward = 50.18
2022-01-26 14:16:33.504 | DEBUG    | __main__:trials:24 - Trial = 2052/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.505 | DEBUG    | __main__:trials:29 - Trial = 2052/30000 | Total reward = 51.68
2022-01-26 14:16:33.508 | DEBUG    | __main__:trials:24 - Trial = 2053/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.510 | DEBUG    | __main__:trials:29 - Trial = 2053/30000 | Total reward = 53.69
2022-01-26 14:16:33.514 | DEBUG    | __main__:trials:24 - Trial = 2054/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.515 | DEBUG    | __main__:trials:29 - Trial = 2054/30000 | Total reward = 53.58
2022-01-26 14:16:33.518 | DEBUG    | __main__:trials:24 - Trial = 2055/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.520 | DEBUG    | __main__:trials:29 - Trial = 2055/30000 | Total reward = 36.93
2022-01-26 14:16:33.523 | DEBUG    | __main__:trials:24 - Trial = 2056/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.525 | DEBUG    | __main__:trials:29 - Trial = 2056/30000 | Total reward = 50.05
2022-01-26 14:16:33.528 | DEBUG    | __main__:trials:24 - Trial = 2057/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.529 | DEBUG    | __main__:trials:29 - Trial = 2057/30000 | Total reward = 43.59
2022-01-26 14:16:33.533 | DEBUG    | __main__:trials:24 - Trial = 2058/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.535 | DEBUG    | __main__:trials:29 - Trial = 2058/30000 | Total reward = 47.71
2022-01-26 14:16:33.539 | DEBUG    | __main__:trials:24 - Trial = 2059/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.540 | DEBUG    | __main__:trials:29 - Trial = 2059/30000 | Total reward = 47.70
2022-01-26 14:16:33.544 | DEBUG    | __main__:trials:24 - Trial = 2060/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.546 | DEBUG    | __main__:trials:29 - Trial = 2060/30000 | Total reward = 52.25
2022-01-26 14:16:33.550 | DEBUG    | __main__:trials:24 - Trial = 2061/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.552 | DEBUG    | __main__:trials:29 - Trial = 2061/30000 | Total reward = 51.78
2022-01-26 14:16:33.556 | DEBUG    | __main__:trials:24 - Trial = 2062/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.557 | DEBUG    | __main__:trials:29 - Trial = 2062/30000 | Total reward = 49.67
2022-01-26 14:16:33.561 | DEBUG    | __main__:trials:24 - Trial = 2063/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.563 | DEBUG    | __main__:trials:29 - Trial = 2063/30000 | Total reward = 42.26
2022-01-26 14:16:33.566 | DEBUG    | __main__:trials:24 - Trial = 2064/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.567 | DEBUG    | __main__:trials:29 - Trial = 2064/30000 | Total reward = 48.15
2022-01-26 14:16:33.572 | DEBUG    | __main__:trials:24 - Trial = 2065/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.573 | DEBUG    | __main__:trials:29 - Trial = 2065/30000 | Total reward = 47.94
2022-01-26 14:16:33.577 | DEBUG    | __main__:trials:24 - Trial = 2066/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.578 | DEBUG    | __main__:trials:29 - Trial = 2066/30000 | Total reward = 48.12
2022-01-26 14:16:33.582 | DEBUG    | __main__:trials:24 - Trial = 2067/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.584 | DEBUG    | __main__:trials:29 - Trial = 2067/30000 | Total reward = 32.27
2022-01-26 14:16:33.588 | DEBUG    | __main__:trials:24 - Trial = 2068/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.588 | DEBUG    | __main__:trials:29 - Trial = 2068/30000 | Total reward = 31.97
2022-01-26 14:16:33.592 | DEBUG    | __main__:trials:24 - Trial = 2069/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.594 | DEBUG    | __main__:trials:29 - Trial = 2069/30000 | Total reward = 51.09
2022-01-26 14:16:33.598 | DEBUG    | __main__:trials:24 - Trial = 2070/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.599 | DEBUG    | __main__:trials:29 - Trial = 2070/30000 | Total reward = 36.27
2022-01-26 14:16:33.603 | DEBUG    | __main__:trials:24 - Trial = 2071/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.604 | DEBUG    | __main__:trials:29 - Trial = 2071/30000 | Total reward = 48.49
2022-01-26 14:16:33.608 | DEBUG    | __main__:trials:24 - Trial = 2072/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.610 | DEBUG    | __main__:trials:29 - Trial = 2072/30000 | Total reward = 51.11
2022-01-26 14:16:33.613 | DEBUG    | __main__:trials:24 - Trial = 2073/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.615 | DEBUG    | __main__:trials:29 - Trial = 2073/30000 | Total reward = 50.23
2022-01-26 14:16:33.619 | DEBUG    | __main__:trials:24 - Trial = 2074/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.620 | DEBUG    | __main__:trials:29 - Trial = 2074/30000 | Total reward = 49.67
2022-01-26 14:16:33.624 | DEBUG    | __main__:trials:24 - Trial = 2075/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.626 | DEBUG    | __main__:trials:29 - Trial = 2075/30000 | Total reward = 43.37
2022-01-26 14:16:33.629 | DEBUG    | __main__:trials:24 - Trial = 2076/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.631 | DEBUG    | __main__:trials:29 - Trial = 2076/30000 | Total reward = 50.58
2022-01-26 14:16:33.635 | DEBUG    | __main__:trials:24 - Trial = 2077/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.636 | DEBUG    | __main__:trials:29 - Trial = 2077/30000 | Total reward = 38.97
2022-01-26 14:16:33.640 | DEBUG    | __main__:trials:24 - Trial = 2078/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.641 | DEBUG    | __main__:trials:29 - Trial = 2078/30000 | Total reward = 36.27
2022-01-26 14:16:33.645 | DEBUG    | __main__:trials:24 - Trial = 2079/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.646 | DEBUG    | __main__:trials:29 - Trial = 2079/30000 | Total reward = 56.23
2022-01-26 14:16:33.649 | DEBUG    | __main__:trials:24 - Trial = 2080/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.650 | DEBUG    | __main__:trials:29 - Trial = 2080/30000 | Total reward = 47.42
2022-01-26 14:16:33.654 | DEBUG    | __main__:trials:24 - Trial = 2081/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.656 | DEBUG    | __main__:trials:29 - Trial = 2081/30000 | Total reward = 49.14
2022-01-26 14:16:33.659 | DEBUG    | __main__:trials:24 - Trial = 2082/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.661 | DEBUG    | __main__:trials:29 - Trial = 2082/30000 | Total reward = 46.75
2022-01-26 14:16:33.665 | DEBUG    | __main__:trials:24 - Trial = 2083/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.665 | DEBUG    | __main__:trials:29 - Trial = 2083/30000 | Total reward = 45.29
2022-01-26 14:16:33.669 | DEBUG    | __main__:trials:24 - Trial = 2084/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.670 | DEBUG    | __main__:trials:29 - Trial = 2084/30000 | Total reward = 43.85
2022-01-26 14:16:33.673 | DEBUG    | __main__:trials:24 - Trial = 2085/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.675 | DEBUG    | __main__:trials:29 - Trial = 2085/30000 | Total reward = 54.99
2022-01-26 14:16:33.678 | DEBUG    | __main__:trials:24 - Trial = 2086/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.679 | DEBUG    | __main__:trials:29 - Trial = 2086/30000 | Total reward = 43.22
2022-01-26 14:16:33.682 | DEBUG    | __main__:trials:24 - Trial = 2087/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.682 | DEBUG    | __main__:trials:29 - Trial = 2087/30000 | Total reward = 52.06
2022-01-26 14:16:33.687 | DEBUG    | __main__:trials:24 - Trial = 2088/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.688 | DEBUG    | __main__:trials:29 - Trial = 2088/30000 | Total reward = 55.86
2022-01-26 14:16:33.692 | DEBUG    | __main__:trials:24 - Trial = 2089/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.694 | DEBUG    | __main__:trials:29 - Trial = 2089/30000 | Total reward = 57.98
2022-01-26 14:16:33.697 | DEBUG    | __main__:trials:24 - Trial = 2090/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.699 | DEBUG    | __main__:trials:29 - Trial = 2090/30000 | Total reward = 43.38
2022-01-26 14:16:33.703 | DEBUG    | __main__:trials:24 - Trial = 2091/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.704 | DEBUG    | __main__:trials:29 - Trial = 2091/30000 | Total reward = 46.48
2022-01-26 14:16:33.708 | DEBUG    | __main__:trials:24 - Trial = 2092/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.709 | DEBUG    | __main__:trials:29 - Trial = 2092/30000 | Total reward = 43.60
2022-01-26 14:16:33.713 | DEBUG    | __main__:trials:24 - Trial = 2093/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.714 | DEBUG    | __main__:trials:29 - Trial = 2093/30000 | Total reward = 49.79
2022-01-26 14:16:33.718 | DEBUG    | __main__:trials:24 - Trial = 2094/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.719 | DEBUG    | __main__:trials:29 - Trial = 2094/30000 | Total reward = 41.99
2022-01-26 14:16:33.723 | DEBUG    | __main__:trials:24 - Trial = 2095/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.724 | DEBUG    | __main__:trials:29 - Trial = 2095/30000 | Total reward = 47.37
2022-01-26 14:16:33.728 | DEBUG    | __main__:trials:24 - Trial = 2096/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.729 | DEBUG    | __main__:trials:29 - Trial = 2096/30000 | Total reward = 48.93
2022-01-26 14:16:33.732 | DEBUG    | __main__:trials:24 - Trial = 2097/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.734 | DEBUG    | __main__:trials:29 - Trial = 2097/30000 | Total reward = 48.81
2022-01-26 14:16:33.736 | DEBUG    | __main__:trials:24 - Trial = 2098/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.737 | DEBUG    | __main__:trials:29 - Trial = 2098/30000 | Total reward = 58.72
2022-01-26 14:16:33.741 | DEBUG    | __main__:trials:24 - Trial = 2099/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.741 | DEBUG    | __main__:trials:29 - Trial = 2099/30000 | Total reward = 50.32
2022-01-26 14:16:33.746 | DEBUG    | __main__:trials:24 - Trial = 2100/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.746 | DEBUG    | __main__:trials:29 - Trial = 2100/30000 | Total reward = 67.13
2022-01-26 14:16:33.750 | DEBUG    | __main__:trials:24 - Trial = 2101/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.751 | DEBUG    | __main__:trials:29 - Trial = 2101/30000 | Total reward = 48.06
2022-01-26 14:16:33.755 | DEBUG    | __main__:trials:24 - Trial = 2102/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.757 | DEBUG    | __main__:trials:29 - Trial = 2102/30000 | Total reward = 48.68
2022-01-26 14:16:33.760 | DEBUG    | __main__:trials:24 - Trial = 2103/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.761 | DEBUG    | __main__:trials:29 - Trial = 2103/30000 | Total reward = 54.66
2022-01-26 14:16:33.766 | DEBUG    | __main__:trials:24 - Trial = 2104/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.767 | DEBUG    | __main__:trials:29 - Trial = 2104/30000 | Total reward = 34.43
2022-01-26 14:16:33.771 | DEBUG    | __main__:trials:26 - Trial = 2105/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.773 | DEBUG    | __main__:trials:29 - Trial = 2105/30000 | Total reward = 37.37
2022-01-26 14:16:33.776 | DEBUG    | __main__:trials:24 - Trial = 2106/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.777 | DEBUG    | __main__:trials:29 - Trial = 2106/30000 | Total reward = 48.47
2022-01-26 14:16:33.782 | DEBUG    | __main__:trials:24 - Trial = 2107/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.782 | DEBUG    | __main__:trials:29 - Trial = 2107/30000 | Total reward = 50.17
2022-01-26 14:16:33.786 | DEBUG    | __main__:trials:24 - Trial = 2108/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.787 | DEBUG    | __main__:trials:29 - Trial = 2108/30000 | Total reward = 52.66
2022-01-26 14:16:33.792 | DEBUG    | __main__:trials:24 - Trial = 2109/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.792 | DEBUG    | __main__:trials:29 - Trial = 2109/30000 | Total reward = 53.43
2022-01-26 14:16:33.796 | DEBUG    | __main__:trials:24 - Trial = 2110/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.798 | DEBUG    | __main__:trials:29 - Trial = 2110/30000 | Total reward = 48.87
2022-01-26 14:16:33.802 | DEBUG    | __main__:trials:24 - Trial = 2111/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.802 | DEBUG    | __main__:trials:29 - Trial = 2111/30000 | Total reward = 41.16
2022-01-26 14:16:33.807 | DEBUG    | __main__:trials:24 - Trial = 2112/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.808 | DEBUG    | __main__:trials:29 - Trial = 2112/30000 | Total reward = 44.68
2022-01-26 14:16:33.811 | DEBUG    | __main__:trials:24 - Trial = 2113/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.813 | DEBUG    | __main__:trials:29 - Trial = 2113/30000 | Total reward = 54.07
2022-01-26 14:16:33.816 | DEBUG    | __main__:trials:24 - Trial = 2114/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.818 | DEBUG    | __main__:trials:29 - Trial = 2114/30000 | Total reward = 31.64
2022-01-26 14:16:33.821 | DEBUG    | __main__:trials:24 - Trial = 2115/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.822 | DEBUG    | __main__:trials:29 - Trial = 2115/30000 | Total reward = 49.91
2022-01-26 14:16:33.825 | DEBUG    | __main__:trials:24 - Trial = 2116/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.826 | DEBUG    | __main__:trials:29 - Trial = 2116/30000 | Total reward = 40.34
2022-01-26 14:16:33.830 | DEBUG    | __main__:trials:24 - Trial = 2117/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.830 | DEBUG    | __main__:trials:29 - Trial = 2117/30000 | Total reward = 36.80
2022-01-26 14:16:33.835 | DEBUG    | __main__:trials:24 - Trial = 2118/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.835 | DEBUG    | __main__:trials:29 - Trial = 2118/30000 | Total reward = 47.42
2022-01-26 14:16:33.838 | DEBUG    | __main__:trials:26 - Trial = 2119/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:33.839 | DEBUG    | __main__:trials:29 - Trial = 2119/30000 | Total reward = 21.02
2022-01-26 14:16:33.844 | DEBUG    | __main__:trials:24 - Trial = 2120/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.844 | DEBUG    | __main__:trials:29 - Trial = 2120/30000 | Total reward = 44.70
2022-01-26 14:16:33.849 | DEBUG    | __main__:trials:24 - Trial = 2121/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.849 | DEBUG    | __main__:trials:29 - Trial = 2121/30000 | Total reward = 59.70
2022-01-26 14:16:33.854 | DEBUG    | __main__:trials:24 - Trial = 2122/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.855 | DEBUG    | __main__:trials:29 - Trial = 2122/30000 | Total reward = 40.96
2022-01-26 14:16:33.859 | DEBUG    | __main__:trials:24 - Trial = 2123/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.860 | DEBUG    | __main__:trials:29 - Trial = 2123/30000 | Total reward = 50.86
2022-01-26 14:16:33.864 | DEBUG    | __main__:trials:24 - Trial = 2124/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.866 | DEBUG    | __main__:trials:29 - Trial = 2124/30000 | Total reward = 54.83
2022-01-26 14:16:33.870 | DEBUG    | __main__:trials:24 - Trial = 2125/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.870 | DEBUG    | __main__:trials:29 - Trial = 2125/30000 | Total reward = 57.78
2022-01-26 14:16:33.875 | DEBUG    | __main__:trials:24 - Trial = 2126/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.877 | DEBUG    | __main__:trials:29 - Trial = 2126/30000 | Total reward = 46.00
2022-01-26 14:16:33.881 | DEBUG    | __main__:trials:24 - Trial = 2127/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.882 | DEBUG    | __main__:trials:29 - Trial = 2127/30000 | Total reward = 45.86
2022-01-26 14:16:33.886 | DEBUG    | __main__:trials:24 - Trial = 2128/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.887 | DEBUG    | __main__:trials:29 - Trial = 2128/30000 | Total reward = 51.11
2022-01-26 14:16:33.891 | DEBUG    | __main__:trials:24 - Trial = 2129/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.893 | DEBUG    | __main__:trials:29 - Trial = 2129/30000 | Total reward = 52.90
2022-01-26 14:16:33.896 | DEBUG    | __main__:trials:24 - Trial = 2130/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.897 | DEBUG    | __main__:trials:29 - Trial = 2130/30000 | Total reward = 48.50
2022-01-26 14:16:33.900 | DEBUG    | __main__:trials:24 - Trial = 2131/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.901 | DEBUG    | __main__:trials:29 - Trial = 2131/30000 | Total reward = 49.72
2022-01-26 14:16:33.905 | DEBUG    | __main__:trials:24 - Trial = 2132/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.906 | DEBUG    | __main__:trials:29 - Trial = 2132/30000 | Total reward = 33.22
2022-01-26 14:16:33.909 | DEBUG    | __main__:trials:24 - Trial = 2133/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.910 | DEBUG    | __main__:trials:29 - Trial = 2133/30000 | Total reward = 53.40
2022-01-26 14:16:33.913 | DEBUG    | __main__:trials:24 - Trial = 2134/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.915 | DEBUG    | __main__:trials:29 - Trial = 2134/30000 | Total reward = 45.67
2022-01-26 14:16:33.918 | DEBUG    | __main__:trials:24 - Trial = 2135/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.919 | DEBUG    | __main__:trials:29 - Trial = 2135/30000 | Total reward = 59.58
2022-01-26 14:16:33.923 | DEBUG    | __main__:trials:24 - Trial = 2136/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.924 | DEBUG    | __main__:trials:29 - Trial = 2136/30000 | Total reward = 56.59
2022-01-26 14:16:33.927 | DEBUG    | __main__:trials:24 - Trial = 2137/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.929 | DEBUG    | __main__:trials:29 - Trial = 2137/30000 | Total reward = 49.34
2022-01-26 14:16:33.933 | DEBUG    | __main__:trials:24 - Trial = 2138/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.935 | DEBUG    | __main__:trials:29 - Trial = 2138/30000 | Total reward = 45.58
2022-01-26 14:16:33.939 | DEBUG    | __main__:trials:24 - Trial = 2139/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.939 | DEBUG    | __main__:trials:29 - Trial = 2139/30000 | Total reward = 58.49
2022-01-26 14:16:33.944 | DEBUG    | __main__:trials:24 - Trial = 2140/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.946 | DEBUG    | __main__:trials:29 - Trial = 2140/30000 | Total reward = 52.01
2022-01-26 14:16:33.949 | DEBUG    | __main__:trials:24 - Trial = 2141/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.950 | DEBUG    | __main__:trials:29 - Trial = 2141/30000 | Total reward = 48.37
2022-01-26 14:16:33.953 | DEBUG    | __main__:trials:24 - Trial = 2142/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.954 | DEBUG    | __main__:trials:29 - Trial = 2142/30000 | Total reward = 55.93
2022-01-26 14:16:33.959 | DEBUG    | __main__:trials:24 - Trial = 2143/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.960 | DEBUG    | __main__:trials:29 - Trial = 2143/30000 | Total reward = 48.36
2022-01-26 14:16:33.964 | DEBUG    | __main__:trials:24 - Trial = 2144/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.965 | DEBUG    | __main__:trials:29 - Trial = 2144/30000 | Total reward = 34.83
2022-01-26 14:16:33.969 | DEBUG    | __main__:trials:24 - Trial = 2145/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.970 | DEBUG    | __main__:trials:29 - Trial = 2145/30000 | Total reward = 49.83
2022-01-26 14:16:33.974 | DEBUG    | __main__:trials:24 - Trial = 2146/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.975 | DEBUG    | __main__:trials:29 - Trial = 2146/30000 | Total reward = 50.73
2022-01-26 14:16:33.979 | DEBUG    | __main__:trials:24 - Trial = 2147/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.980 | DEBUG    | __main__:trials:29 - Trial = 2147/30000 | Total reward = 51.72
2022-01-26 14:16:33.984 | DEBUG    | __main__:trials:24 - Trial = 2148/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.986 | DEBUG    | __main__:trials:29 - Trial = 2148/30000 | Total reward = 49.17
2022-01-26 14:16:33.990 | DEBUG    | __main__:trials:24 - Trial = 2149/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.991 | DEBUG    | __main__:trials:29 - Trial = 2149/30000 | Total reward = 47.41
2022-01-26 14:16:33.995 | DEBUG    | __main__:trials:24 - Trial = 2150/30000 | Max number of steps (20) reached
2022-01-26 14:16:33.996 | DEBUG    | __main__:trials:29 - Trial = 2150/30000 | Total reward = 48.79
2022-01-26 14:16:34.000 | DEBUG    | __main__:trials:24 - Trial = 2151/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.002 | DEBUG    | __main__:trials:29 - Trial = 2151/30000 | Total reward = 54.25
2022-01-26 14:16:34.005 | DEBUG    | __main__:trials:24 - Trial = 2152/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.007 | DEBUG    | __main__:trials:29 - Trial = 2152/30000 | Total reward = 52.26
2022-01-26 14:16:34.010 | DEBUG    | __main__:trials:24 - Trial = 2153/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.012 | DEBUG    | __main__:trials:29 - Trial = 2153/30000 | Total reward = 48.14
2022-01-26 14:16:34.015 | DEBUG    | __main__:trials:24 - Trial = 2154/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.016 | DEBUG    | __main__:trials:29 - Trial = 2154/30000 | Total reward = 50.56
2022-01-26 14:16:34.019 | DEBUG    | __main__:trials:24 - Trial = 2155/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.021 | DEBUG    | __main__:trials:29 - Trial = 2155/30000 | Total reward = 52.35
2022-01-26 14:16:34.024 | DEBUG    | __main__:trials:24 - Trial = 2156/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.026 | DEBUG    | __main__:trials:29 - Trial = 2156/30000 | Total reward = 51.03
2022-01-26 14:16:34.030 | DEBUG    | __main__:trials:24 - Trial = 2157/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.031 | DEBUG    | __main__:trials:29 - Trial = 2157/30000 | Total reward = 28.37
2022-01-26 14:16:34.035 | DEBUG    | __main__:trials:24 - Trial = 2158/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.035 | DEBUG    | __main__:trials:29 - Trial = 2158/30000 | Total reward = 40.88
2022-01-26 14:16:34.040 | DEBUG    | __main__:trials:24 - Trial = 2159/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.041 | DEBUG    | __main__:trials:29 - Trial = 2159/30000 | Total reward = 52.35
2022-01-26 14:16:34.045 | DEBUG    | __main__:trials:24 - Trial = 2160/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.047 | DEBUG    | __main__:trials:29 - Trial = 2160/30000 | Total reward = 48.38
2022-01-26 14:16:34.050 | DEBUG    | __main__:trials:26 - Trial = 2161/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.051 | DEBUG    | __main__:trials:29 - Trial = 2161/30000 | Total reward = 23.23
2022-01-26 14:16:34.055 | DEBUG    | __main__:trials:24 - Trial = 2162/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.057 | DEBUG    | __main__:trials:29 - Trial = 2162/30000 | Total reward = 51.60
2022-01-26 14:16:34.060 | DEBUG    | __main__:trials:24 - Trial = 2163/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.061 | DEBUG    | __main__:trials:29 - Trial = 2163/30000 | Total reward = 52.86
2022-01-26 14:16:34.065 | DEBUG    | __main__:trials:24 - Trial = 2164/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.066 | DEBUG    | __main__:trials:29 - Trial = 2164/30000 | Total reward = 52.44
2022-01-26 14:16:34.070 | DEBUG    | __main__:trials:24 - Trial = 2165/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.071 | DEBUG    | __main__:trials:29 - Trial = 2165/30000 | Total reward = 48.62
2022-01-26 14:16:34.075 | DEBUG    | __main__:trials:24 - Trial = 2166/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.075 | DEBUG    | __main__:trials:29 - Trial = 2166/30000 | Total reward = 56.50
2022-01-26 14:16:34.079 | DEBUG    | __main__:trials:26 - Trial = 2167/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.081 | DEBUG    | __main__:trials:29 - Trial = 2167/30000 | Total reward = 26.30
2022-01-26 14:16:34.084 | DEBUG    | __main__:trials:24 - Trial = 2168/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.085 | DEBUG    | __main__:trials:29 - Trial = 2168/30000 | Total reward = 51.23
2022-01-26 14:16:34.090 | DEBUG    | __main__:trials:24 - Trial = 2169/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.091 | DEBUG    | __main__:trials:29 - Trial = 2169/30000 | Total reward = 56.60
2022-01-26 14:16:34.095 | DEBUG    | __main__:trials:24 - Trial = 2170/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.096 | DEBUG    | __main__:trials:29 - Trial = 2170/30000 | Total reward = 47.91
2022-01-26 14:16:34.099 | DEBUG    | __main__:trials:24 - Trial = 2171/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.101 | DEBUG    | __main__:trials:29 - Trial = 2171/30000 | Total reward = 51.79
2022-01-26 14:16:34.105 | DEBUG    | __main__:trials:24 - Trial = 2172/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.107 | DEBUG    | __main__:trials:29 - Trial = 2172/30000 | Total reward = 53.10
2022-01-26 14:16:34.110 | DEBUG    | __main__:trials:24 - Trial = 2173/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.111 | DEBUG    | __main__:trials:29 - Trial = 2173/30000 | Total reward = 52.93
2022-01-26 14:16:34.115 | DEBUG    | __main__:trials:24 - Trial = 2174/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.116 | DEBUG    | __main__:trials:29 - Trial = 2174/30000 | Total reward = 62.52
2022-01-26 14:16:34.120 | DEBUG    | __main__:trials:24 - Trial = 2175/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.121 | DEBUG    | __main__:trials:29 - Trial = 2175/30000 | Total reward = 55.90
2022-01-26 14:16:34.125 | DEBUG    | __main__:trials:24 - Trial = 2176/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.126 | DEBUG    | __main__:trials:29 - Trial = 2176/30000 | Total reward = 37.54
2022-01-26 14:16:34.130 | DEBUG    | __main__:trials:24 - Trial = 2177/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.131 | DEBUG    | __main__:trials:29 - Trial = 2177/30000 | Total reward = 49.47
2022-01-26 14:16:34.135 | DEBUG    | __main__:trials:24 - Trial = 2178/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.136 | DEBUG    | __main__:trials:29 - Trial = 2178/30000 | Total reward = 52.90
2022-01-26 14:16:34.140 | DEBUG    | __main__:trials:24 - Trial = 2179/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.141 | DEBUG    | __main__:trials:29 - Trial = 2179/30000 | Total reward = 52.35
2022-01-26 14:16:34.145 | DEBUG    | __main__:trials:24 - Trial = 2180/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.147 | DEBUG    | __main__:trials:29 - Trial = 2180/30000 | Total reward = 63.60
2022-01-26 14:16:34.150 | DEBUG    | __main__:trials:24 - Trial = 2181/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.152 | DEBUG    | __main__:trials:29 - Trial = 2181/30000 | Total reward = 56.03
2022-01-26 14:16:34.155 | DEBUG    | __main__:trials:24 - Trial = 2182/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.156 | DEBUG    | __main__:trials:29 - Trial = 2182/30000 | Total reward = 57.62
2022-01-26 14:16:34.160 | DEBUG    | __main__:trials:24 - Trial = 2183/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.162 | DEBUG    | __main__:trials:29 - Trial = 2183/30000 | Total reward = 46.68
2022-01-26 14:16:34.165 | DEBUG    | __main__:trials:24 - Trial = 2184/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.166 | DEBUG    | __main__:trials:29 - Trial = 2184/30000 | Total reward = 49.01
2022-01-26 14:16:34.171 | DEBUG    | __main__:trials:24 - Trial = 2185/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.172 | DEBUG    | __main__:trials:29 - Trial = 2185/30000 | Total reward = 56.53
2022-01-26 14:16:34.176 | DEBUG    | __main__:trials:24 - Trial = 2186/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.177 | DEBUG    | __main__:trials:29 - Trial = 2186/30000 | Total reward = 50.00
2022-01-26 14:16:34.180 | DEBUG    | __main__:trials:24 - Trial = 2187/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.182 | DEBUG    | __main__:trials:29 - Trial = 2187/30000 | Total reward = 49.51
2022-01-26 14:16:34.185 | DEBUG    | __main__:trials:24 - Trial = 2188/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.186 | DEBUG    | __main__:trials:29 - Trial = 2188/30000 | Total reward = 42.19
2022-01-26 14:16:34.189 | DEBUG    | __main__:trials:24 - Trial = 2189/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.191 | DEBUG    | __main__:trials:29 - Trial = 2189/30000 | Total reward = 50.87
2022-01-26 14:16:34.194 | DEBUG    | __main__:trials:24 - Trial = 2190/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.195 | DEBUG    | __main__:trials:29 - Trial = 2190/30000 | Total reward = 43.01
2022-01-26 14:16:34.198 | DEBUG    | __main__:trials:24 - Trial = 2191/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.200 | DEBUG    | __main__:trials:29 - Trial = 2191/30000 | Total reward = 53.19
2022-01-26 14:16:34.203 | DEBUG    | __main__:trials:24 - Trial = 2192/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.205 | DEBUG    | __main__:trials:29 - Trial = 2192/30000 | Total reward = 50.82
2022-01-26 14:16:34.209 | DEBUG    | __main__:trials:24 - Trial = 2193/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.210 | DEBUG    | __main__:trials:29 - Trial = 2193/30000 | Total reward = 45.51
2022-01-26 14:16:34.214 | DEBUG    | __main__:trials:24 - Trial = 2194/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.215 | DEBUG    | __main__:trials:29 - Trial = 2194/30000 | Total reward = 53.01
2022-01-26 14:16:34.220 | DEBUG    | __main__:trials:24 - Trial = 2195/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.220 | DEBUG    | __main__:trials:29 - Trial = 2195/30000 | Total reward = 44.94
2022-01-26 14:16:34.224 | DEBUG    | __main__:trials:24 - Trial = 2196/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.226 | DEBUG    | __main__:trials:29 - Trial = 2196/30000 | Total reward = 50.86
2022-01-26 14:16:34.230 | DEBUG    | __main__:trials:24 - Trial = 2197/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.231 | DEBUG    | __main__:trials:29 - Trial = 2197/30000 | Total reward = 50.69
2022-01-26 14:16:34.235 | DEBUG    | __main__:trials:24 - Trial = 2198/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.236 | DEBUG    | __main__:trials:29 - Trial = 2198/30000 | Total reward = 54.48
2022-01-26 14:16:34.239 | DEBUG    | __main__:trials:24 - Trial = 2199/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.242 | DEBUG    | __main__:trials:29 - Trial = 2199/30000 | Total reward = 36.18
2022-01-26 14:16:34.245 | DEBUG    | __main__:trials:24 - Trial = 2200/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.247 | DEBUG    | __main__:trials:29 - Trial = 2200/30000 | Total reward = 49.98
2022-01-26 14:16:34.250 | DEBUG    | __main__:trials:24 - Trial = 2201/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.252 | DEBUG    | __main__:trials:29 - Trial = 2201/30000 | Total reward = 48.34
2022-01-26 14:16:34.256 | DEBUG    | __main__:trials:24 - Trial = 2202/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.256 | DEBUG    | __main__:trials:29 - Trial = 2202/30000 | Total reward = 53.19
2022-01-26 14:16:34.260 | DEBUG    | __main__:trials:24 - Trial = 2203/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.261 | DEBUG    | __main__:trials:29 - Trial = 2203/30000 | Total reward = 58.15
2022-01-26 14:16:34.265 | DEBUG    | __main__:trials:24 - Trial = 2204/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.266 | DEBUG    | __main__:trials:29 - Trial = 2204/30000 | Total reward = 52.53
2022-01-26 14:16:34.270 | DEBUG    | __main__:trials:24 - Trial = 2205/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.271 | DEBUG    | __main__:trials:29 - Trial = 2205/30000 | Total reward = 49.86
2022-01-26 14:16:34.274 | DEBUG    | __main__:trials:24 - Trial = 2206/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.276 | DEBUG    | __main__:trials:29 - Trial = 2206/30000 | Total reward = 55.11
2022-01-26 14:16:34.280 | DEBUG    | __main__:trials:24 - Trial = 2207/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.281 | DEBUG    | __main__:trials:29 - Trial = 2207/30000 | Total reward = 50.58
2022-01-26 14:16:34.285 | DEBUG    | __main__:trials:24 - Trial = 2208/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.287 | DEBUG    | __main__:trials:29 - Trial = 2208/30000 | Total reward = 51.21
2022-01-26 14:16:34.290 | DEBUG    | __main__:trials:24 - Trial = 2209/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.292 | DEBUG    | __main__:trials:29 - Trial = 2209/30000 | Total reward = 50.69
2022-01-26 14:16:34.295 | DEBUG    | __main__:trials:24 - Trial = 2210/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.297 | DEBUG    | __main__:trials:29 - Trial = 2210/30000 | Total reward = 50.29
2022-01-26 14:16:34.300 | DEBUG    | __main__:trials:24 - Trial = 2211/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.302 | DEBUG    | __main__:trials:29 - Trial = 2211/30000 | Total reward = 52.70
2022-01-26 14:16:34.306 | DEBUG    | __main__:trials:24 - Trial = 2212/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.307 | DEBUG    | __main__:trials:29 - Trial = 2212/30000 | Total reward = 34.82
2022-01-26 14:16:34.311 | DEBUG    | __main__:trials:24 - Trial = 2213/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.313 | DEBUG    | __main__:trials:29 - Trial = 2213/30000 | Total reward = 56.65
2022-01-26 14:16:34.316 | DEBUG    | __main__:trials:24 - Trial = 2214/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.318 | DEBUG    | __main__:trials:29 - Trial = 2214/30000 | Total reward = 50.07
2022-01-26 14:16:34.322 | DEBUG    | __main__:trials:24 - Trial = 2215/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.323 | DEBUG    | __main__:trials:29 - Trial = 2215/30000 | Total reward = 57.07
2022-01-26 14:16:34.326 | DEBUG    | __main__:trials:24 - Trial = 2216/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.328 | DEBUG    | __main__:trials:29 - Trial = 2216/30000 | Total reward = 52.26
2022-01-26 14:16:34.332 | DEBUG    | __main__:trials:24 - Trial = 2217/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.334 | DEBUG    | __main__:trials:29 - Trial = 2217/30000 | Total reward = 58.01
2022-01-26 14:16:34.337 | DEBUG    | __main__:trials:24 - Trial = 2218/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.338 | DEBUG    | __main__:trials:29 - Trial = 2218/30000 | Total reward = 54.47
2022-01-26 14:16:34.343 | DEBUG    | __main__:trials:24 - Trial = 2219/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.344 | DEBUG    | __main__:trials:29 - Trial = 2219/30000 | Total reward = 51.06
2022-01-26 14:16:34.348 | DEBUG    | __main__:trials:24 - Trial = 2220/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.350 | DEBUG    | __main__:trials:29 - Trial = 2220/30000 | Total reward = 58.92
2022-01-26 14:16:34.353 | DEBUG    | __main__:trials:24 - Trial = 2221/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.354 | DEBUG    | __main__:trials:29 - Trial = 2221/30000 | Total reward = 48.46
2022-01-26 14:16:34.358 | DEBUG    | __main__:trials:24 - Trial = 2222/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.359 | DEBUG    | __main__:trials:29 - Trial = 2222/30000 | Total reward = 54.39
2022-01-26 14:16:34.363 | DEBUG    | __main__:trials:24 - Trial = 2223/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.364 | DEBUG    | __main__:trials:29 - Trial = 2223/30000 | Total reward = 55.60
2022-01-26 14:16:34.368 | DEBUG    | __main__:trials:24 - Trial = 2224/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.370 | DEBUG    | __main__:trials:29 - Trial = 2224/30000 | Total reward = 47.56
2022-01-26 14:16:34.374 | DEBUG    | __main__:trials:24 - Trial = 2225/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.374 | DEBUG    | __main__:trials:29 - Trial = 2225/30000 | Total reward = 58.02
2022-01-26 14:16:34.379 | DEBUG    | __main__:trials:24 - Trial = 2226/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.381 | DEBUG    | __main__:trials:29 - Trial = 2226/30000 | Total reward = 50.71
2022-01-26 14:16:34.384 | DEBUG    | __main__:trials:24 - Trial = 2227/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.386 | DEBUG    | __main__:trials:29 - Trial = 2227/30000 | Total reward = 41.23
2022-01-26 14:16:34.389 | DEBUG    | __main__:trials:26 - Trial = 2228/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.391 | DEBUG    | __main__:trials:29 - Trial = 2228/30000 | Total reward = 30.96
2022-01-26 14:16:34.394 | DEBUG    | __main__:trials:24 - Trial = 2229/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.396 | DEBUG    | __main__:trials:29 - Trial = 2229/30000 | Total reward = 50.53
2022-01-26 14:16:34.400 | DEBUG    | __main__:trials:24 - Trial = 2230/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.401 | DEBUG    | __main__:trials:29 - Trial = 2230/30000 | Total reward = 51.95
2022-01-26 14:16:34.404 | DEBUG    | __main__:trials:24 - Trial = 2231/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.406 | DEBUG    | __main__:trials:29 - Trial = 2231/30000 | Total reward = 47.32
2022-01-26 14:16:34.410 | DEBUG    | __main__:trials:24 - Trial = 2232/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.410 | DEBUG    | __main__:trials:29 - Trial = 2232/30000 | Total reward = 41.66
2022-01-26 14:16:34.414 | DEBUG    | __main__:trials:24 - Trial = 2233/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.416 | DEBUG    | __main__:trials:29 - Trial = 2233/30000 | Total reward = 46.18
2022-01-26 14:16:34.419 | DEBUG    | __main__:trials:24 - Trial = 2234/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.421 | DEBUG    | __main__:trials:29 - Trial = 2234/30000 | Total reward = 51.91
2022-01-26 14:16:34.424 | DEBUG    | __main__:trials:24 - Trial = 2235/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.426 | DEBUG    | __main__:trials:29 - Trial = 2235/30000 | Total reward = 55.87
2022-01-26 14:16:34.429 | DEBUG    | __main__:trials:24 - Trial = 2236/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.430 | DEBUG    | __main__:trials:29 - Trial = 2236/30000 | Total reward = 23.37
2022-01-26 14:16:34.434 | DEBUG    | __main__:trials:24 - Trial = 2237/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.435 | DEBUG    | __main__:trials:29 - Trial = 2237/30000 | Total reward = 56.46
2022-01-26 14:16:34.439 | DEBUG    | __main__:trials:24 - Trial = 2238/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.440 | DEBUG    | __main__:trials:29 - Trial = 2238/30000 | Total reward = 49.90
2022-01-26 14:16:34.444 | DEBUG    | __main__:trials:24 - Trial = 2239/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.444 | DEBUG    | __main__:trials:29 - Trial = 2239/30000 | Total reward = 49.71
2022-01-26 14:16:34.448 | DEBUG    | __main__:trials:24 - Trial = 2240/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.449 | DEBUG    | __main__:trials:29 - Trial = 2240/30000 | Total reward = 49.61
2022-01-26 14:16:34.453 | DEBUG    | __main__:trials:24 - Trial = 2241/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.454 | DEBUG    | __main__:trials:29 - Trial = 2241/30000 | Total reward = 53.72
2022-01-26 14:16:34.459 | DEBUG    | __main__:trials:24 - Trial = 2242/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.460 | DEBUG    | __main__:trials:29 - Trial = 2242/30000 | Total reward = 49.39
2022-01-26 14:16:34.464 | DEBUG    | __main__:trials:24 - Trial = 2243/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.466 | DEBUG    | __main__:trials:29 - Trial = 2243/30000 | Total reward = 49.13
2022-01-26 14:16:34.469 | DEBUG    | __main__:trials:24 - Trial = 2244/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.470 | DEBUG    | __main__:trials:29 - Trial = 2244/30000 | Total reward = 44.88
2022-01-26 14:16:34.474 | DEBUG    | __main__:trials:24 - Trial = 2245/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.475 | DEBUG    | __main__:trials:29 - Trial = 2245/30000 | Total reward = 51.63
2022-01-26 14:16:34.479 | DEBUG    | __main__:trials:24 - Trial = 2246/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.481 | DEBUG    | __main__:trials:29 - Trial = 2246/30000 | Total reward = 61.57
2022-01-26 14:16:34.485 | DEBUG    | __main__:trials:24 - Trial = 2247/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.486 | DEBUG    | __main__:trials:29 - Trial = 2247/30000 | Total reward = 44.38
2022-01-26 14:16:34.490 | DEBUG    | __main__:trials:24 - Trial = 2248/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.491 | DEBUG    | __main__:trials:29 - Trial = 2248/30000 | Total reward = 51.61
2022-01-26 14:16:34.494 | DEBUG    | __main__:trials:24 - Trial = 2249/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.496 | DEBUG    | __main__:trials:29 - Trial = 2249/30000 | Total reward = 49.81
2022-01-26 14:16:34.499 | DEBUG    | __main__:trials:24 - Trial = 2250/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.501 | DEBUG    | __main__:trials:29 - Trial = 2250/30000 | Total reward = 47.83
2022-01-26 14:16:34.504 | DEBUG    | __main__:trials:24 - Trial = 2251/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.506 | DEBUG    | __main__:trials:29 - Trial = 2251/30000 | Total reward = 44.30
2022-01-26 14:16:34.510 | DEBUG    | __main__:trials:24 - Trial = 2252/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.511 | DEBUG    | __main__:trials:29 - Trial = 2252/30000 | Total reward = 49.60
2022-01-26 14:16:34.515 | DEBUG    | __main__:trials:24 - Trial = 2253/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.516 | DEBUG    | __main__:trials:29 - Trial = 2253/30000 | Total reward = 53.07
2022-01-26 14:16:34.520 | DEBUG    | __main__:trials:24 - Trial = 2254/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.522 | DEBUG    | __main__:trials:29 - Trial = 2254/30000 | Total reward = 45.37
2022-01-26 14:16:34.526 | DEBUG    | __main__:trials:24 - Trial = 2255/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.527 | DEBUG    | __main__:trials:29 - Trial = 2255/30000 | Total reward = 35.77
2022-01-26 14:16:34.530 | DEBUG    | __main__:trials:24 - Trial = 2256/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.532 | DEBUG    | __main__:trials:29 - Trial = 2256/30000 | Total reward = 55.44
2022-01-26 14:16:34.536 | DEBUG    | __main__:trials:24 - Trial = 2257/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.537 | DEBUG    | __main__:trials:29 - Trial = 2257/30000 | Total reward = 48.46
2022-01-26 14:16:34.541 | DEBUG    | __main__:trials:24 - Trial = 2258/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.542 | DEBUG    | __main__:trials:29 - Trial = 2258/30000 | Total reward = 51.39
2022-01-26 14:16:34.546 | DEBUG    | __main__:trials:24 - Trial = 2259/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.547 | DEBUG    | __main__:trials:29 - Trial = 2259/30000 | Total reward = 30.17
2022-01-26 14:16:34.551 | DEBUG    | __main__:trials:24 - Trial = 2260/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.553 | DEBUG    | __main__:trials:29 - Trial = 2260/30000 | Total reward = 49.35
2022-01-26 14:16:34.556 | DEBUG    | __main__:trials:24 - Trial = 2261/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.557 | DEBUG    | __main__:trials:29 - Trial = 2261/30000 | Total reward = 47.58
2022-01-26 14:16:34.561 | DEBUG    | __main__:trials:26 - Trial = 2262/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.562 | DEBUG    | __main__:trials:29 - Trial = 2262/30000 | Total reward = 23.14
2022-01-26 14:16:34.565 | DEBUG    | __main__:trials:24 - Trial = 2263/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.566 | DEBUG    | __main__:trials:29 - Trial = 2263/30000 | Total reward = 55.08
2022-01-26 14:16:34.569 | DEBUG    | __main__:trials:24 - Trial = 2264/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.571 | DEBUG    | __main__:trials:29 - Trial = 2264/30000 | Total reward = 45.94
2022-01-26 14:16:34.574 | DEBUG    | __main__:trials:24 - Trial = 2265/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.576 | DEBUG    | __main__:trials:29 - Trial = 2265/30000 | Total reward = 54.92
2022-01-26 14:16:34.579 | DEBUG    | __main__:trials:24 - Trial = 2266/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.581 | DEBUG    | __main__:trials:29 - Trial = 2266/30000 | Total reward = 36.99
2022-01-26 14:16:34.585 | DEBUG    | __main__:trials:24 - Trial = 2267/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.586 | DEBUG    | __main__:trials:29 - Trial = 2267/30000 | Total reward = 50.43
2022-01-26 14:16:34.590 | DEBUG    | __main__:trials:24 - Trial = 2268/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.592 | DEBUG    | __main__:trials:29 - Trial = 2268/30000 | Total reward = 51.73
2022-01-26 14:16:34.596 | DEBUG    | __main__:trials:24 - Trial = 2269/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.597 | DEBUG    | __main__:trials:29 - Trial = 2269/30000 | Total reward = 32.76
2022-01-26 14:16:34.601 | DEBUG    | __main__:trials:24 - Trial = 2270/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.603 | DEBUG    | __main__:trials:29 - Trial = 2270/30000 | Total reward = 50.12
2022-01-26 14:16:34.606 | DEBUG    | __main__:trials:26 - Trial = 2271/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.608 | DEBUG    | __main__:trials:29 - Trial = 2271/30000 | Total reward = 22.62
2022-01-26 14:16:34.612 | DEBUG    | __main__:trials:24 - Trial = 2272/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.613 | DEBUG    | __main__:trials:29 - Trial = 2272/30000 | Total reward = 51.51
2022-01-26 14:16:34.617 | DEBUG    | __main__:trials:24 - Trial = 2273/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.618 | DEBUG    | __main__:trials:29 - Trial = 2273/30000 | Total reward = 49.92
2022-01-26 14:16:34.621 | DEBUG    | __main__:trials:24 - Trial = 2274/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.622 | DEBUG    | __main__:trials:29 - Trial = 2274/30000 | Total reward = 45.80
2022-01-26 14:16:34.625 | DEBUG    | __main__:trials:26 - Trial = 2275/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.626 | DEBUG    | __main__:trials:29 - Trial = 2275/30000 | Total reward = 23.06
2022-01-26 14:16:34.630 | DEBUG    | __main__:trials:24 - Trial = 2276/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.631 | DEBUG    | __main__:trials:29 - Trial = 2276/30000 | Total reward = 38.12
2022-01-26 14:16:34.635 | DEBUG    | __main__:trials:24 - Trial = 2277/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.637 | DEBUG    | __main__:trials:29 - Trial = 2277/30000 | Total reward = 55.03
2022-01-26 14:16:34.640 | DEBUG    | __main__:trials:24 - Trial = 2278/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.642 | DEBUG    | __main__:trials:29 - Trial = 2278/30000 | Total reward = 42.24
2022-01-26 14:16:34.645 | DEBUG    | __main__:trials:24 - Trial = 2279/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.647 | DEBUG    | __main__:trials:29 - Trial = 2279/30000 | Total reward = 50.83
2022-01-26 14:16:34.651 | DEBUG    | __main__:trials:24 - Trial = 2280/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.652 | DEBUG    | __main__:trials:29 - Trial = 2280/30000 | Total reward = 38.24
2022-01-26 14:16:34.656 | DEBUG    | __main__:trials:24 - Trial = 2281/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.658 | DEBUG    | __main__:trials:29 - Trial = 2281/30000 | Total reward = 53.36
2022-01-26 14:16:34.662 | DEBUG    | __main__:trials:24 - Trial = 2282/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.663 | DEBUG    | __main__:trials:29 - Trial = 2282/30000 | Total reward = 48.04
2022-01-26 14:16:34.667 | DEBUG    | __main__:trials:24 - Trial = 2283/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.669 | DEBUG    | __main__:trials:29 - Trial = 2283/30000 | Total reward = 41.64
2022-01-26 14:16:34.672 | DEBUG    | __main__:trials:24 - Trial = 2284/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.673 | DEBUG    | __main__:trials:29 - Trial = 2284/30000 | Total reward = 52.59
2022-01-26 14:16:34.676 | DEBUG    | __main__:trials:24 - Trial = 2285/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.678 | DEBUG    | __main__:trials:29 - Trial = 2285/30000 | Total reward = 50.56
2022-01-26 14:16:34.681 | DEBUG    | __main__:trials:24 - Trial = 2286/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.683 | DEBUG    | __main__:trials:29 - Trial = 2286/30000 | Total reward = 43.09
2022-01-26 14:16:34.686 | DEBUG    | __main__:trials:24 - Trial = 2287/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.688 | DEBUG    | __main__:trials:29 - Trial = 2287/30000 | Total reward = 39.97
2022-01-26 14:16:34.692 | DEBUG    | __main__:trials:24 - Trial = 2288/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.693 | DEBUG    | __main__:trials:29 - Trial = 2288/30000 | Total reward = 43.99
2022-01-26 14:16:34.697 | DEBUG    | __main__:trials:26 - Trial = 2289/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.698 | DEBUG    | __main__:trials:29 - Trial = 2289/30000 | Total reward = 23.53
2022-01-26 14:16:34.701 | DEBUG    | __main__:trials:24 - Trial = 2290/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.702 | DEBUG    | __main__:trials:29 - Trial = 2290/30000 | Total reward = 55.33
2022-01-26 14:16:34.705 | DEBUG    | __main__:trials:24 - Trial = 2291/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.707 | DEBUG    | __main__:trials:29 - Trial = 2291/30000 | Total reward = 37.99
2022-01-26 14:16:34.710 | DEBUG    | __main__:trials:24 - Trial = 2292/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.712 | DEBUG    | __main__:trials:29 - Trial = 2292/30000 | Total reward = 52.50
2022-01-26 14:16:34.715 | DEBUG    | __main__:trials:24 - Trial = 2293/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.717 | DEBUG    | __main__:trials:29 - Trial = 2293/30000 | Total reward = 50.72
2022-01-26 14:16:34.720 | DEBUG    | __main__:trials:24 - Trial = 2294/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.722 | DEBUG    | __main__:trials:29 - Trial = 2294/30000 | Total reward = 49.80
2022-01-26 14:16:34.725 | DEBUG    | __main__:trials:24 - Trial = 2295/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.727 | DEBUG    | __main__:trials:29 - Trial = 2295/30000 | Total reward = 52.32
2022-01-26 14:16:34.730 | DEBUG    | __main__:trials:24 - Trial = 2296/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.731 | DEBUG    | __main__:trials:29 - Trial = 2296/30000 | Total reward = 48.70
2022-01-26 14:16:34.735 | DEBUG    | __main__:trials:24 - Trial = 2297/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.736 | DEBUG    | __main__:trials:29 - Trial = 2297/30000 | Total reward = 49.07
2022-01-26 14:16:34.739 | DEBUG    | __main__:trials:24 - Trial = 2298/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.740 | DEBUG    | __main__:trials:29 - Trial = 2298/30000 | Total reward = 48.40
2022-01-26 14:16:34.743 | DEBUG    | __main__:trials:24 - Trial = 2299/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.744 | DEBUG    | __main__:trials:29 - Trial = 2299/30000 | Total reward = 47.25
2022-01-26 14:16:34.747 | DEBUG    | __main__:trials:24 - Trial = 2300/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.749 | DEBUG    | __main__:trials:29 - Trial = 2300/30000 | Total reward = 25.20
2022-01-26 14:16:34.752 | DEBUG    | __main__:trials:24 - Trial = 2301/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.754 | DEBUG    | __main__:trials:29 - Trial = 2301/30000 | Total reward = 51.19
2022-01-26 14:16:34.757 | DEBUG    | __main__:trials:24 - Trial = 2302/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.759 | DEBUG    | __main__:trials:29 - Trial = 2302/30000 | Total reward = 48.70
2022-01-26 14:16:34.762 | DEBUG    | __main__:trials:24 - Trial = 2303/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.764 | DEBUG    | __main__:trials:29 - Trial = 2303/30000 | Total reward = 47.77
2022-01-26 14:16:34.767 | DEBUG    | __main__:trials:24 - Trial = 2304/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.769 | DEBUG    | __main__:trials:29 - Trial = 2304/30000 | Total reward = 53.34
2022-01-26 14:16:34.773 | DEBUG    | __main__:trials:24 - Trial = 2305/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.775 | DEBUG    | __main__:trials:29 - Trial = 2305/30000 | Total reward = 52.26
2022-01-26 14:16:34.779 | DEBUG    | __main__:trials:24 - Trial = 2306/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.780 | DEBUG    | __main__:trials:29 - Trial = 2306/30000 | Total reward = 48.85
2022-01-26 14:16:34.784 | DEBUG    | __main__:trials:24 - Trial = 2307/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.786 | DEBUG    | __main__:trials:29 - Trial = 2307/30000 | Total reward = 50.62
2022-01-26 14:16:34.789 | DEBUG    | __main__:trials:24 - Trial = 2308/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.791 | DEBUG    | __main__:trials:29 - Trial = 2308/30000 | Total reward = 41.16
2022-01-26 14:16:34.795 | DEBUG    | __main__:trials:24 - Trial = 2309/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.796 | DEBUG    | __main__:trials:29 - Trial = 2309/30000 | Total reward = 49.45
2022-01-26 14:16:34.800 | DEBUG    | __main__:trials:24 - Trial = 2310/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.802 | DEBUG    | __main__:trials:29 - Trial = 2310/30000 | Total reward = 54.62
2022-01-26 14:16:34.806 | DEBUG    | __main__:trials:24 - Trial = 2311/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.807 | DEBUG    | __main__:trials:29 - Trial = 2311/30000 | Total reward = 27.97
2022-01-26 14:16:34.811 | DEBUG    | __main__:trials:24 - Trial = 2312/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.813 | DEBUG    | __main__:trials:29 - Trial = 2312/30000 | Total reward = 47.87
2022-01-26 14:16:34.816 | DEBUG    | __main__:trials:24 - Trial = 2313/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.817 | DEBUG    | __main__:trials:29 - Trial = 2313/30000 | Total reward = 52.37
2022-01-26 14:16:34.820 | DEBUG    | __main__:trials:24 - Trial = 2314/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.822 | DEBUG    | __main__:trials:29 - Trial = 2314/30000 | Total reward = 52.98
2022-01-26 14:16:34.826 | DEBUG    | __main__:trials:24 - Trial = 2315/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.827 | DEBUG    | __main__:trials:29 - Trial = 2315/30000 | Total reward = 51.44
2022-01-26 14:16:34.831 | DEBUG    | __main__:trials:24 - Trial = 2316/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.832 | DEBUG    | __main__:trials:29 - Trial = 2316/30000 | Total reward = 47.04
2022-01-26 14:16:34.836 | DEBUG    | __main__:trials:24 - Trial = 2317/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.838 | DEBUG    | __main__:trials:29 - Trial = 2317/30000 | Total reward = 47.53
2022-01-26 14:16:34.841 | DEBUG    | __main__:trials:26 - Trial = 2318/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.842 | DEBUG    | __main__:trials:29 - Trial = 2318/30000 | Total reward = 22.83
2022-01-26 14:16:34.846 | DEBUG    | __main__:trials:24 - Trial = 2319/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.848 | DEBUG    | __main__:trials:29 - Trial = 2319/30000 | Total reward = 53.57
2022-01-26 14:16:34.852 | DEBUG    | __main__:trials:24 - Trial = 2320/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.852 | DEBUG    | __main__:trials:29 - Trial = 2320/30000 | Total reward = 50.99
2022-01-26 14:16:34.856 | DEBUG    | __main__:trials:24 - Trial = 2321/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.858 | DEBUG    | __main__:trials:29 - Trial = 2321/30000 | Total reward = 55.59
2022-01-26 14:16:34.861 | DEBUG    | __main__:trials:24 - Trial = 2322/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.862 | DEBUG    | __main__:trials:29 - Trial = 2322/30000 | Total reward = 41.06
2022-01-26 14:16:34.865 | DEBUG    | __main__:trials:24 - Trial = 2323/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.866 | DEBUG    | __main__:trials:29 - Trial = 2323/30000 | Total reward = 57.10
2022-01-26 14:16:34.870 | DEBUG    | __main__:trials:24 - Trial = 2324/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.872 | DEBUG    | __main__:trials:29 - Trial = 2324/30000 | Total reward = 53.53
2022-01-26 14:16:34.875 | DEBUG    | __main__:trials:24 - Trial = 2325/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.877 | DEBUG    | __main__:trials:29 - Trial = 2325/30000 | Total reward = 47.99
2022-01-26 14:16:34.881 | DEBUG    | __main__:trials:24 - Trial = 2326/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.881 | DEBUG    | __main__:trials:29 - Trial = 2326/30000 | Total reward = 52.16
2022-01-26 14:16:34.885 | DEBUG    | __main__:trials:24 - Trial = 2327/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.886 | DEBUG    | __main__:trials:29 - Trial = 2327/30000 | Total reward = 49.61
2022-01-26 14:16:34.889 | DEBUG    | __main__:trials:24 - Trial = 2328/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.891 | DEBUG    | __main__:trials:29 - Trial = 2328/30000 | Total reward = 51.57
2022-01-26 14:16:34.894 | DEBUG    | __main__:trials:26 - Trial = 2329/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.895 | DEBUG    | __main__:trials:29 - Trial = 2329/30000 | Total reward = 29.91
2022-01-26 14:16:34.898 | DEBUG    | __main__:trials:24 - Trial = 2330/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.900 | DEBUG    | __main__:trials:29 - Trial = 2330/30000 | Total reward = 53.73
2022-01-26 14:16:34.905 | DEBUG    | __main__:trials:24 - Trial = 2331/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.906 | DEBUG    | __main__:trials:29 - Trial = 2331/30000 | Total reward = 55.20
2022-01-26 14:16:34.910 | DEBUG    | __main__:trials:24 - Trial = 2332/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.912 | DEBUG    | __main__:trials:29 - Trial = 2332/30000 | Total reward = 52.51
2022-01-26 14:16:34.915 | DEBUG    | __main__:trials:24 - Trial = 2333/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.917 | DEBUG    | __main__:trials:29 - Trial = 2333/30000 | Total reward = 65.25
2022-01-26 14:16:34.920 | DEBUG    | __main__:trials:24 - Trial = 2334/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.922 | DEBUG    | __main__:trials:29 - Trial = 2334/30000 | Total reward = 52.76
2022-01-26 14:16:34.926 | DEBUG    | __main__:trials:24 - Trial = 2335/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.927 | DEBUG    | __main__:trials:29 - Trial = 2335/30000 | Total reward = 50.54
2022-01-26 14:16:34.931 | DEBUG    | __main__:trials:24 - Trial = 2336/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.933 | DEBUG    | __main__:trials:29 - Trial = 2336/30000 | Total reward = 50.08
2022-01-26 14:16:34.937 | DEBUG    | __main__:trials:24 - Trial = 2337/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.938 | DEBUG    | __main__:trials:29 - Trial = 2337/30000 | Total reward = 53.47
2022-01-26 14:16:34.941 | DEBUG    | __main__:trials:26 - Trial = 2338/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.942 | DEBUG    | __main__:trials:29 - Trial = 2338/30000 | Total reward = 22.17
2022-01-26 14:16:34.945 | DEBUG    | __main__:trials:24 - Trial = 2339/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.947 | DEBUG    | __main__:trials:29 - Trial = 2339/30000 | Total reward = 33.39
2022-01-26 14:16:34.951 | DEBUG    | __main__:trials:24 - Trial = 2340/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.953 | DEBUG    | __main__:trials:29 - Trial = 2340/30000 | Total reward = 47.25
2022-01-26 14:16:34.955 | DEBUG    | __main__:trials:24 - Trial = 2341/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.957 | DEBUG    | __main__:trials:29 - Trial = 2341/30000 | Total reward = 55.92
2022-01-26 14:16:34.961 | DEBUG    | __main__:trials:26 - Trial = 2342/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:34.963 | DEBUG    | __main__:trials:29 - Trial = 2342/30000 | Total reward = 38.82
2022-01-26 14:16:34.967 | DEBUG    | __main__:trials:24 - Trial = 2343/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.968 | DEBUG    | __main__:trials:29 - Trial = 2343/30000 | Total reward = 52.35
2022-01-26 14:16:34.972 | DEBUG    | __main__:trials:24 - Trial = 2344/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.974 | DEBUG    | __main__:trials:29 - Trial = 2344/30000 | Total reward = 56.93
2022-01-26 14:16:34.978 | DEBUG    | __main__:trials:24 - Trial = 2345/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.979 | DEBUG    | __main__:trials:29 - Trial = 2345/30000 | Total reward = 49.88
2022-01-26 14:16:34.983 | DEBUG    | __main__:trials:24 - Trial = 2346/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.985 | DEBUG    | __main__:trials:29 - Trial = 2346/30000 | Total reward = 38.35
2022-01-26 14:16:34.988 | DEBUG    | __main__:trials:24 - Trial = 2347/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.989 | DEBUG    | __main__:trials:29 - Trial = 2347/30000 | Total reward = 47.25
2022-01-26 14:16:34.993 | DEBUG    | __main__:trials:24 - Trial = 2348/30000 | Max number of steps (20) reached
2022-01-26 14:16:34.995 | DEBUG    | __main__:trials:29 - Trial = 2348/30000 | Total reward = 56.05
2022-01-26 14:16:34.998 | DEBUG    | __main__:trials:24 - Trial = 2349/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.000 | DEBUG    | __main__:trials:29 - Trial = 2349/30000 | Total reward = 44.89
2022-01-26 14:16:35.004 | DEBUG    | __main__:trials:24 - Trial = 2350/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.005 | DEBUG    | __main__:trials:29 - Trial = 2350/30000 | Total reward = 54.25
2022-01-26 14:16:35.008 | DEBUG    | __main__:trials:24 - Trial = 2351/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.010 | DEBUG    | __main__:trials:29 - Trial = 2351/30000 | Total reward = 45.52
2022-01-26 14:16:35.014 | DEBUG    | __main__:trials:24 - Trial = 2352/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.015 | DEBUG    | __main__:trials:29 - Trial = 2352/30000 | Total reward = 51.57
2022-01-26 14:16:35.019 | DEBUG    | __main__:trials:24 - Trial = 2353/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.020 | DEBUG    | __main__:trials:29 - Trial = 2353/30000 | Total reward = 49.66
2022-01-26 14:16:35.025 | DEBUG    | __main__:trials:24 - Trial = 2354/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.027 | DEBUG    | __main__:trials:29 - Trial = 2354/30000 | Total reward = 55.21
2022-01-26 14:16:35.030 | DEBUG    | __main__:trials:24 - Trial = 2355/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.032 | DEBUG    | __main__:trials:29 - Trial = 2355/30000 | Total reward = 49.05
2022-01-26 14:16:35.036 | DEBUG    | __main__:trials:24 - Trial = 2356/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.037 | DEBUG    | __main__:trials:29 - Trial = 2356/30000 | Total reward = 49.81
2022-01-26 14:16:35.041 | DEBUG    | __main__:trials:24 - Trial = 2357/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.042 | DEBUG    | __main__:trials:29 - Trial = 2357/30000 | Total reward = 44.07
2022-01-26 14:16:35.046 | DEBUG    | __main__:trials:24 - Trial = 2358/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.047 | DEBUG    | __main__:trials:29 - Trial = 2358/30000 | Total reward = 47.52
2022-01-26 14:16:35.051 | DEBUG    | __main__:trials:24 - Trial = 2359/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.053 | DEBUG    | __main__:trials:29 - Trial = 2359/30000 | Total reward = 41.51
2022-01-26 14:16:35.056 | DEBUG    | __main__:trials:24 - Trial = 2360/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.058 | DEBUG    | __main__:trials:29 - Trial = 2360/30000 | Total reward = 52.16
2022-01-26 14:16:35.062 | DEBUG    | __main__:trials:24 - Trial = 2361/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.063 | DEBUG    | __main__:trials:29 - Trial = 2361/30000 | Total reward = 50.22
2022-01-26 14:16:35.067 | DEBUG    | __main__:trials:24 - Trial = 2362/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.068 | DEBUG    | __main__:trials:29 - Trial = 2362/30000 | Total reward = 44.27
2022-01-26 14:16:35.072 | DEBUG    | __main__:trials:24 - Trial = 2363/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.074 | DEBUG    | __main__:trials:29 - Trial = 2363/30000 | Total reward = 50.43
2022-01-26 14:16:35.077 | DEBUG    | __main__:trials:26 - Trial = 2364/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.079 | DEBUG    | __main__:trials:29 - Trial = 2364/30000 | Total reward = 24.32
2022-01-26 14:16:35.083 | DEBUG    | __main__:trials:24 - Trial = 2365/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.083 | DEBUG    | __main__:trials:29 - Trial = 2365/30000 | Total reward = 53.21
2022-01-26 14:16:35.176 | DEBUG    | __main__:trials:24 - Trial = 2366/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.177 | DEBUG    | __main__:trials:29 - Trial = 2366/30000 | Total reward = 46.89
2022-01-26 14:16:35.180 | DEBUG    | __main__:trials:24 - Trial = 2367/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.182 | DEBUG    | __main__:trials:29 - Trial = 2367/30000 | Total reward = 47.16
2022-01-26 14:16:35.185 | DEBUG    | __main__:trials:24 - Trial = 2368/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.186 | DEBUG    | __main__:trials:29 - Trial = 2368/30000 | Total reward = 29.95
2022-01-26 14:16:35.189 | DEBUG    | __main__:trials:24 - Trial = 2369/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.191 | DEBUG    | __main__:trials:29 - Trial = 2369/30000 | Total reward = 53.69
2022-01-26 14:16:35.195 | DEBUG    | __main__:trials:24 - Trial = 2370/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.196 | DEBUG    | __main__:trials:29 - Trial = 2370/30000 | Total reward = 56.06
2022-01-26 14:16:35.200 | DEBUG    | __main__:trials:24 - Trial = 2371/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.202 | DEBUG    | __main__:trials:29 - Trial = 2371/30000 | Total reward = 49.78
2022-01-26 14:16:35.205 | DEBUG    | __main__:trials:24 - Trial = 2372/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.207 | DEBUG    | __main__:trials:29 - Trial = 2372/30000 | Total reward = 49.85
2022-01-26 14:16:35.211 | DEBUG    | __main__:trials:24 - Trial = 2373/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.212 | DEBUG    | __main__:trials:29 - Trial = 2373/30000 | Total reward = 50.92
2022-01-26 14:16:35.216 | DEBUG    | __main__:trials:24 - Trial = 2374/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.217 | DEBUG    | __main__:trials:29 - Trial = 2374/30000 | Total reward = 52.53
2022-01-26 14:16:35.221 | DEBUG    | __main__:trials:24 - Trial = 2375/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.223 | DEBUG    | __main__:trials:29 - Trial = 2375/30000 | Total reward = 49.97
2022-01-26 14:16:35.226 | DEBUG    | __main__:trials:24 - Trial = 2376/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.228 | DEBUG    | __main__:trials:29 - Trial = 2376/30000 | Total reward = 49.66
2022-01-26 14:16:35.231 | DEBUG    | __main__:trials:24 - Trial = 2377/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.233 | DEBUG    | __main__:trials:29 - Trial = 2377/30000 | Total reward = 34.45
2022-01-26 14:16:35.236 | DEBUG    | __main__:trials:24 - Trial = 2378/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.237 | DEBUG    | __main__:trials:29 - Trial = 2378/30000 | Total reward = 55.93
2022-01-26 14:16:35.241 | DEBUG    | __main__:trials:24 - Trial = 2379/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.242 | DEBUG    | __main__:trials:29 - Trial = 2379/30000 | Total reward = 49.73
2022-01-26 14:16:35.246 | DEBUG    | __main__:trials:24 - Trial = 2380/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.246 | DEBUG    | __main__:trials:29 - Trial = 2380/30000 | Total reward = 44.68
2022-01-26 14:16:35.251 | DEBUG    | __main__:trials:24 - Trial = 2381/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.252 | DEBUG    | __main__:trials:29 - Trial = 2381/30000 | Total reward = 44.22
2022-01-26 14:16:35.256 | DEBUG    | __main__:trials:24 - Trial = 2382/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.256 | DEBUG    | __main__:trials:29 - Trial = 2382/30000 | Total reward = 61.75
2022-01-26 14:16:35.260 | DEBUG    | __main__:trials:24 - Trial = 2383/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.262 | DEBUG    | __main__:trials:29 - Trial = 2383/30000 | Total reward = 52.90
2022-01-26 14:16:35.266 | DEBUG    | __main__:trials:24 - Trial = 2384/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.267 | DEBUG    | __main__:trials:29 - Trial = 2384/30000 | Total reward = 20.03
2022-01-26 14:16:35.271 | DEBUG    | __main__:trials:24 - Trial = 2385/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.272 | DEBUG    | __main__:trials:29 - Trial = 2385/30000 | Total reward = 39.07
2022-01-26 14:16:35.275 | DEBUG    | __main__:trials:24 - Trial = 2386/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.277 | DEBUG    | __main__:trials:29 - Trial = 2386/30000 | Total reward = 49.73
2022-01-26 14:16:35.281 | DEBUG    | __main__:trials:24 - Trial = 2387/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.283 | DEBUG    | __main__:trials:29 - Trial = 2387/30000 | Total reward = 32.39
2022-01-26 14:16:35.286 | DEBUG    | __main__:trials:24 - Trial = 2388/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.288 | DEBUG    | __main__:trials:29 - Trial = 2388/30000 | Total reward = 46.45
2022-01-26 14:16:35.292 | DEBUG    | __main__:trials:24 - Trial = 2389/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.293 | DEBUG    | __main__:trials:29 - Trial = 2389/30000 | Total reward = 37.29
2022-01-26 14:16:35.296 | DEBUG    | __main__:trials:24 - Trial = 2390/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.298 | DEBUG    | __main__:trials:29 - Trial = 2390/30000 | Total reward = 53.08
2022-01-26 14:16:35.302 | DEBUG    | __main__:trials:24 - Trial = 2391/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.303 | DEBUG    | __main__:trials:29 - Trial = 2391/30000 | Total reward = 38.66
2022-01-26 14:16:35.307 | DEBUG    | __main__:trials:24 - Trial = 2392/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.308 | DEBUG    | __main__:trials:29 - Trial = 2392/30000 | Total reward = 49.40
2022-01-26 14:16:35.312 | DEBUG    | __main__:trials:24 - Trial = 2393/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.314 | DEBUG    | __main__:trials:29 - Trial = 2393/30000 | Total reward = 47.59
2022-01-26 14:16:35.317 | DEBUG    | __main__:trials:24 - Trial = 2394/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.318 | DEBUG    | __main__:trials:29 - Trial = 2394/30000 | Total reward = 50.32
2022-01-26 14:16:35.322 | DEBUG    | __main__:trials:24 - Trial = 2395/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.323 | DEBUG    | __main__:trials:29 - Trial = 2395/30000 | Total reward = 52.80
2022-01-26 14:16:35.326 | DEBUG    | __main__:trials:24 - Trial = 2396/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.327 | DEBUG    | __main__:trials:29 - Trial = 2396/30000 | Total reward = 52.44
2022-01-26 14:16:35.331 | DEBUG    | __main__:trials:24 - Trial = 2397/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.332 | DEBUG    | __main__:trials:29 - Trial = 2397/30000 | Total reward = 47.09
2022-01-26 14:16:35.336 | DEBUG    | __main__:trials:24 - Trial = 2398/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.338 | DEBUG    | __main__:trials:29 - Trial = 2398/30000 | Total reward = 59.72
2022-01-26 14:16:35.341 | DEBUG    | __main__:trials:24 - Trial = 2399/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.343 | DEBUG    | __main__:trials:29 - Trial = 2399/30000 | Total reward = 47.70
2022-01-26 14:16:35.347 | DEBUG    | __main__:trials:24 - Trial = 2400/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.348 | DEBUG    | __main__:trials:29 - Trial = 2400/30000 | Total reward = 50.43
2022-01-26 14:16:35.352 | DEBUG    | __main__:trials:24 - Trial = 2401/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.352 | DEBUG    | __main__:trials:29 - Trial = 2401/30000 | Total reward = 52.82
2022-01-26 14:16:35.356 | DEBUG    | __main__:trials:24 - Trial = 2402/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.358 | DEBUG    | __main__:trials:29 - Trial = 2402/30000 | Total reward = 52.77
2022-01-26 14:16:35.361 | DEBUG    | __main__:trials:24 - Trial = 2403/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.363 | DEBUG    | __main__:trials:29 - Trial = 2403/30000 | Total reward = 27.71
2022-01-26 14:16:35.367 | DEBUG    | __main__:trials:24 - Trial = 2404/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.368 | DEBUG    | __main__:trials:29 - Trial = 2404/30000 | Total reward = 26.79
2022-01-26 14:16:35.372 | DEBUG    | __main__:trials:24 - Trial = 2405/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.373 | DEBUG    | __main__:trials:29 - Trial = 2405/30000 | Total reward = 47.63
2022-01-26 14:16:35.377 | DEBUG    | __main__:trials:24 - Trial = 2406/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.378 | DEBUG    | __main__:trials:29 - Trial = 2406/30000 | Total reward = 51.22
2022-01-26 14:16:35.382 | DEBUG    | __main__:trials:24 - Trial = 2407/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.383 | DEBUG    | __main__:trials:29 - Trial = 2407/30000 | Total reward = 49.68
2022-01-26 14:16:35.387 | DEBUG    | __main__:trials:24 - Trial = 2408/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.388 | DEBUG    | __main__:trials:29 - Trial = 2408/30000 | Total reward = 46.90
2022-01-26 14:16:35.391 | DEBUG    | __main__:trials:24 - Trial = 2409/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.393 | DEBUG    | __main__:trials:29 - Trial = 2409/30000 | Total reward = 52.94
2022-01-26 14:16:35.397 | DEBUG    | __main__:trials:24 - Trial = 2410/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.399 | DEBUG    | __main__:trials:29 - Trial = 2410/30000 | Total reward = 45.97
2022-01-26 14:16:35.402 | DEBUG    | __main__:trials:24 - Trial = 2411/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.403 | DEBUG    | __main__:trials:29 - Trial = 2411/30000 | Total reward = 50.17
2022-01-26 14:16:35.407 | DEBUG    | __main__:trials:24 - Trial = 2412/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.409 | DEBUG    | __main__:trials:29 - Trial = 2412/30000 | Total reward = 54.54
2022-01-26 14:16:35.412 | DEBUG    | __main__:trials:26 - Trial = 2413/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.413 | DEBUG    | __main__:trials:29 - Trial = 2413/30000 | Total reward = 16.01
2022-01-26 14:16:35.417 | DEBUG    | __main__:trials:24 - Trial = 2414/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.418 | DEBUG    | __main__:trials:29 - Trial = 2414/30000 | Total reward = 43.20
2022-01-26 14:16:35.421 | DEBUG    | __main__:trials:24 - Trial = 2415/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.422 | DEBUG    | __main__:trials:29 - Trial = 2415/30000 | Total reward = 52.74
2022-01-26 14:16:35.425 | DEBUG    | __main__:trials:24 - Trial = 2416/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.426 | DEBUG    | __main__:trials:29 - Trial = 2416/30000 | Total reward = 52.75
2022-01-26 14:16:35.430 | DEBUG    | __main__:trials:24 - Trial = 2417/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.431 | DEBUG    | __main__:trials:29 - Trial = 2417/30000 | Total reward = 57.75
2022-01-26 14:16:35.434 | DEBUG    | __main__:trials:24 - Trial = 2418/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.435 | DEBUG    | __main__:trials:29 - Trial = 2418/30000 | Total reward = 52.72
2022-01-26 14:16:35.438 | DEBUG    | __main__:trials:24 - Trial = 2419/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.440 | DEBUG    | __main__:trials:29 - Trial = 2419/30000 | Total reward = 42.12
2022-01-26 14:16:35.444 | DEBUG    | __main__:trials:24 - Trial = 2420/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.445 | DEBUG    | __main__:trials:29 - Trial = 2420/30000 | Total reward = 58.68
2022-01-26 14:16:35.449 | DEBUG    | __main__:trials:24 - Trial = 2421/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.450 | DEBUG    | __main__:trials:29 - Trial = 2421/30000 | Total reward = 57.62
2022-01-26 14:16:35.454 | DEBUG    | __main__:trials:24 - Trial = 2422/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.455 | DEBUG    | __main__:trials:29 - Trial = 2422/30000 | Total reward = 45.49
2022-01-26 14:16:35.458 | DEBUG    | __main__:trials:26 - Trial = 2423/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.460 | DEBUG    | __main__:trials:29 - Trial = 2423/30000 | Total reward = 11.25
2022-01-26 14:16:35.463 | DEBUG    | __main__:trials:26 - Trial = 2424/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.464 | DEBUG    | __main__:trials:29 - Trial = 2424/30000 | Total reward = 43.22
2022-01-26 14:16:35.467 | DEBUG    | __main__:trials:24 - Trial = 2425/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.469 | DEBUG    | __main__:trials:29 - Trial = 2425/30000 | Total reward = 53.16
2022-01-26 14:16:35.472 | DEBUG    | __main__:trials:24 - Trial = 2426/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.474 | DEBUG    | __main__:trials:29 - Trial = 2426/30000 | Total reward = 50.86
2022-01-26 14:16:35.477 | DEBUG    | __main__:trials:24 - Trial = 2427/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.479 | DEBUG    | __main__:trials:29 - Trial = 2427/30000 | Total reward = 36.83
2022-01-26 14:16:35.483 | DEBUG    | __main__:trials:24 - Trial = 2428/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.484 | DEBUG    | __main__:trials:29 - Trial = 2428/30000 | Total reward = 45.40
2022-01-26 14:16:35.488 | DEBUG    | __main__:trials:24 - Trial = 2429/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.489 | DEBUG    | __main__:trials:29 - Trial = 2429/30000 | Total reward = 54.23
2022-01-26 14:16:35.493 | DEBUG    | __main__:trials:24 - Trial = 2430/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.493 | DEBUG    | __main__:trials:29 - Trial = 2430/30000 | Total reward = 59.57
2022-01-26 14:16:35.496 | DEBUG    | __main__:trials:24 - Trial = 2431/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.498 | DEBUG    | __main__:trials:29 - Trial = 2431/30000 | Total reward = 50.66
2022-01-26 14:16:35.501 | DEBUG    | __main__:trials:24 - Trial = 2432/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.501 | DEBUG    | __main__:trials:29 - Trial = 2432/30000 | Total reward = 31.71
2022-01-26 14:16:35.506 | DEBUG    | __main__:trials:24 - Trial = 2433/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.507 | DEBUG    | __main__:trials:29 - Trial = 2433/30000 | Total reward = 44.70
2022-01-26 14:16:35.511 | DEBUG    | __main__:trials:24 - Trial = 2434/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.512 | DEBUG    | __main__:trials:29 - Trial = 2434/30000 | Total reward = 47.20
2022-01-26 14:16:35.516 | DEBUG    | __main__:trials:26 - Trial = 2435/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.517 | DEBUG    | __main__:trials:29 - Trial = 2435/30000 | Total reward = 13.87
2022-01-26 14:16:35.521 | DEBUG    | __main__:trials:24 - Trial = 2436/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.522 | DEBUG    | __main__:trials:29 - Trial = 2436/30000 | Total reward = 49.22
2022-01-26 14:16:35.526 | DEBUG    | __main__:trials:24 - Trial = 2437/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.528 | DEBUG    | __main__:trials:29 - Trial = 2437/30000 | Total reward = 57.45
2022-01-26 14:16:35.531 | DEBUG    | __main__:trials:24 - Trial = 2438/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.532 | DEBUG    | __main__:trials:29 - Trial = 2438/30000 | Total reward = 49.48
2022-01-26 14:16:35.536 | DEBUG    | __main__:trials:24 - Trial = 2439/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.538 | DEBUG    | __main__:trials:29 - Trial = 2439/30000 | Total reward = 29.00
2022-01-26 14:16:35.542 | DEBUG    | __main__:trials:24 - Trial = 2440/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.543 | DEBUG    | __main__:trials:29 - Trial = 2440/30000 | Total reward = 59.44
2022-01-26 14:16:35.547 | DEBUG    | __main__:trials:24 - Trial = 2441/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.548 | DEBUG    | __main__:trials:29 - Trial = 2441/30000 | Total reward = 52.23
2022-01-26 14:16:35.552 | DEBUG    | __main__:trials:24 - Trial = 2442/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.553 | DEBUG    | __main__:trials:29 - Trial = 2442/30000 | Total reward = 52.32
2022-01-26 14:16:35.557 | DEBUG    | __main__:trials:24 - Trial = 2443/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.558 | DEBUG    | __main__:trials:29 - Trial = 2443/30000 | Total reward = 49.40
2022-01-26 14:16:35.562 | DEBUG    | __main__:trials:24 - Trial = 2444/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.563 | DEBUG    | __main__:trials:29 - Trial = 2444/30000 | Total reward = 53.04
2022-01-26 14:16:35.567 | DEBUG    | __main__:trials:24 - Trial = 2445/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.568 | DEBUG    | __main__:trials:29 - Trial = 2445/30000 | Total reward = 42.31
2022-01-26 14:16:35.572 | DEBUG    | __main__:trials:24 - Trial = 2446/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.572 | DEBUG    | __main__:trials:29 - Trial = 2446/30000 | Total reward = 52.41
2022-01-26 14:16:35.577 | DEBUG    | __main__:trials:24 - Trial = 2447/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.579 | DEBUG    | __main__:trials:29 - Trial = 2447/30000 | Total reward = 50.53
2022-01-26 14:16:35.583 | DEBUG    | __main__:trials:24 - Trial = 2448/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.585 | DEBUG    | __main__:trials:29 - Trial = 2448/30000 | Total reward = 49.57
2022-01-26 14:16:35.588 | DEBUG    | __main__:trials:24 - Trial = 2449/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.590 | DEBUG    | __main__:trials:29 - Trial = 2449/30000 | Total reward = 50.64
2022-01-26 14:16:35.593 | DEBUG    | __main__:trials:24 - Trial = 2450/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.595 | DEBUG    | __main__:trials:29 - Trial = 2450/30000 | Total reward = 52.86
2022-01-26 14:16:35.599 | DEBUG    | __main__:trials:24 - Trial = 2451/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.600 | DEBUG    | __main__:trials:29 - Trial = 2451/30000 | Total reward = 45.28
2022-01-26 14:16:35.604 | DEBUG    | __main__:trials:24 - Trial = 2452/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.605 | DEBUG    | __main__:trials:29 - Trial = 2452/30000 | Total reward = 41.67
2022-01-26 14:16:35.608 | DEBUG    | __main__:trials:24 - Trial = 2453/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.610 | DEBUG    | __main__:trials:29 - Trial = 2453/30000 | Total reward = 38.15
2022-01-26 14:16:35.613 | DEBUG    | __main__:trials:24 - Trial = 2454/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.614 | DEBUG    | __main__:trials:29 - Trial = 2454/30000 | Total reward = 49.09
2022-01-26 14:16:35.618 | DEBUG    | __main__:trials:24 - Trial = 2455/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.619 | DEBUG    | __main__:trials:29 - Trial = 2455/30000 | Total reward = 55.55
2022-01-26 14:16:35.623 | DEBUG    | __main__:trials:24 - Trial = 2456/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.625 | DEBUG    | __main__:trials:29 - Trial = 2456/30000 | Total reward = 53.47
2022-01-26 14:16:35.628 | DEBUG    | __main__:trials:24 - Trial = 2457/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.630 | DEBUG    | __main__:trials:29 - Trial = 2457/30000 | Total reward = 48.80
2022-01-26 14:16:35.634 | DEBUG    | __main__:trials:24 - Trial = 2458/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.635 | DEBUG    | __main__:trials:29 - Trial = 2458/30000 | Total reward = 45.66
2022-01-26 14:16:35.638 | DEBUG    | __main__:trials:24 - Trial = 2459/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.640 | DEBUG    | __main__:trials:29 - Trial = 2459/30000 | Total reward = 48.31
2022-01-26 14:16:35.644 | DEBUG    | __main__:trials:24 - Trial = 2460/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.644 | DEBUG    | __main__:trials:29 - Trial = 2460/30000 | Total reward = 48.28
2022-01-26 14:16:35.648 | DEBUG    | __main__:trials:24 - Trial = 2461/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.650 | DEBUG    | __main__:trials:29 - Trial = 2461/30000 | Total reward = 50.19
2022-01-26 14:16:35.654 | DEBUG    | __main__:trials:24 - Trial = 2462/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.654 | DEBUG    | __main__:trials:29 - Trial = 2462/30000 | Total reward = 54.59
2022-01-26 14:16:35.658 | DEBUG    | __main__:trials:24 - Trial = 2463/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.659 | DEBUG    | __main__:trials:29 - Trial = 2463/30000 | Total reward = 54.63
2022-01-26 14:16:35.663 | DEBUG    | __main__:trials:24 - Trial = 2464/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.665 | DEBUG    | __main__:trials:29 - Trial = 2464/30000 | Total reward = 47.07
2022-01-26 14:16:35.669 | DEBUG    | __main__:trials:24 - Trial = 2465/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.670 | DEBUG    | __main__:trials:29 - Trial = 2465/30000 | Total reward = 61.11
2022-01-26 14:16:35.674 | DEBUG    | __main__:trials:24 - Trial = 2466/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.674 | DEBUG    | __main__:trials:29 - Trial = 2466/30000 | Total reward = 51.56
2022-01-26 14:16:35.679 | DEBUG    | __main__:trials:26 - Trial = 2467/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.680 | DEBUG    | __main__:trials:29 - Trial = 2467/30000 | Total reward = 27.78
2022-01-26 14:16:35.684 | DEBUG    | __main__:trials:24 - Trial = 2468/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.685 | DEBUG    | __main__:trials:29 - Trial = 2468/30000 | Total reward = 51.98
2022-01-26 14:16:35.689 | DEBUG    | __main__:trials:24 - Trial = 2469/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.690 | DEBUG    | __main__:trials:29 - Trial = 2469/30000 | Total reward = 50.75
2022-01-26 14:16:35.694 | DEBUG    | __main__:trials:24 - Trial = 2470/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.695 | DEBUG    | __main__:trials:29 - Trial = 2470/30000 | Total reward = 50.51
2022-01-26 14:16:35.699 | DEBUG    | __main__:trials:24 - Trial = 2471/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.700 | DEBUG    | __main__:trials:29 - Trial = 2471/30000 | Total reward = 50.58
2022-01-26 14:16:35.704 | DEBUG    | __main__:trials:24 - Trial = 2472/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.706 | DEBUG    | __main__:trials:29 - Trial = 2472/30000 | Total reward = 49.26
2022-01-26 14:16:35.709 | DEBUG    | __main__:trials:24 - Trial = 2473/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.711 | DEBUG    | __main__:trials:29 - Trial = 2473/30000 | Total reward = 44.88
2022-01-26 14:16:35.714 | DEBUG    | __main__:trials:24 - Trial = 2474/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.715 | DEBUG    | __main__:trials:29 - Trial = 2474/30000 | Total reward = 54.21
2022-01-26 14:16:35.718 | DEBUG    | __main__:trials:24 - Trial = 2475/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.720 | DEBUG    | __main__:trials:29 - Trial = 2475/30000 | Total reward = 47.37
2022-01-26 14:16:35.724 | DEBUG    | __main__:trials:24 - Trial = 2476/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.725 | DEBUG    | __main__:trials:29 - Trial = 2476/30000 | Total reward = 48.05
2022-01-26 14:16:35.729 | DEBUG    | __main__:trials:24 - Trial = 2477/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.730 | DEBUG    | __main__:trials:29 - Trial = 2477/30000 | Total reward = 46.38
2022-01-26 14:16:35.734 | DEBUG    | __main__:trials:24 - Trial = 2478/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.736 | DEBUG    | __main__:trials:29 - Trial = 2478/30000 | Total reward = 28.58
2022-01-26 14:16:35.739 | DEBUG    | __main__:trials:24 - Trial = 2479/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.740 | DEBUG    | __main__:trials:29 - Trial = 2479/30000 | Total reward = 55.72
2022-01-26 14:16:35.744 | DEBUG    | __main__:trials:24 - Trial = 2480/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.745 | DEBUG    | __main__:trials:29 - Trial = 2480/30000 | Total reward = 50.59
2022-01-26 14:16:35.748 | DEBUG    | __main__:trials:24 - Trial = 2481/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.750 | DEBUG    | __main__:trials:29 - Trial = 2481/30000 | Total reward = 49.43
2022-01-26 14:16:35.754 | DEBUG    | __main__:trials:24 - Trial = 2482/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.755 | DEBUG    | __main__:trials:29 - Trial = 2482/30000 | Total reward = 54.08
2022-01-26 14:16:35.758 | DEBUG    | __main__:trials:24 - Trial = 2483/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.760 | DEBUG    | __main__:trials:29 - Trial = 2483/30000 | Total reward = 48.16
2022-01-26 14:16:35.763 | DEBUG    | __main__:trials:24 - Trial = 2484/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.765 | DEBUG    | __main__:trials:29 - Trial = 2484/30000 | Total reward = 43.35
2022-01-26 14:16:35.768 | DEBUG    | __main__:trials:24 - Trial = 2485/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.770 | DEBUG    | __main__:trials:29 - Trial = 2485/30000 | Total reward = 46.30
2022-01-26 14:16:35.773 | DEBUG    | __main__:trials:24 - Trial = 2486/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.774 | DEBUG    | __main__:trials:29 - Trial = 2486/30000 | Total reward = 29.06
2022-01-26 14:16:35.778 | DEBUG    | __main__:trials:24 - Trial = 2487/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.779 | DEBUG    | __main__:trials:29 - Trial = 2487/30000 | Total reward = 45.63
2022-01-26 14:16:35.784 | DEBUG    | __main__:trials:24 - Trial = 2488/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.784 | DEBUG    | __main__:trials:29 - Trial = 2488/30000 | Total reward = 39.02
2022-01-26 14:16:35.789 | DEBUG    | __main__:trials:24 - Trial = 2489/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.790 | DEBUG    | __main__:trials:29 - Trial = 2489/30000 | Total reward = 41.41
2022-01-26 14:16:35.794 | DEBUG    | __main__:trials:24 - Trial = 2490/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.795 | DEBUG    | __main__:trials:29 - Trial = 2490/30000 | Total reward = 59.81
2022-01-26 14:16:35.798 | DEBUG    | __main__:trials:24 - Trial = 2491/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.798 | DEBUG    | __main__:trials:29 - Trial = 2491/30000 | Total reward = 43.12
2022-01-26 14:16:35.802 | DEBUG    | __main__:trials:24 - Trial = 2492/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.802 | DEBUG    | __main__:trials:29 - Trial = 2492/30000 | Total reward = 51.77
2022-01-26 14:16:35.806 | DEBUG    | __main__:trials:24 - Trial = 2493/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.807 | DEBUG    | __main__:trials:29 - Trial = 2493/30000 | Total reward = 45.31
2022-01-26 14:16:35.811 | DEBUG    | __main__:trials:24 - Trial = 2494/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.813 | DEBUG    | __main__:trials:29 - Trial = 2494/30000 | Total reward = 55.75
2022-01-26 14:16:35.816 | DEBUG    | __main__:trials:24 - Trial = 2495/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.817 | DEBUG    | __main__:trials:29 - Trial = 2495/30000 | Total reward = 49.93
2022-01-26 14:16:35.820 | DEBUG    | __main__:trials:24 - Trial = 2496/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.821 | DEBUG    | __main__:trials:29 - Trial = 2496/30000 | Total reward = 45.91
2022-01-26 14:16:35.825 | DEBUG    | __main__:trials:24 - Trial = 2497/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.825 | DEBUG    | __main__:trials:29 - Trial = 2497/30000 | Total reward = 44.10
2022-01-26 14:16:35.829 | DEBUG    | __main__:trials:24 - Trial = 2498/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.829 | DEBUG    | __main__:trials:29 - Trial = 2498/30000 | Total reward = 28.06
2022-01-26 14:16:35.835 | DEBUG    | __main__:trials:24 - Trial = 2499/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.836 | DEBUG    | __main__:trials:29 - Trial = 2499/30000 | Total reward = 51.70
2022-01-26 14:16:35.839 | DEBUG    | __main__:trials:24 - Trial = 2500/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.841 | DEBUG    | __main__:trials:29 - Trial = 2500/30000 | Total reward = 29.93
2022-01-26 14:16:35.845 | DEBUG    | __main__:trials:24 - Trial = 2501/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.846 | DEBUG    | __main__:trials:29 - Trial = 2501/30000 | Total reward = 51.47
2022-01-26 14:16:35.849 | DEBUG    | __main__:trials:24 - Trial = 2502/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.851 | DEBUG    | __main__:trials:29 - Trial = 2502/30000 | Total reward = 49.36
2022-01-26 14:16:35.855 | DEBUG    | __main__:trials:24 - Trial = 2503/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.857 | DEBUG    | __main__:trials:29 - Trial = 2503/30000 | Total reward = 56.44
2022-01-26 14:16:35.860 | DEBUG    | __main__:trials:24 - Trial = 2504/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.862 | DEBUG    | __main__:trials:29 - Trial = 2504/30000 | Total reward = 53.02
2022-01-26 14:16:35.866 | DEBUG    | __main__:trials:24 - Trial = 2505/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.867 | DEBUG    | __main__:trials:29 - Trial = 2505/30000 | Total reward = 35.15
2022-01-26 14:16:35.870 | DEBUG    | __main__:trials:24 - Trial = 2506/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.872 | DEBUG    | __main__:trials:29 - Trial = 2506/30000 | Total reward = 52.73
2022-01-26 14:16:35.876 | DEBUG    | __main__:trials:24 - Trial = 2507/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.877 | DEBUG    | __main__:trials:29 - Trial = 2507/30000 | Total reward = 49.00
2022-01-26 14:16:35.881 | DEBUG    | __main__:trials:24 - Trial = 2508/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.883 | DEBUG    | __main__:trials:29 - Trial = 2508/30000 | Total reward = 50.10
2022-01-26 14:16:35.887 | DEBUG    | __main__:trials:24 - Trial = 2509/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.888 | DEBUG    | __main__:trials:29 - Trial = 2509/30000 | Total reward = 26.36
2022-01-26 14:16:35.892 | DEBUG    | __main__:trials:24 - Trial = 2510/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.893 | DEBUG    | __main__:trials:29 - Trial = 2510/30000 | Total reward = 50.80
2022-01-26 14:16:35.897 | DEBUG    | __main__:trials:24 - Trial = 2511/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.897 | DEBUG    | __main__:trials:29 - Trial = 2511/30000 | Total reward = 55.09
2022-01-26 14:16:35.902 | DEBUG    | __main__:trials:24 - Trial = 2512/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.902 | DEBUG    | __main__:trials:29 - Trial = 2512/30000 | Total reward = 47.39
2022-01-26 14:16:35.906 | DEBUG    | __main__:trials:24 - Trial = 2513/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.908 | DEBUG    | __main__:trials:29 - Trial = 2513/30000 | Total reward = 45.63
2022-01-26 14:16:35.911 | DEBUG    | __main__:trials:24 - Trial = 2514/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.912 | DEBUG    | __main__:trials:29 - Trial = 2514/30000 | Total reward = 53.27
2022-01-26 14:16:35.916 | DEBUG    | __main__:trials:24 - Trial = 2515/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.917 | DEBUG    | __main__:trials:29 - Trial = 2515/30000 | Total reward = 48.29
2022-01-26 14:16:35.921 | DEBUG    | __main__:trials:24 - Trial = 2516/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.921 | DEBUG    | __main__:trials:29 - Trial = 2516/30000 | Total reward = 52.82
2022-01-26 14:16:35.925 | DEBUG    | __main__:trials:24 - Trial = 2517/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.926 | DEBUG    | __main__:trials:29 - Trial = 2517/30000 | Total reward = 45.91
2022-01-26 14:16:35.930 | DEBUG    | __main__:trials:24 - Trial = 2518/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.931 | DEBUG    | __main__:trials:29 - Trial = 2518/30000 | Total reward = 49.08
2022-01-26 14:16:35.935 | DEBUG    | __main__:trials:24 - Trial = 2519/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.936 | DEBUG    | __main__:trials:29 - Trial = 2519/30000 | Total reward = 57.08
2022-01-26 14:16:35.940 | DEBUG    | __main__:trials:24 - Trial = 2520/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.941 | DEBUG    | __main__:trials:29 - Trial = 2520/30000 | Total reward = 53.39
2022-01-26 14:16:35.945 | DEBUG    | __main__:trials:24 - Trial = 2521/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.946 | DEBUG    | __main__:trials:29 - Trial = 2521/30000 | Total reward = 50.46
2022-01-26 14:16:35.950 | DEBUG    | __main__:trials:24 - Trial = 2522/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.952 | DEBUG    | __main__:trials:29 - Trial = 2522/30000 | Total reward = 47.20
2022-01-26 14:16:35.954 | DEBUG    | __main__:trials:24 - Trial = 2523/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.956 | DEBUG    | __main__:trials:29 - Trial = 2523/30000 | Total reward = 49.24
2022-01-26 14:16:35.960 | DEBUG    | __main__:trials:24 - Trial = 2524/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.961 | DEBUG    | __main__:trials:29 - Trial = 2524/30000 | Total reward = 54.63
2022-01-26 14:16:35.965 | DEBUG    | __main__:trials:26 - Trial = 2525/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:35.966 | DEBUG    | __main__:trials:29 - Trial = 2525/30000 | Total reward = 32.89
2022-01-26 14:16:35.970 | DEBUG    | __main__:trials:24 - Trial = 2526/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.971 | DEBUG    | __main__:trials:29 - Trial = 2526/30000 | Total reward = 37.38
2022-01-26 14:16:35.975 | DEBUG    | __main__:trials:24 - Trial = 2527/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.976 | DEBUG    | __main__:trials:29 - Trial = 2527/30000 | Total reward = 50.72
2022-01-26 14:16:35.980 | DEBUG    | __main__:trials:24 - Trial = 2528/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.982 | DEBUG    | __main__:trials:29 - Trial = 2528/30000 | Total reward = 51.20
2022-01-26 14:16:35.985 | DEBUG    | __main__:trials:24 - Trial = 2529/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.987 | DEBUG    | __main__:trials:29 - Trial = 2529/30000 | Total reward = 53.02
2022-01-26 14:16:35.991 | DEBUG    | __main__:trials:24 - Trial = 2530/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.991 | DEBUG    | __main__:trials:29 - Trial = 2530/30000 | Total reward = 34.57
2022-01-26 14:16:35.996 | DEBUG    | __main__:trials:24 - Trial = 2531/30000 | Max number of steps (20) reached
2022-01-26 14:16:35.996 | DEBUG    | __main__:trials:29 - Trial = 2531/30000 | Total reward = 50.50
2022-01-26 14:16:36.000 | DEBUG    | __main__:trials:24 - Trial = 2532/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.001 | DEBUG    | __main__:trials:29 - Trial = 2532/30000 | Total reward = 52.57
2022-01-26 14:16:36.005 | DEBUG    | __main__:trials:24 - Trial = 2533/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.006 | DEBUG    | __main__:trials:29 - Trial = 2533/30000 | Total reward = 32.57
2022-01-26 14:16:36.009 | DEBUG    | __main__:trials:24 - Trial = 2534/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.010 | DEBUG    | __main__:trials:29 - Trial = 2534/30000 | Total reward = 47.91
2022-01-26 14:16:36.015 | DEBUG    | __main__:trials:24 - Trial = 2535/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.017 | DEBUG    | __main__:trials:29 - Trial = 2535/30000 | Total reward = 36.24
2022-01-26 14:16:36.020 | DEBUG    | __main__:trials:24 - Trial = 2536/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.022 | DEBUG    | __main__:trials:29 - Trial = 2536/30000 | Total reward = 50.59
2022-01-26 14:16:36.026 | DEBUG    | __main__:trials:24 - Trial = 2537/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.027 | DEBUG    | __main__:trials:29 - Trial = 2537/30000 | Total reward = 46.18
2022-01-26 14:16:36.030 | DEBUG    | __main__:trials:24 - Trial = 2538/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.032 | DEBUG    | __main__:trials:29 - Trial = 2538/30000 | Total reward = 61.92
2022-01-26 14:16:36.035 | DEBUG    | __main__:trials:24 - Trial = 2539/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.037 | DEBUG    | __main__:trials:29 - Trial = 2539/30000 | Total reward = 43.57
2022-01-26 14:16:36.040 | DEBUG    | __main__:trials:24 - Trial = 2540/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.042 | DEBUG    | __main__:trials:29 - Trial = 2540/30000 | Total reward = 43.78
2022-01-26 14:16:36.044 | DEBUG    | __main__:trials:24 - Trial = 2541/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.046 | DEBUG    | __main__:trials:29 - Trial = 2541/30000 | Total reward = 55.93
2022-01-26 14:16:36.050 | DEBUG    | __main__:trials:24 - Trial = 2542/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.051 | DEBUG    | __main__:trials:29 - Trial = 2542/30000 | Total reward = 53.21
2022-01-26 14:16:36.054 | DEBUG    | __main__:trials:24 - Trial = 2543/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.056 | DEBUG    | __main__:trials:29 - Trial = 2543/30000 | Total reward = 45.91
2022-01-26 14:16:36.060 | DEBUG    | __main__:trials:24 - Trial = 2544/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.062 | DEBUG    | __main__:trials:29 - Trial = 2544/30000 | Total reward = 50.33
2022-01-26 14:16:36.065 | DEBUG    | __main__:trials:24 - Trial = 2545/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.067 | DEBUG    | __main__:trials:29 - Trial = 2545/30000 | Total reward = 49.80
2022-01-26 14:16:36.071 | DEBUG    | __main__:trials:24 - Trial = 2546/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.072 | DEBUG    | __main__:trials:29 - Trial = 2546/30000 | Total reward = 38.16
2022-01-26 14:16:36.075 | DEBUG    | __main__:trials:24 - Trial = 2547/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.077 | DEBUG    | __main__:trials:29 - Trial = 2547/30000 | Total reward = 29.36
2022-01-26 14:16:36.081 | DEBUG    | __main__:trials:24 - Trial = 2548/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.082 | DEBUG    | __main__:trials:29 - Trial = 2548/30000 | Total reward = 50.36
2022-01-26 14:16:36.086 | DEBUG    | __main__:trials:24 - Trial = 2549/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.087 | DEBUG    | __main__:trials:29 - Trial = 2549/30000 | Total reward = 49.60
2022-01-26 14:16:36.090 | DEBUG    | __main__:trials:24 - Trial = 2550/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.098 | DEBUG    | __main__:trials:29 - Trial = 2550/30000 | Total reward = 40.41
2022-01-26 14:16:36.104 | DEBUG    | __main__:trials:24 - Trial = 2551/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.106 | DEBUG    | __main__:trials:29 - Trial = 2551/30000 | Total reward = 42.75
2022-01-26 14:16:36.110 | DEBUG    | __main__:trials:24 - Trial = 2552/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.111 | DEBUG    | __main__:trials:29 - Trial = 2552/30000 | Total reward = 48.87
2022-01-26 14:16:36.115 | DEBUG    | __main__:trials:24 - Trial = 2553/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.117 | DEBUG    | __main__:trials:29 - Trial = 2553/30000 | Total reward = 48.88
2022-01-26 14:16:36.122 | DEBUG    | __main__:trials:24 - Trial = 2554/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.123 | DEBUG    | __main__:trials:29 - Trial = 2554/30000 | Total reward = 46.84
2022-01-26 14:16:36.127 | DEBUG    | __main__:trials:26 - Trial = 2555/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.128 | DEBUG    | __main__:trials:29 - Trial = 2555/30000 | Total reward = 21.49
2022-01-26 14:16:36.133 | DEBUG    | __main__:trials:24 - Trial = 2556/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.135 | DEBUG    | __main__:trials:29 - Trial = 2556/30000 | Total reward = 48.20
2022-01-26 14:16:36.138 | DEBUG    | __main__:trials:24 - Trial = 2557/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.140 | DEBUG    | __main__:trials:29 - Trial = 2557/30000 | Total reward = 44.99
2022-01-26 14:16:36.143 | DEBUG    | __main__:trials:24 - Trial = 2558/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.146 | DEBUG    | __main__:trials:29 - Trial = 2558/30000 | Total reward = 42.81
2022-01-26 14:16:36.150 | DEBUG    | __main__:trials:24 - Trial = 2559/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.151 | DEBUG    | __main__:trials:29 - Trial = 2559/30000 | Total reward = 45.14
2022-01-26 14:16:36.155 | DEBUG    | __main__:trials:24 - Trial = 2560/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.157 | DEBUG    | __main__:trials:29 - Trial = 2560/30000 | Total reward = 55.69
2022-01-26 14:16:36.160 | DEBUG    | __main__:trials:24 - Trial = 2561/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.162 | DEBUG    | __main__:trials:29 - Trial = 2561/30000 | Total reward = 53.27
2022-01-26 14:16:36.166 | DEBUG    | __main__:trials:24 - Trial = 2562/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.167 | DEBUG    | __main__:trials:29 - Trial = 2562/30000 | Total reward = 36.71
2022-01-26 14:16:36.171 | DEBUG    | __main__:trials:24 - Trial = 2563/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.173 | DEBUG    | __main__:trials:29 - Trial = 2563/30000 | Total reward = 56.08
2022-01-26 14:16:36.177 | DEBUG    | __main__:trials:24 - Trial = 2564/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.179 | DEBUG    | __main__:trials:29 - Trial = 2564/30000 | Total reward = 52.53
2022-01-26 14:16:36.182 | DEBUG    | __main__:trials:24 - Trial = 2565/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.184 | DEBUG    | __main__:trials:29 - Trial = 2565/30000 | Total reward = 53.07
2022-01-26 14:16:36.187 | DEBUG    | __main__:trials:24 - Trial = 2566/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.189 | DEBUG    | __main__:trials:29 - Trial = 2566/30000 | Total reward = 53.92
2022-01-26 14:16:36.193 | DEBUG    | __main__:trials:24 - Trial = 2567/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.195 | DEBUG    | __main__:trials:29 - Trial = 2567/30000 | Total reward = 50.92
2022-01-26 14:16:36.198 | DEBUG    | __main__:trials:24 - Trial = 2568/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.200 | DEBUG    | __main__:trials:29 - Trial = 2568/30000 | Total reward = 43.88
2022-01-26 14:16:36.203 | DEBUG    | __main__:trials:24 - Trial = 2569/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.205 | DEBUG    | __main__:trials:29 - Trial = 2569/30000 | Total reward = 44.89
2022-01-26 14:16:36.210 | DEBUG    | __main__:trials:24 - Trial = 2570/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.211 | DEBUG    | __main__:trials:29 - Trial = 2570/30000 | Total reward = 47.90
2022-01-26 14:16:36.215 | DEBUG    | __main__:trials:24 - Trial = 2571/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.216 | DEBUG    | __main__:trials:29 - Trial = 2571/30000 | Total reward = 48.24
2022-01-26 14:16:36.219 | DEBUG    | __main__:trials:24 - Trial = 2572/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.223 | DEBUG    | __main__:trials:29 - Trial = 2572/30000 | Total reward = 49.29
2022-01-26 14:16:36.227 | DEBUG    | __main__:trials:24 - Trial = 2573/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.229 | DEBUG    | __main__:trials:29 - Trial = 2573/30000 | Total reward = 47.81
2022-01-26 14:16:36.232 | DEBUG    | __main__:trials:24 - Trial = 2574/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.233 | DEBUG    | __main__:trials:29 - Trial = 2574/30000 | Total reward = 52.83
2022-01-26 14:16:36.237 | DEBUG    | __main__:trials:24 - Trial = 2575/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.238 | DEBUG    | __main__:trials:29 - Trial = 2575/30000 | Total reward = 50.84
2022-01-26 14:16:36.242 | DEBUG    | __main__:trials:24 - Trial = 2576/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.243 | DEBUG    | __main__:trials:29 - Trial = 2576/30000 | Total reward = 55.05
2022-01-26 14:16:36.247 | DEBUG    | __main__:trials:24 - Trial = 2577/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.248 | DEBUG    | __main__:trials:29 - Trial = 2577/30000 | Total reward = 52.09
2022-01-26 14:16:36.251 | DEBUG    | __main__:trials:24 - Trial = 2578/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.253 | DEBUG    | __main__:trials:29 - Trial = 2578/30000 | Total reward = 50.92
2022-01-26 14:16:36.257 | DEBUG    | __main__:trials:24 - Trial = 2579/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.259 | DEBUG    | __main__:trials:29 - Trial = 2579/30000 | Total reward = 47.14
2022-01-26 14:16:36.262 | DEBUG    | __main__:trials:24 - Trial = 2580/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.264 | DEBUG    | __main__:trials:29 - Trial = 2580/30000 | Total reward = 56.17
2022-01-26 14:16:36.268 | DEBUG    | __main__:trials:24 - Trial = 2581/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.268 | DEBUG    | __main__:trials:29 - Trial = 2581/30000 | Total reward = 53.27
2022-01-26 14:16:36.272 | DEBUG    | __main__:trials:26 - Trial = 2582/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.273 | DEBUG    | __main__:trials:29 - Trial = 2582/30000 | Total reward = 19.38
2022-01-26 14:16:36.276 | DEBUG    | __main__:trials:26 - Trial = 2583/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.278 | DEBUG    | __main__:trials:29 - Trial = 2583/30000 | Total reward = 27.31
2022-01-26 14:16:36.280 | DEBUG    | __main__:trials:26 - Trial = 2584/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.284 | DEBUG    | __main__:trials:29 - Trial = 2584/30000 | Total reward = 16.54
2022-01-26 14:16:36.288 | DEBUG    | __main__:trials:24 - Trial = 2585/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.290 | DEBUG    | __main__:trials:29 - Trial = 2585/30000 | Total reward = 44.28
2022-01-26 14:16:36.294 | DEBUG    | __main__:trials:24 - Trial = 2586/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.295 | DEBUG    | __main__:trials:29 - Trial = 2586/30000 | Total reward = 50.34
2022-01-26 14:16:36.299 | DEBUG    | __main__:trials:24 - Trial = 2587/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.301 | DEBUG    | __main__:trials:29 - Trial = 2587/30000 | Total reward = 48.33
2022-01-26 14:16:36.304 | DEBUG    | __main__:trials:24 - Trial = 2588/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.306 | DEBUG    | __main__:trials:29 - Trial = 2588/30000 | Total reward = 56.02
2022-01-26 14:16:36.310 | DEBUG    | __main__:trials:24 - Trial = 2589/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.312 | DEBUG    | __main__:trials:29 - Trial = 2589/30000 | Total reward = 63.71
2022-01-26 14:16:36.315 | DEBUG    | __main__:trials:24 - Trial = 2590/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.317 | DEBUG    | __main__:trials:29 - Trial = 2590/30000 | Total reward = 40.62
2022-01-26 14:16:36.321 | DEBUG    | __main__:trials:24 - Trial = 2591/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.327 | DEBUG    | __main__:trials:29 - Trial = 2591/30000 | Total reward = 49.96
2022-01-26 14:16:36.331 | DEBUG    | __main__:trials:24 - Trial = 2592/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.333 | DEBUG    | __main__:trials:29 - Trial = 2592/30000 | Total reward = 63.83
2022-01-26 14:16:36.337 | DEBUG    | __main__:trials:24 - Trial = 2593/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.338 | DEBUG    | __main__:trials:29 - Trial = 2593/30000 | Total reward = 53.86
2022-01-26 14:16:36.341 | DEBUG    | __main__:trials:24 - Trial = 2594/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.342 | DEBUG    | __main__:trials:29 - Trial = 2594/30000 | Total reward = 48.65
2022-01-26 14:16:36.345 | DEBUG    | __main__:trials:24 - Trial = 2595/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.347 | DEBUG    | __main__:trials:29 - Trial = 2595/30000 | Total reward = 52.31
2022-01-26 14:16:36.351 | DEBUG    | __main__:trials:24 - Trial = 2596/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.352 | DEBUG    | __main__:trials:29 - Trial = 2596/30000 | Total reward = 55.60
2022-01-26 14:16:36.356 | DEBUG    | __main__:trials:24 - Trial = 2597/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.357 | DEBUG    | __main__:trials:29 - Trial = 2597/30000 | Total reward = 69.24
2022-01-26 14:16:36.360 | DEBUG    | __main__:trials:24 - Trial = 2598/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.362 | DEBUG    | __main__:trials:29 - Trial = 2598/30000 | Total reward = 50.95
2022-01-26 14:16:36.366 | DEBUG    | __main__:trials:24 - Trial = 2599/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.367 | DEBUG    | __main__:trials:29 - Trial = 2599/30000 | Total reward = 49.43
2022-01-26 14:16:36.371 | DEBUG    | __main__:trials:24 - Trial = 2600/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.372 | DEBUG    | __main__:trials:29 - Trial = 2600/30000 | Total reward = 57.97
2022-01-26 14:16:36.376 | DEBUG    | __main__:trials:24 - Trial = 2601/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.378 | DEBUG    | __main__:trials:29 - Trial = 2601/30000 | Total reward = 61.74
2022-01-26 14:16:36.381 | DEBUG    | __main__:trials:26 - Trial = 2602/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.382 | DEBUG    | __main__:trials:29 - Trial = 2602/30000 | Total reward = 21.17
2022-01-26 14:16:36.388 | DEBUG    | __main__:trials:24 - Trial = 2603/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.390 | DEBUG    | __main__:trials:29 - Trial = 2603/30000 | Total reward = 50.36
2022-01-26 14:16:36.393 | DEBUG    | __main__:trials:24 - Trial = 2604/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.395 | DEBUG    | __main__:trials:29 - Trial = 2604/30000 | Total reward = 46.73
2022-01-26 14:16:36.399 | DEBUG    | __main__:trials:24 - Trial = 2605/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.400 | DEBUG    | __main__:trials:29 - Trial = 2605/30000 | Total reward = 43.65
2022-01-26 14:16:36.403 | DEBUG    | __main__:trials:24 - Trial = 2606/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.406 | DEBUG    | __main__:trials:29 - Trial = 2606/30000 | Total reward = 55.31
2022-01-26 14:16:36.409 | DEBUG    | __main__:trials:24 - Trial = 2607/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.411 | DEBUG    | __main__:trials:29 - Trial = 2607/30000 | Total reward = 50.63
2022-01-26 14:16:36.415 | DEBUG    | __main__:trials:24 - Trial = 2608/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.416 | DEBUG    | __main__:trials:29 - Trial = 2608/30000 | Total reward = 51.82
2022-01-26 14:16:36.420 | DEBUG    | __main__:trials:24 - Trial = 2609/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.422 | DEBUG    | __main__:trials:29 - Trial = 2609/30000 | Total reward = 53.27
2022-01-26 14:16:36.426 | DEBUG    | __main__:trials:24 - Trial = 2610/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.427 | DEBUG    | __main__:trials:29 - Trial = 2610/30000 | Total reward = 47.11
2022-01-26 14:16:36.431 | DEBUG    | __main__:trials:24 - Trial = 2611/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.433 | DEBUG    | __main__:trials:29 - Trial = 2611/30000 | Total reward = 48.90
2022-01-26 14:16:36.436 | DEBUG    | __main__:trials:24 - Trial = 2612/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.438 | DEBUG    | __main__:trials:29 - Trial = 2612/30000 | Total reward = 54.98
2022-01-26 14:16:36.441 | DEBUG    | __main__:trials:26 - Trial = 2613/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.443 | DEBUG    | __main__:trials:29 - Trial = 2613/30000 | Total reward = 21.25
2022-01-26 14:16:36.447 | DEBUG    | __main__:trials:24 - Trial = 2614/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.448 | DEBUG    | __main__:trials:29 - Trial = 2614/30000 | Total reward = 53.68
2022-01-26 14:16:36.452 | DEBUG    | __main__:trials:24 - Trial = 2615/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.454 | DEBUG    | __main__:trials:29 - Trial = 2615/30000 | Total reward = 39.11
2022-01-26 14:16:36.457 | DEBUG    | __main__:trials:24 - Trial = 2616/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.458 | DEBUG    | __main__:trials:29 - Trial = 2616/30000 | Total reward = 34.05
2022-01-26 14:16:36.462 | DEBUG    | __main__:trials:24 - Trial = 2617/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.463 | DEBUG    | __main__:trials:29 - Trial = 2617/30000 | Total reward = 49.13
2022-01-26 14:16:36.467 | DEBUG    | __main__:trials:26 - Trial = 2618/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.468 | DEBUG    | __main__:trials:29 - Trial = 2618/30000 | Total reward = 38.65
2022-01-26 14:16:36.472 | DEBUG    | __main__:trials:24 - Trial = 2619/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.472 | DEBUG    | __main__:trials:29 - Trial = 2619/30000 | Total reward = 40.75
2022-01-26 14:16:36.477 | DEBUG    | __main__:trials:24 - Trial = 2620/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.477 | DEBUG    | __main__:trials:29 - Trial = 2620/30000 | Total reward = 53.27
2022-01-26 14:16:36.480 | DEBUG    | __main__:trials:24 - Trial = 2621/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.481 | DEBUG    | __main__:trials:29 - Trial = 2621/30000 | Total reward = 54.60
2022-01-26 14:16:36.484 | DEBUG    | __main__:trials:24 - Trial = 2622/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.485 | DEBUG    | __main__:trials:29 - Trial = 2622/30000 | Total reward = 42.79
2022-01-26 14:16:36.489 | DEBUG    | __main__:trials:24 - Trial = 2623/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.490 | DEBUG    | __main__:trials:29 - Trial = 2623/30000 | Total reward = 48.81
2022-01-26 14:16:36.494 | DEBUG    | __main__:trials:24 - Trial = 2624/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.496 | DEBUG    | __main__:trials:29 - Trial = 2624/30000 | Total reward = 51.43
2022-01-26 14:16:36.499 | DEBUG    | __main__:trials:24 - Trial = 2625/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.501 | DEBUG    | __main__:trials:29 - Trial = 2625/30000 | Total reward = 53.27
2022-01-26 14:16:36.504 | DEBUG    | __main__:trials:24 - Trial = 2626/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.506 | DEBUG    | __main__:trials:29 - Trial = 2626/30000 | Total reward = 40.95
2022-01-26 14:16:36.509 | DEBUG    | __main__:trials:24 - Trial = 2627/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.511 | DEBUG    | __main__:trials:29 - Trial = 2627/30000 | Total reward = 26.02
2022-01-26 14:16:36.515 | DEBUG    | __main__:trials:24 - Trial = 2628/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.517 | DEBUG    | __main__:trials:29 - Trial = 2628/30000 | Total reward = 52.13
2022-01-26 14:16:36.520 | DEBUG    | __main__:trials:24 - Trial = 2629/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.522 | DEBUG    | __main__:trials:29 - Trial = 2629/30000 | Total reward = 45.41
2022-01-26 14:16:36.526 | DEBUG    | __main__:trials:24 - Trial = 2630/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.527 | DEBUG    | __main__:trials:29 - Trial = 2630/30000 | Total reward = 42.22
2022-01-26 14:16:36.531 | DEBUG    | __main__:trials:24 - Trial = 2631/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.532 | DEBUG    | __main__:trials:29 - Trial = 2631/30000 | Total reward = 53.17
2022-01-26 14:16:36.536 | DEBUG    | __main__:trials:24 - Trial = 2632/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.537 | DEBUG    | __main__:trials:29 - Trial = 2632/30000 | Total reward = 57.54
2022-01-26 14:16:36.541 | DEBUG    | __main__:trials:24 - Trial = 2633/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.543 | DEBUG    | __main__:trials:29 - Trial = 2633/30000 | Total reward = 29.62
2022-01-26 14:16:36.546 | DEBUG    | __main__:trials:24 - Trial = 2634/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.548 | DEBUG    | __main__:trials:29 - Trial = 2634/30000 | Total reward = 51.07
2022-01-26 14:16:36.552 | DEBUG    | __main__:trials:24 - Trial = 2635/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.554 | DEBUG    | __main__:trials:29 - Trial = 2635/30000 | Total reward = 67.59
2022-01-26 14:16:36.558 | DEBUG    | __main__:trials:24 - Trial = 2636/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.560 | DEBUG    | __main__:trials:29 - Trial = 2636/30000 | Total reward = 50.79
2022-01-26 14:16:36.563 | DEBUG    | __main__:trials:26 - Trial = 2637/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.570 | DEBUG    | __main__:trials:29 - Trial = 2637/30000 | Total reward = 30.08
2022-01-26 14:16:36.576 | DEBUG    | __main__:trials:24 - Trial = 2638/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.576 | DEBUG    | __main__:trials:29 - Trial = 2638/30000 | Total reward = 56.05
2022-01-26 14:16:36.580 | DEBUG    | __main__:trials:26 - Trial = 2639/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.581 | DEBUG    | __main__:trials:29 - Trial = 2639/30000 | Total reward = 17.09
2022-01-26 14:16:36.585 | DEBUG    | __main__:trials:24 - Trial = 2640/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.586 | DEBUG    | __main__:trials:29 - Trial = 2640/30000 | Total reward = 46.96
2022-01-26 14:16:36.589 | DEBUG    | __main__:trials:24 - Trial = 2641/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.590 | DEBUG    | __main__:trials:29 - Trial = 2641/30000 | Total reward = 53.27
2022-01-26 14:16:36.593 | DEBUG    | __main__:trials:24 - Trial = 2642/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.595 | DEBUG    | __main__:trials:29 - Trial = 2642/30000 | Total reward = 24.60
2022-01-26 14:16:36.599 | DEBUG    | __main__:trials:24 - Trial = 2643/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.600 | DEBUG    | __main__:trials:29 - Trial = 2643/30000 | Total reward = 53.27
2022-01-26 14:16:36.604 | DEBUG    | __main__:trials:26 - Trial = 2644/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.605 | DEBUG    | __main__:trials:29 - Trial = 2644/30000 | Total reward = 30.96
2022-01-26 14:16:36.609 | DEBUG    | __main__:trials:24 - Trial = 2645/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.610 | DEBUG    | __main__:trials:29 - Trial = 2645/30000 | Total reward = 50.77
2022-01-26 14:16:36.613 | DEBUG    | __main__:trials:24 - Trial = 2646/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.615 | DEBUG    | __main__:trials:29 - Trial = 2646/30000 | Total reward = 46.66
2022-01-26 14:16:36.619 | DEBUG    | __main__:trials:24 - Trial = 2647/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.620 | DEBUG    | __main__:trials:29 - Trial = 2647/30000 | Total reward = 41.28
2022-01-26 14:16:36.623 | DEBUG    | __main__:trials:24 - Trial = 2648/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.625 | DEBUG    | __main__:trials:29 - Trial = 2648/30000 | Total reward = 52.47
2022-01-26 14:16:36.630 | DEBUG    | __main__:trials:24 - Trial = 2649/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.635 | DEBUG    | __main__:trials:29 - Trial = 2649/30000 | Total reward = 34.52
2022-01-26 14:16:36.638 | DEBUG    | __main__:trials:24 - Trial = 2650/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.641 | DEBUG    | __main__:trials:29 - Trial = 2650/30000 | Total reward = 53.22
2022-01-26 14:16:36.644 | DEBUG    | __main__:trials:24 - Trial = 2651/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.646 | DEBUG    | __main__:trials:29 - Trial = 2651/30000 | Total reward = 50.10
2022-01-26 14:16:36.649 | DEBUG    | __main__:trials:24 - Trial = 2652/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.651 | DEBUG    | __main__:trials:29 - Trial = 2652/30000 | Total reward = 53.53
2022-01-26 14:16:36.655 | DEBUG    | __main__:trials:24 - Trial = 2653/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.656 | DEBUG    | __main__:trials:29 - Trial = 2653/30000 | Total reward = 50.71
2022-01-26 14:16:36.659 | DEBUG    | __main__:trials:24 - Trial = 2654/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.661 | DEBUG    | __main__:trials:29 - Trial = 2654/30000 | Total reward = 45.75
2022-01-26 14:16:36.665 | DEBUG    | __main__:trials:24 - Trial = 2655/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.666 | DEBUG    | __main__:trials:29 - Trial = 2655/30000 | Total reward = 53.67
2022-01-26 14:16:36.669 | DEBUG    | __main__:trials:24 - Trial = 2656/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.670 | DEBUG    | __main__:trials:29 - Trial = 2656/30000 | Total reward = 30.78
2022-01-26 14:16:36.674 | DEBUG    | __main__:trials:24 - Trial = 2657/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.675 | DEBUG    | __main__:trials:29 - Trial = 2657/30000 | Total reward = 55.03
2022-01-26 14:16:36.679 | DEBUG    | __main__:trials:24 - Trial = 2658/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.679 | DEBUG    | __main__:trials:29 - Trial = 2658/30000 | Total reward = 37.30
2022-01-26 14:16:36.683 | DEBUG    | __main__:trials:24 - Trial = 2659/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.684 | DEBUG    | __main__:trials:29 - Trial = 2659/30000 | Total reward = 26.54
2022-01-26 14:16:36.688 | DEBUG    | __main__:trials:24 - Trial = 2660/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.690 | DEBUG    | __main__:trials:29 - Trial = 2660/30000 | Total reward = 39.30
2022-01-26 14:16:36.693 | DEBUG    | __main__:trials:24 - Trial = 2661/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.694 | DEBUG    | __main__:trials:29 - Trial = 2661/30000 | Total reward = 27.62
2022-01-26 14:16:36.698 | DEBUG    | __main__:trials:24 - Trial = 2662/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.700 | DEBUG    | __main__:trials:29 - Trial = 2662/30000 | Total reward = 41.65
2022-01-26 14:16:36.703 | DEBUG    | __main__:trials:24 - Trial = 2663/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.705 | DEBUG    | __main__:trials:29 - Trial = 2663/30000 | Total reward = 48.66
2022-01-26 14:16:36.709 | DEBUG    | __main__:trials:24 - Trial = 2664/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.709 | DEBUG    | __main__:trials:29 - Trial = 2664/30000 | Total reward = 49.16
2022-01-26 14:16:36.714 | DEBUG    | __main__:trials:24 - Trial = 2665/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.716 | DEBUG    | __main__:trials:29 - Trial = 2665/30000 | Total reward = 49.01
2022-01-26 14:16:36.720 | DEBUG    | __main__:trials:24 - Trial = 2666/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.721 | DEBUG    | __main__:trials:29 - Trial = 2666/30000 | Total reward = 43.59
2022-01-26 14:16:36.725 | DEBUG    | __main__:trials:24 - Trial = 2667/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.727 | DEBUG    | __main__:trials:29 - Trial = 2667/30000 | Total reward = 39.74
2022-01-26 14:16:36.731 | DEBUG    | __main__:trials:24 - Trial = 2668/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.733 | DEBUG    | __main__:trials:29 - Trial = 2668/30000 | Total reward = 47.47
2022-01-26 14:16:36.737 | DEBUG    | __main__:trials:24 - Trial = 2669/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.738 | DEBUG    | __main__:trials:29 - Trial = 2669/30000 | Total reward = 53.71
2022-01-26 14:16:36.742 | DEBUG    | __main__:trials:24 - Trial = 2670/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.743 | DEBUG    | __main__:trials:29 - Trial = 2670/30000 | Total reward = 47.88
2022-01-26 14:16:36.747 | DEBUG    | __main__:trials:24 - Trial = 2671/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.749 | DEBUG    | __main__:trials:29 - Trial = 2671/30000 | Total reward = 52.69
2022-01-26 14:16:36.752 | DEBUG    | __main__:trials:24 - Trial = 2672/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.755 | DEBUG    | __main__:trials:29 - Trial = 2672/30000 | Total reward = 46.69
2022-01-26 14:16:36.758 | DEBUG    | __main__:trials:24 - Trial = 2673/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.760 | DEBUG    | __main__:trials:29 - Trial = 2673/30000 | Total reward = 56.18
2022-01-26 14:16:36.764 | DEBUG    | __main__:trials:24 - Trial = 2674/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.766 | DEBUG    | __main__:trials:29 - Trial = 2674/30000 | Total reward = 33.11
2022-01-26 14:16:36.770 | DEBUG    | __main__:trials:24 - Trial = 2675/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.772 | DEBUG    | __main__:trials:29 - Trial = 2675/30000 | Total reward = 51.75
2022-01-26 14:16:36.776 | DEBUG    | __main__:trials:24 - Trial = 2676/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.777 | DEBUG    | __main__:trials:29 - Trial = 2676/30000 | Total reward = 44.67
2022-01-26 14:16:36.781 | DEBUG    | __main__:trials:24 - Trial = 2677/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.783 | DEBUG    | __main__:trials:29 - Trial = 2677/30000 | Total reward = 50.73
2022-01-26 14:16:36.787 | DEBUG    | __main__:trials:24 - Trial = 2678/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.788 | DEBUG    | __main__:trials:29 - Trial = 2678/30000 | Total reward = 49.59
2022-01-26 14:16:36.792 | DEBUG    | __main__:trials:24 - Trial = 2679/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.793 | DEBUG    | __main__:trials:29 - Trial = 2679/30000 | Total reward = 49.35
2022-01-26 14:16:36.796 | DEBUG    | __main__:trials:24 - Trial = 2680/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.798 | DEBUG    | __main__:trials:29 - Trial = 2680/30000 | Total reward = 50.00
2022-01-26 14:16:36.802 | DEBUG    | __main__:trials:24 - Trial = 2681/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.803 | DEBUG    | __main__:trials:29 - Trial = 2681/30000 | Total reward = 55.22
2022-01-26 14:16:36.807 | DEBUG    | __main__:trials:26 - Trial = 2682/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.809 | DEBUG    | __main__:trials:29 - Trial = 2682/30000 | Total reward = 28.69
2022-01-26 14:16:36.813 | DEBUG    | __main__:trials:24 - Trial = 2683/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.814 | DEBUG    | __main__:trials:29 - Trial = 2683/30000 | Total reward = 47.89
2022-01-26 14:16:36.817 | DEBUG    | __main__:trials:24 - Trial = 2684/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.818 | DEBUG    | __main__:trials:29 - Trial = 2684/30000 | Total reward = 51.77
2022-01-26 14:16:36.822 | DEBUG    | __main__:trials:24 - Trial = 2685/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.824 | DEBUG    | __main__:trials:29 - Trial = 2685/30000 | Total reward = 43.18
2022-01-26 14:16:36.829 | DEBUG    | __main__:trials:24 - Trial = 2686/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.835 | DEBUG    | __main__:trials:29 - Trial = 2686/30000 | Total reward = 60.28
2022-01-26 14:16:36.838 | DEBUG    | __main__:trials:24 - Trial = 2687/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.839 | DEBUG    | __main__:trials:29 - Trial = 2687/30000 | Total reward = 50.95
2022-01-26 14:16:36.842 | DEBUG    | __main__:trials:24 - Trial = 2688/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.846 | DEBUG    | __main__:trials:29 - Trial = 2688/30000 | Total reward = 42.82
2022-01-26 14:16:36.849 | DEBUG    | __main__:trials:24 - Trial = 2689/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.850 | DEBUG    | __main__:trials:29 - Trial = 2689/30000 | Total reward = 54.75
2022-01-26 14:16:36.854 | DEBUG    | __main__:trials:24 - Trial = 2690/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.855 | DEBUG    | __main__:trials:29 - Trial = 2690/30000 | Total reward = 52.35
2022-01-26 14:16:36.857 | DEBUG    | __main__:trials:26 - Trial = 2691/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.859 | DEBUG    | __main__:trials:29 - Trial = 2691/30000 | Total reward = 21.02
2022-01-26 14:16:36.863 | DEBUG    | __main__:trials:24 - Trial = 2692/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.864 | DEBUG    | __main__:trials:29 - Trial = 2692/30000 | Total reward = 49.41
2022-01-26 14:16:36.868 | DEBUG    | __main__:trials:24 - Trial = 2693/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.869 | DEBUG    | __main__:trials:29 - Trial = 2693/30000 | Total reward = 53.27
2022-01-26 14:16:36.873 | DEBUG    | __main__:trials:24 - Trial = 2694/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.875 | DEBUG    | __main__:trials:29 - Trial = 2694/30000 | Total reward = 49.06
2022-01-26 14:16:36.878 | DEBUG    | __main__:trials:24 - Trial = 2695/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.880 | DEBUG    | __main__:trials:29 - Trial = 2695/30000 | Total reward = 48.05
2022-01-26 14:16:36.884 | DEBUG    | __main__:trials:24 - Trial = 2696/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.885 | DEBUG    | __main__:trials:29 - Trial = 2696/30000 | Total reward = 54.01
2022-01-26 14:16:36.889 | DEBUG    | __main__:trials:24 - Trial = 2697/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.890 | DEBUG    | __main__:trials:29 - Trial = 2697/30000 | Total reward = 49.78
2022-01-26 14:16:36.893 | DEBUG    | __main__:trials:24 - Trial = 2698/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.894 | DEBUG    | __main__:trials:29 - Trial = 2698/30000 | Total reward = 51.00
2022-01-26 14:16:36.897 | DEBUG    | __main__:trials:24 - Trial = 2699/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.898 | DEBUG    | __main__:trials:29 - Trial = 2699/30000 | Total reward = 50.24
2022-01-26 14:16:36.901 | DEBUG    | __main__:trials:24 - Trial = 2700/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.902 | DEBUG    | __main__:trials:29 - Trial = 2700/30000 | Total reward = 57.40
2022-01-26 14:16:36.906 | DEBUG    | __main__:trials:24 - Trial = 2701/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.906 | DEBUG    | __main__:trials:29 - Trial = 2701/30000 | Total reward = 50.74
2022-01-26 14:16:36.910 | DEBUG    | __main__:trials:24 - Trial = 2702/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.911 | DEBUG    | __main__:trials:29 - Trial = 2702/30000 | Total reward = 63.48
2022-01-26 14:16:36.914 | DEBUG    | __main__:trials:24 - Trial = 2703/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.916 | DEBUG    | __main__:trials:29 - Trial = 2703/30000 | Total reward = 52.18
2022-01-26 14:16:36.919 | DEBUG    | __main__:trials:24 - Trial = 2704/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.921 | DEBUG    | __main__:trials:29 - Trial = 2704/30000 | Total reward = 40.09
2022-01-26 14:16:36.925 | DEBUG    | __main__:trials:24 - Trial = 2705/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.925 | DEBUG    | __main__:trials:29 - Trial = 2705/30000 | Total reward = 48.14
2022-01-26 14:16:36.929 | DEBUG    | __main__:trials:24 - Trial = 2706/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.930 | DEBUG    | __main__:trials:29 - Trial = 2706/30000 | Total reward = 51.37
2022-01-26 14:16:36.933 | DEBUG    | __main__:trials:24 - Trial = 2707/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.934 | DEBUG    | __main__:trials:29 - Trial = 2707/30000 | Total reward = 54.76
2022-01-26 14:16:36.938 | DEBUG    | __main__:trials:24 - Trial = 2708/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.940 | DEBUG    | __main__:trials:29 - Trial = 2708/30000 | Total reward = 53.27
2022-01-26 14:16:36.944 | DEBUG    | __main__:trials:24 - Trial = 2709/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.945 | DEBUG    | __main__:trials:29 - Trial = 2709/30000 | Total reward = 30.05
2022-01-26 14:16:36.949 | DEBUG    | __main__:trials:24 - Trial = 2710/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.951 | DEBUG    | __main__:trials:29 - Trial = 2710/30000 | Total reward = 48.99
2022-01-26 14:16:36.954 | DEBUG    | __main__:trials:24 - Trial = 2711/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.956 | DEBUG    | __main__:trials:29 - Trial = 2711/30000 | Total reward = 55.26
2022-01-26 14:16:36.960 | DEBUG    | __main__:trials:24 - Trial = 2712/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.960 | DEBUG    | __main__:trials:29 - Trial = 2712/30000 | Total reward = 49.76
2022-01-26 14:16:36.964 | DEBUG    | __main__:trials:24 - Trial = 2713/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.965 | DEBUG    | __main__:trials:29 - Trial = 2713/30000 | Total reward = 48.42
2022-01-26 14:16:36.969 | DEBUG    | __main__:trials:24 - Trial = 2714/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.970 | DEBUG    | __main__:trials:29 - Trial = 2714/30000 | Total reward = 43.43
2022-01-26 14:16:36.974 | DEBUG    | __main__:trials:24 - Trial = 2715/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.974 | DEBUG    | __main__:trials:29 - Trial = 2715/30000 | Total reward = 38.74
2022-01-26 14:16:36.979 | DEBUG    | __main__:trials:24 - Trial = 2716/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.980 | DEBUG    | __main__:trials:29 - Trial = 2716/30000 | Total reward = 37.93
2022-01-26 14:16:36.983 | DEBUG    | __main__:trials:26 - Trial = 2717/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:36.985 | DEBUG    | __main__:trials:29 - Trial = 2717/30000 | Total reward = 33.90
2022-01-26 14:16:36.989 | DEBUG    | __main__:trials:24 - Trial = 2718/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.990 | DEBUG    | __main__:trials:29 - Trial = 2718/30000 | Total reward = 50.12
2022-01-26 14:16:36.994 | DEBUG    | __main__:trials:24 - Trial = 2719/30000 | Max number of steps (20) reached
2022-01-26 14:16:36.995 | DEBUG    | __main__:trials:29 - Trial = 2719/30000 | Total reward = 51.64
2022-01-26 14:16:36.998 | DEBUG    | __main__:trials:24 - Trial = 2720/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.000 | DEBUG    | __main__:trials:29 - Trial = 2720/30000 | Total reward = 33.54
2022-01-26 14:16:37.003 | DEBUG    | __main__:trials:24 - Trial = 2721/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.005 | DEBUG    | __main__:trials:29 - Trial = 2721/30000 | Total reward = 47.90
2022-01-26 14:16:37.009 | DEBUG    | __main__:trials:24 - Trial = 2722/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.011 | DEBUG    | __main__:trials:29 - Trial = 2722/30000 | Total reward = 39.56
2022-01-26 14:16:37.015 | DEBUG    | __main__:trials:24 - Trial = 2723/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.017 | DEBUG    | __main__:trials:29 - Trial = 2723/30000 | Total reward = 54.89
2022-01-26 14:16:37.020 | DEBUG    | __main__:trials:26 - Trial = 2724/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.021 | DEBUG    | __main__:trials:29 - Trial = 2724/30000 | Total reward = 14.92
2022-01-26 14:16:37.025 | DEBUG    | __main__:trials:24 - Trial = 2725/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.027 | DEBUG    | __main__:trials:29 - Trial = 2725/30000 | Total reward = 53.27
2022-01-26 14:16:37.031 | DEBUG    | __main__:trials:24 - Trial = 2726/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.032 | DEBUG    | __main__:trials:29 - Trial = 2726/30000 | Total reward = 47.70
2022-01-26 14:16:37.036 | DEBUG    | __main__:trials:24 - Trial = 2727/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.037 | DEBUG    | __main__:trials:29 - Trial = 2727/30000 | Total reward = 44.13
2022-01-26 14:16:37.041 | DEBUG    | __main__:trials:24 - Trial = 2728/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.042 | DEBUG    | __main__:trials:29 - Trial = 2728/30000 | Total reward = 53.78
2022-01-26 14:16:37.045 | DEBUG    | __main__:trials:24 - Trial = 2729/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.047 | DEBUG    | __main__:trials:29 - Trial = 2729/30000 | Total reward = 59.19
2022-01-26 14:16:37.050 | DEBUG    | __main__:trials:24 - Trial = 2730/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.050 | DEBUG    | __main__:trials:29 - Trial = 2730/30000 | Total reward = 40.30
2022-01-26 14:16:37.054 | DEBUG    | __main__:trials:24 - Trial = 2731/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.055 | DEBUG    | __main__:trials:29 - Trial = 2731/30000 | Total reward = 55.81
2022-01-26 14:16:37.058 | DEBUG    | __main__:trials:24 - Trial = 2732/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.060 | DEBUG    | __main__:trials:29 - Trial = 2732/30000 | Total reward = 49.14
2022-01-26 14:16:37.063 | DEBUG    | __main__:trials:24 - Trial = 2733/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.064 | DEBUG    | __main__:trials:29 - Trial = 2733/30000 | Total reward = 49.22
2022-01-26 14:16:37.068 | DEBUG    | __main__:trials:24 - Trial = 2734/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.069 | DEBUG    | __main__:trials:29 - Trial = 2734/30000 | Total reward = 51.09
2022-01-26 14:16:37.073 | DEBUG    | __main__:trials:24 - Trial = 2735/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.075 | DEBUG    | __main__:trials:29 - Trial = 2735/30000 | Total reward = 51.90
2022-01-26 14:16:37.079 | DEBUG    | __main__:trials:24 - Trial = 2736/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.080 | DEBUG    | __main__:trials:29 - Trial = 2736/30000 | Total reward = 49.06
2022-01-26 14:16:37.083 | DEBUG    | __main__:trials:24 - Trial = 2737/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.083 | DEBUG    | __main__:trials:29 - Trial = 2737/30000 | Total reward = 33.71
2022-01-26 14:16:37.087 | DEBUG    | __main__:trials:24 - Trial = 2738/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.088 | DEBUG    | __main__:trials:29 - Trial = 2738/30000 | Total reward = 65.23
2022-01-26 14:16:37.092 | DEBUG    | __main__:trials:26 - Trial = 2739/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.093 | DEBUG    | __main__:trials:29 - Trial = 2739/30000 | Total reward = 24.92
2022-01-26 14:16:37.097 | DEBUG    | __main__:trials:24 - Trial = 2740/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.098 | DEBUG    | __main__:trials:29 - Trial = 2740/30000 | Total reward = 49.31
2022-01-26 14:16:37.101 | DEBUG    | __main__:trials:24 - Trial = 2741/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.103 | DEBUG    | __main__:trials:29 - Trial = 2741/30000 | Total reward = 50.04
2022-01-26 14:16:37.106 | DEBUG    | __main__:trials:24 - Trial = 2742/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.108 | DEBUG    | __main__:trials:29 - Trial = 2742/30000 | Total reward = 47.24
2022-01-26 14:16:37.112 | DEBUG    | __main__:trials:24 - Trial = 2743/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.113 | DEBUG    | __main__:trials:29 - Trial = 2743/30000 | Total reward = 52.48
2022-01-26 14:16:37.117 | DEBUG    | __main__:trials:24 - Trial = 2744/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.117 | DEBUG    | __main__:trials:29 - Trial = 2744/30000 | Total reward = 25.59
2022-01-26 14:16:37.122 | DEBUG    | __main__:trials:24 - Trial = 2745/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.123 | DEBUG    | __main__:trials:29 - Trial = 2745/30000 | Total reward = 50.50
2022-01-26 14:16:37.127 | DEBUG    | __main__:trials:24 - Trial = 2746/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.129 | DEBUG    | __main__:trials:29 - Trial = 2746/30000 | Total reward = 60.47
2022-01-26 14:16:37.132 | DEBUG    | __main__:trials:24 - Trial = 2747/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.134 | DEBUG    | __main__:trials:29 - Trial = 2747/30000 | Total reward = 28.12
2022-01-26 14:16:37.137 | DEBUG    | __main__:trials:24 - Trial = 2748/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.139 | DEBUG    | __main__:trials:29 - Trial = 2748/30000 | Total reward = 60.27
2022-01-26 14:16:37.142 | DEBUG    | __main__:trials:24 - Trial = 2749/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.143 | DEBUG    | __main__:trials:29 - Trial = 2749/30000 | Total reward = 51.92
2022-01-26 14:16:37.146 | DEBUG    | __main__:trials:24 - Trial = 2750/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.147 | DEBUG    | __main__:trials:29 - Trial = 2750/30000 | Total reward = 43.46
2022-01-26 14:16:37.150 | DEBUG    | __main__:trials:24 - Trial = 2751/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.153 | DEBUG    | __main__:trials:29 - Trial = 2751/30000 | Total reward = 55.17
2022-01-26 14:16:37.156 | DEBUG    | __main__:trials:24 - Trial = 2752/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.157 | DEBUG    | __main__:trials:29 - Trial = 2752/30000 | Total reward = 4.17
2022-01-26 14:16:37.162 | DEBUG    | __main__:trials:24 - Trial = 2753/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.164 | DEBUG    | __main__:trials:29 - Trial = 2753/30000 | Total reward = 51.27
2022-01-26 14:16:37.167 | DEBUG    | __main__:trials:24 - Trial = 2754/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.169 | DEBUG    | __main__:trials:29 - Trial = 2754/30000 | Total reward = 52.47
2022-01-26 14:16:37.172 | DEBUG    | __main__:trials:24 - Trial = 2755/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.173 | DEBUG    | __main__:trials:29 - Trial = 2755/30000 | Total reward = 53.39
2022-01-26 14:16:37.177 | DEBUG    | __main__:trials:24 - Trial = 2756/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.178 | DEBUG    | __main__:trials:29 - Trial = 2756/30000 | Total reward = 63.05
2022-01-26 14:16:37.181 | DEBUG    | __main__:trials:26 - Trial = 2757/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.182 | DEBUG    | __main__:trials:29 - Trial = 2757/30000 | Total reward = 33.23
2022-01-26 14:16:37.185 | DEBUG    | __main__:trials:24 - Trial = 2758/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.187 | DEBUG    | __main__:trials:29 - Trial = 2758/30000 | Total reward = 51.84
2022-01-26 14:16:37.190 | DEBUG    | __main__:trials:24 - Trial = 2759/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.192 | DEBUG    | __main__:trials:29 - Trial = 2759/30000 | Total reward = 53.17
2022-01-26 14:16:37.195 | DEBUG    | __main__:trials:24 - Trial = 2760/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.197 | DEBUG    | __main__:trials:29 - Trial = 2760/30000 | Total reward = 59.86
2022-01-26 14:16:37.200 | DEBUG    | __main__:trials:24 - Trial = 2761/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.202 | DEBUG    | __main__:trials:29 - Trial = 2761/30000 | Total reward = 57.15
2022-01-26 14:16:37.206 | DEBUG    | __main__:trials:24 - Trial = 2762/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.208 | DEBUG    | __main__:trials:29 - Trial = 2762/30000 | Total reward = 49.14
2022-01-26 14:16:37.212 | DEBUG    | __main__:trials:24 - Trial = 2763/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.213 | DEBUG    | __main__:trials:29 - Trial = 2763/30000 | Total reward = 41.03
2022-01-26 14:16:37.216 | DEBUG    | __main__:trials:24 - Trial = 2764/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.218 | DEBUG    | __main__:trials:29 - Trial = 2764/30000 | Total reward = 47.12
2022-01-26 14:16:37.222 | DEBUG    | __main__:trials:24 - Trial = 2765/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.223 | DEBUG    | __main__:trials:29 - Trial = 2765/30000 | Total reward = 53.04
2022-01-26 14:16:37.227 | DEBUG    | __main__:trials:24 - Trial = 2766/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.228 | DEBUG    | __main__:trials:29 - Trial = 2766/30000 | Total reward = 50.45
2022-01-26 14:16:37.232 | DEBUG    | __main__:trials:24 - Trial = 2767/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.234 | DEBUG    | __main__:trials:29 - Trial = 2767/30000 | Total reward = 64.00
2022-01-26 14:16:37.237 | DEBUG    | __main__:trials:24 - Trial = 2768/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.239 | DEBUG    | __main__:trials:29 - Trial = 2768/30000 | Total reward = 53.02
2022-01-26 14:16:37.242 | DEBUG    | __main__:trials:24 - Trial = 2769/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.244 | DEBUG    | __main__:trials:29 - Trial = 2769/30000 | Total reward = 54.36
2022-01-26 14:16:37.248 | DEBUG    | __main__:trials:24 - Trial = 2770/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.250 | DEBUG    | __main__:trials:29 - Trial = 2770/30000 | Total reward = 49.43
2022-01-26 14:16:37.253 | DEBUG    | __main__:trials:24 - Trial = 2771/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.255 | DEBUG    | __main__:trials:29 - Trial = 2771/30000 | Total reward = 50.18
2022-01-26 14:16:37.258 | DEBUG    | __main__:trials:26 - Trial = 2772/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.260 | DEBUG    | __main__:trials:29 - Trial = 2772/30000 | Total reward = 17.28
2022-01-26 14:16:37.264 | DEBUG    | __main__:trials:24 - Trial = 2773/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.266 | DEBUG    | __main__:trials:29 - Trial = 2773/30000 | Total reward = 56.84
2022-01-26 14:16:37.270 | DEBUG    | __main__:trials:24 - Trial = 2774/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.271 | DEBUG    | __main__:trials:29 - Trial = 2774/30000 | Total reward = 47.80
2022-01-26 14:16:37.275 | DEBUG    | __main__:trials:24 - Trial = 2775/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.277 | DEBUG    | __main__:trials:29 - Trial = 2775/30000 | Total reward = 52.87
2022-01-26 14:16:37.280 | DEBUG    | __main__:trials:24 - Trial = 2776/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.282 | DEBUG    | __main__:trials:29 - Trial = 2776/30000 | Total reward = 51.52
2022-01-26 14:16:37.286 | DEBUG    | __main__:trials:24 - Trial = 2777/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.288 | DEBUG    | __main__:trials:29 - Trial = 2777/30000 | Total reward = 49.54
2022-01-26 14:16:37.291 | DEBUG    | __main__:trials:24 - Trial = 2778/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.292 | DEBUG    | __main__:trials:29 - Trial = 2778/30000 | Total reward = 50.32
2022-01-26 14:16:37.296 | DEBUG    | __main__:trials:24 - Trial = 2779/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.298 | DEBUG    | __main__:trials:29 - Trial = 2779/30000 | Total reward = 30.58
2022-01-26 14:16:37.302 | DEBUG    | __main__:trials:24 - Trial = 2780/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.304 | DEBUG    | __main__:trials:29 - Trial = 2780/30000 | Total reward = 44.87
2022-01-26 14:16:37.308 | DEBUG    | __main__:trials:24 - Trial = 2781/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.309 | DEBUG    | __main__:trials:29 - Trial = 2781/30000 | Total reward = 53.20
2022-01-26 14:16:37.313 | DEBUG    | __main__:trials:24 - Trial = 2782/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.315 | DEBUG    | __main__:trials:29 - Trial = 2782/30000 | Total reward = 49.30
2022-01-26 14:16:37.318 | DEBUG    | __main__:trials:24 - Trial = 2783/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.320 | DEBUG    | __main__:trials:29 - Trial = 2783/30000 | Total reward = 50.93
2022-01-26 14:16:37.324 | DEBUG    | __main__:trials:24 - Trial = 2784/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.326 | DEBUG    | __main__:trials:29 - Trial = 2784/30000 | Total reward = 52.18
2022-01-26 14:16:37.330 | DEBUG    | __main__:trials:24 - Trial = 2785/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.331 | DEBUG    | __main__:trials:29 - Trial = 2785/30000 | Total reward = 56.35
2022-01-26 14:16:37.335 | DEBUG    | __main__:trials:24 - Trial = 2786/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.337 | DEBUG    | __main__:trials:29 - Trial = 2786/30000 | Total reward = 49.03
2022-01-26 14:16:37.341 | DEBUG    | __main__:trials:24 - Trial = 2787/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.342 | DEBUG    | __main__:trials:29 - Trial = 2787/30000 | Total reward = 45.26
2022-01-26 14:16:37.345 | DEBUG    | __main__:trials:24 - Trial = 2788/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.347 | DEBUG    | __main__:trials:29 - Trial = 2788/30000 | Total reward = 45.27
2022-01-26 14:16:37.350 | DEBUG    | __main__:trials:24 - Trial = 2789/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.351 | DEBUG    | __main__:trials:29 - Trial = 2789/30000 | Total reward = 41.67
2022-01-26 14:16:37.355 | DEBUG    | __main__:trials:24 - Trial = 2790/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.357 | DEBUG    | __main__:trials:29 - Trial = 2790/30000 | Total reward = 49.56
2022-01-26 14:16:37.361 | DEBUG    | __main__:trials:24 - Trial = 2791/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.361 | DEBUG    | __main__:trials:29 - Trial = 2791/30000 | Total reward = 48.38
2022-01-26 14:16:37.366 | DEBUG    | __main__:trials:24 - Trial = 2792/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.367 | DEBUG    | __main__:trials:29 - Trial = 2792/30000 | Total reward = 50.05
2022-01-26 14:16:37.370 | DEBUG    | __main__:trials:24 - Trial = 2793/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.372 | DEBUG    | __main__:trials:29 - Trial = 2793/30000 | Total reward = 45.62
2022-01-26 14:16:37.376 | DEBUG    | __main__:trials:24 - Trial = 2794/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.378 | DEBUG    | __main__:trials:29 - Trial = 2794/30000 | Total reward = 56.49
2022-01-26 14:16:37.381 | DEBUG    | __main__:trials:24 - Trial = 2795/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.383 | DEBUG    | __main__:trials:29 - Trial = 2795/30000 | Total reward = 31.20
2022-01-26 14:16:37.387 | DEBUG    | __main__:trials:24 - Trial = 2796/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.388 | DEBUG    | __main__:trials:29 - Trial = 2796/30000 | Total reward = 63.23
2022-01-26 14:16:37.392 | DEBUG    | __main__:trials:24 - Trial = 2797/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.393 | DEBUG    | __main__:trials:29 - Trial = 2797/30000 | Total reward = 53.96
2022-01-26 14:16:37.396 | DEBUG    | __main__:trials:24 - Trial = 2798/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.397 | DEBUG    | __main__:trials:29 - Trial = 2798/30000 | Total reward = 48.32
2022-01-26 14:16:37.400 | DEBUG    | __main__:trials:24 - Trial = 2799/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.402 | DEBUG    | __main__:trials:29 - Trial = 2799/30000 | Total reward = 48.90
2022-01-26 14:16:37.405 | DEBUG    | __main__:trials:24 - Trial = 2800/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.406 | DEBUG    | __main__:trials:29 - Trial = 2800/30000 | Total reward = 43.77
2022-01-26 14:16:37.410 | DEBUG    | __main__:trials:24 - Trial = 2801/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.411 | DEBUG    | __main__:trials:29 - Trial = 2801/30000 | Total reward = 53.65
2022-01-26 14:16:37.415 | DEBUG    | __main__:trials:24 - Trial = 2802/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.417 | DEBUG    | __main__:trials:29 - Trial = 2802/30000 | Total reward = 64.47
2022-01-26 14:16:37.421 | DEBUG    | __main__:trials:24 - Trial = 2803/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.421 | DEBUG    | __main__:trials:29 - Trial = 2803/30000 | Total reward = 50.41
2022-01-26 14:16:37.425 | DEBUG    | __main__:trials:24 - Trial = 2804/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.426 | DEBUG    | __main__:trials:29 - Trial = 2804/30000 | Total reward = 50.93
2022-01-26 14:16:37.430 | DEBUG    | __main__:trials:24 - Trial = 2805/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.431 | DEBUG    | __main__:trials:29 - Trial = 2805/30000 | Total reward = 44.56
2022-01-26 14:16:37.435 | DEBUG    | __main__:trials:24 - Trial = 2806/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.436 | DEBUG    | __main__:trials:29 - Trial = 2806/30000 | Total reward = 48.48
2022-01-26 14:16:37.439 | DEBUG    | __main__:trials:26 - Trial = 2807/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.441 | DEBUG    | __main__:trials:29 - Trial = 2807/30000 | Total reward = 40.30
2022-01-26 14:16:37.444 | DEBUG    | __main__:trials:24 - Trial = 2808/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.446 | DEBUG    | __main__:trials:29 - Trial = 2808/30000 | Total reward = 53.28
2022-01-26 14:16:37.450 | DEBUG    | __main__:trials:24 - Trial = 2809/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.451 | DEBUG    | __main__:trials:29 - Trial = 2809/30000 | Total reward = 49.03
2022-01-26 14:16:37.455 | DEBUG    | __main__:trials:24 - Trial = 2810/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.455 | DEBUG    | __main__:trials:29 - Trial = 2810/30000 | Total reward = 50.04
2022-01-26 14:16:37.460 | DEBUG    | __main__:trials:24 - Trial = 2811/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.460 | DEBUG    | __main__:trials:29 - Trial = 2811/30000 | Total reward = 51.39
2022-01-26 14:16:37.464 | DEBUG    | __main__:trials:24 - Trial = 2812/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.465 | DEBUG    | __main__:trials:29 - Trial = 2812/30000 | Total reward = 44.51
2022-01-26 14:16:37.469 | DEBUG    | __main__:trials:24 - Trial = 2813/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.470 | DEBUG    | __main__:trials:29 - Trial = 2813/30000 | Total reward = 49.31
2022-01-26 14:16:37.474 | DEBUG    | __main__:trials:24 - Trial = 2814/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.475 | DEBUG    | __main__:trials:29 - Trial = 2814/30000 | Total reward = 52.07
2022-01-26 14:16:37.479 | DEBUG    | __main__:trials:26 - Trial = 2815/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.480 | DEBUG    | __main__:trials:29 - Trial = 2815/30000 | Total reward = 23.80
2022-01-26 14:16:37.484 | DEBUG    | __main__:trials:24 - Trial = 2816/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.485 | DEBUG    | __main__:trials:29 - Trial = 2816/30000 | Total reward = 48.25
2022-01-26 14:16:37.489 | DEBUG    | __main__:trials:24 - Trial = 2817/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.490 | DEBUG    | __main__:trials:29 - Trial = 2817/30000 | Total reward = 55.03
2022-01-26 14:16:37.494 | DEBUG    | __main__:trials:24 - Trial = 2818/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.495 | DEBUG    | __main__:trials:29 - Trial = 2818/30000 | Total reward = 59.94
2022-01-26 14:16:37.498 | DEBUG    | __main__:trials:26 - Trial = 2819/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.500 | DEBUG    | __main__:trials:29 - Trial = 2819/30000 | Total reward = 15.66
2022-01-26 14:16:37.504 | DEBUG    | __main__:trials:24 - Trial = 2820/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.505 | DEBUG    | __main__:trials:29 - Trial = 2820/30000 | Total reward = 58.03
2022-01-26 14:16:37.508 | DEBUG    | __main__:trials:26 - Trial = 2821/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.510 | DEBUG    | __main__:trials:29 - Trial = 2821/30000 | Total reward = 16.60
2022-01-26 14:16:37.513 | DEBUG    | __main__:trials:26 - Trial = 2822/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.515 | DEBUG    | __main__:trials:29 - Trial = 2822/30000 | Total reward = 40.30
2022-01-26 14:16:37.518 | DEBUG    | __main__:trials:24 - Trial = 2823/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.520 | DEBUG    | __main__:trials:29 - Trial = 2823/30000 | Total reward = 52.17
2022-01-26 14:16:37.524 | DEBUG    | __main__:trials:24 - Trial = 2824/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.525 | DEBUG    | __main__:trials:29 - Trial = 2824/30000 | Total reward = 35.59
2022-01-26 14:16:37.528 | DEBUG    | __main__:trials:24 - Trial = 2825/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.528 | DEBUG    | __main__:trials:29 - Trial = 2825/30000 | Total reward = 49.06
2022-01-26 14:16:37.532 | DEBUG    | __main__:trials:26 - Trial = 2826/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.533 | DEBUG    | __main__:trials:29 - Trial = 2826/30000 | Total reward = 35.48
2022-01-26 14:16:37.536 | DEBUG    | __main__:trials:24 - Trial = 2827/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.538 | DEBUG    | __main__:trials:29 - Trial = 2827/30000 | Total reward = 57.98
2022-01-26 14:16:37.541 | DEBUG    | __main__:trials:24 - Trial = 2828/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.542 | DEBUG    | __main__:trials:29 - Trial = 2828/30000 | Total reward = 46.64
2022-01-26 14:16:37.546 | DEBUG    | __main__:trials:24 - Trial = 2829/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.547 | DEBUG    | __main__:trials:29 - Trial = 2829/30000 | Total reward = 49.03
2022-01-26 14:16:37.550 | DEBUG    | __main__:trials:24 - Trial = 2830/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.552 | DEBUG    | __main__:trials:29 - Trial = 2830/30000 | Total reward = 57.79
2022-01-26 14:16:37.555 | DEBUG    | __main__:trials:24 - Trial = 2831/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.557 | DEBUG    | __main__:trials:29 - Trial = 2831/30000 | Total reward = 45.96
2022-01-26 14:16:37.560 | DEBUG    | __main__:trials:24 - Trial = 2832/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.562 | DEBUG    | __main__:trials:29 - Trial = 2832/30000 | Total reward = 46.88
2022-01-26 14:16:37.565 | DEBUG    | __main__:trials:24 - Trial = 2833/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.567 | DEBUG    | __main__:trials:29 - Trial = 2833/30000 | Total reward = 53.35
2022-01-26 14:16:37.571 | DEBUG    | __main__:trials:24 - Trial = 2834/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.572 | DEBUG    | __main__:trials:29 - Trial = 2834/30000 | Total reward = 50.12
2022-01-26 14:16:37.576 | DEBUG    | __main__:trials:24 - Trial = 2835/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.577 | DEBUG    | __main__:trials:29 - Trial = 2835/30000 | Total reward = 53.08
2022-01-26 14:16:37.581 | DEBUG    | __main__:trials:24 - Trial = 2836/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.581 | DEBUG    | __main__:trials:29 - Trial = 2836/30000 | Total reward = 50.72
2022-01-26 14:16:37.586 | DEBUG    | __main__:trials:24 - Trial = 2837/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.587 | DEBUG    | __main__:trials:29 - Trial = 2837/30000 | Total reward = 49.05
2022-01-26 14:16:37.590 | DEBUG    | __main__:trials:24 - Trial = 2838/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.593 | DEBUG    | __main__:trials:29 - Trial = 2838/30000 | Total reward = 49.11
2022-01-26 14:16:37.596 | DEBUG    | __main__:trials:24 - Trial = 2839/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.597 | DEBUG    | __main__:trials:29 - Trial = 2839/30000 | Total reward = 46.24
2022-01-26 14:16:37.601 | DEBUG    | __main__:trials:24 - Trial = 2840/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.603 | DEBUG    | __main__:trials:29 - Trial = 2840/30000 | Total reward = 45.97
2022-01-26 14:16:37.606 | DEBUG    | __main__:trials:24 - Trial = 2841/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.608 | DEBUG    | __main__:trials:29 - Trial = 2841/30000 | Total reward = 50.02
2022-01-26 14:16:37.612 | DEBUG    | __main__:trials:24 - Trial = 2842/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.613 | DEBUG    | __main__:trials:29 - Trial = 2842/30000 | Total reward = 48.50
2022-01-26 14:16:37.617 | DEBUG    | __main__:trials:24 - Trial = 2843/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.618 | DEBUG    | __main__:trials:29 - Trial = 2843/30000 | Total reward = 61.86
2022-01-26 14:16:37.622 | DEBUG    | __main__:trials:24 - Trial = 2844/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.623 | DEBUG    | __main__:trials:29 - Trial = 2844/30000 | Total reward = 49.91
2022-01-26 14:16:37.627 | DEBUG    | __main__:trials:24 - Trial = 2845/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.628 | DEBUG    | __main__:trials:29 - Trial = 2845/30000 | Total reward = 49.57
2022-01-26 14:16:37.632 | DEBUG    | __main__:trials:24 - Trial = 2846/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.633 | DEBUG    | __main__:trials:29 - Trial = 2846/30000 | Total reward = 50.03
2022-01-26 14:16:37.637 | DEBUG    | __main__:trials:26 - Trial = 2847/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.638 | DEBUG    | __main__:trials:29 - Trial = 2847/30000 | Total reward = 37.17
2022-01-26 14:16:37.642 | DEBUG    | __main__:trials:24 - Trial = 2848/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.643 | DEBUG    | __main__:trials:29 - Trial = 2848/30000 | Total reward = 41.41
2022-01-26 14:16:37.647 | DEBUG    | __main__:trials:24 - Trial = 2849/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.649 | DEBUG    | __main__:trials:29 - Trial = 2849/30000 | Total reward = 46.25
2022-01-26 14:16:37.652 | DEBUG    | __main__:trials:24 - Trial = 2850/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.654 | DEBUG    | __main__:trials:29 - Trial = 2850/30000 | Total reward = 46.41
2022-01-26 14:16:37.657 | DEBUG    | __main__:trials:24 - Trial = 2851/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.659 | DEBUG    | __main__:trials:29 - Trial = 2851/30000 | Total reward = 45.57
2022-01-26 14:16:37.663 | DEBUG    | __main__:trials:24 - Trial = 2852/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.664 | DEBUG    | __main__:trials:29 - Trial = 2852/30000 | Total reward = 48.01
2022-01-26 14:16:37.668 | DEBUG    | __main__:trials:24 - Trial = 2853/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.669 | DEBUG    | __main__:trials:29 - Trial = 2853/30000 | Total reward = 53.06
2022-01-26 14:16:37.673 | DEBUG    | __main__:trials:24 - Trial = 2854/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.675 | DEBUG    | __main__:trials:29 - Trial = 2854/30000 | Total reward = 51.75
2022-01-26 14:16:37.678 | DEBUG    | __main__:trials:24 - Trial = 2855/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.680 | DEBUG    | __main__:trials:29 - Trial = 2855/30000 | Total reward = 55.39
2022-01-26 14:16:37.683 | DEBUG    | __main__:trials:24 - Trial = 2856/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.685 | DEBUG    | __main__:trials:29 - Trial = 2856/30000 | Total reward = 49.35
2022-01-26 14:16:37.688 | DEBUG    | __main__:trials:24 - Trial = 2857/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.690 | DEBUG    | __main__:trials:29 - Trial = 2857/30000 | Total reward = 49.44
2022-01-26 14:16:37.693 | DEBUG    | __main__:trials:24 - Trial = 2858/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.695 | DEBUG    | __main__:trials:29 - Trial = 2858/30000 | Total reward = 62.61
2022-01-26 14:16:37.698 | DEBUG    | __main__:trials:24 - Trial = 2859/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.700 | DEBUG    | __main__:trials:29 - Trial = 2859/30000 | Total reward = 44.41
2022-01-26 14:16:37.703 | DEBUG    | __main__:trials:24 - Trial = 2860/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.705 | DEBUG    | __main__:trials:29 - Trial = 2860/30000 | Total reward = 34.72
2022-01-26 14:16:37.708 | DEBUG    | __main__:trials:24 - Trial = 2861/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.710 | DEBUG    | __main__:trials:29 - Trial = 2861/30000 | Total reward = 48.77
2022-01-26 14:16:37.713 | DEBUG    | __main__:trials:24 - Trial = 2862/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.715 | DEBUG    | __main__:trials:29 - Trial = 2862/30000 | Total reward = 32.43
2022-01-26 14:16:37.719 | DEBUG    | __main__:trials:24 - Trial = 2863/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.721 | DEBUG    | __main__:trials:29 - Trial = 2863/30000 | Total reward = 60.85
2022-01-26 14:16:37.724 | DEBUG    | __main__:trials:24 - Trial = 2864/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.726 | DEBUG    | __main__:trials:29 - Trial = 2864/30000 | Total reward = 45.08
2022-01-26 14:16:37.729 | DEBUG    | __main__:trials:24 - Trial = 2865/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.731 | DEBUG    | __main__:trials:29 - Trial = 2865/30000 | Total reward = 36.13
2022-01-26 14:16:37.734 | DEBUG    | __main__:trials:24 - Trial = 2866/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.736 | DEBUG    | __main__:trials:29 - Trial = 2866/30000 | Total reward = 46.22
2022-01-26 14:16:37.740 | DEBUG    | __main__:trials:24 - Trial = 2867/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.742 | DEBUG    | __main__:trials:29 - Trial = 2867/30000 | Total reward = 27.56
2022-01-26 14:16:37.746 | DEBUG    | __main__:trials:24 - Trial = 2868/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.747 | DEBUG    | __main__:trials:29 - Trial = 2868/30000 | Total reward = 51.63
2022-01-26 14:16:37.750 | DEBUG    | __main__:trials:24 - Trial = 2869/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.751 | DEBUG    | __main__:trials:29 - Trial = 2869/30000 | Total reward = 30.94
2022-01-26 14:16:37.755 | DEBUG    | __main__:trials:24 - Trial = 2870/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.757 | DEBUG    | __main__:trials:29 - Trial = 2870/30000 | Total reward = 49.98
2022-01-26 14:16:37.760 | DEBUG    | __main__:trials:24 - Trial = 2871/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.761 | DEBUG    | __main__:trials:29 - Trial = 2871/30000 | Total reward = 56.72
2022-01-26 14:16:37.765 | DEBUG    | __main__:trials:24 - Trial = 2872/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.767 | DEBUG    | __main__:trials:29 - Trial = 2872/30000 | Total reward = 51.32
2022-01-26 14:16:37.770 | DEBUG    | __main__:trials:24 - Trial = 2873/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.772 | DEBUG    | __main__:trials:29 - Trial = 2873/30000 | Total reward = 52.51
2022-01-26 14:16:37.775 | DEBUG    | __main__:trials:24 - Trial = 2874/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.777 | DEBUG    | __main__:trials:29 - Trial = 2874/30000 | Total reward = 39.68
2022-01-26 14:16:37.780 | DEBUG    | __main__:trials:24 - Trial = 2875/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.782 | DEBUG    | __main__:trials:29 - Trial = 2875/30000 | Total reward = 25.55
2022-01-26 14:16:37.786 | DEBUG    | __main__:trials:24 - Trial = 2876/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.788 | DEBUG    | __main__:trials:29 - Trial = 2876/30000 | Total reward = 47.71
2022-01-26 14:16:37.790 | DEBUG    | __main__:trials:24 - Trial = 2877/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.792 | DEBUG    | __main__:trials:29 - Trial = 2877/30000 | Total reward = 44.95
2022-01-26 14:16:37.795 | DEBUG    | __main__:trials:24 - Trial = 2878/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.797 | DEBUG    | __main__:trials:29 - Trial = 2878/30000 | Total reward = 38.34
2022-01-26 14:16:37.800 | DEBUG    | __main__:trials:24 - Trial = 2879/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.802 | DEBUG    | __main__:trials:29 - Trial = 2879/30000 | Total reward = 46.29
2022-01-26 14:16:37.806 | DEBUG    | __main__:trials:26 - Trial = 2880/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.806 | DEBUG    | __main__:trials:29 - Trial = 2880/30000 | Total reward = 22.61
2022-01-26 14:16:37.811 | DEBUG    | __main__:trials:24 - Trial = 2881/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.812 | DEBUG    | __main__:trials:29 - Trial = 2881/30000 | Total reward = 35.11
2022-01-26 14:16:37.816 | DEBUG    | __main__:trials:24 - Trial = 2882/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.818 | DEBUG    | __main__:trials:29 - Trial = 2882/30000 | Total reward = 36.96
2022-01-26 14:16:37.821 | DEBUG    | __main__:trials:24 - Trial = 2883/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.823 | DEBUG    | __main__:trials:29 - Trial = 2883/30000 | Total reward = 51.45
2022-01-26 14:16:37.826 | DEBUG    | __main__:trials:24 - Trial = 2884/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.828 | DEBUG    | __main__:trials:29 - Trial = 2884/30000 | Total reward = 47.53
2022-01-26 14:16:37.832 | DEBUG    | __main__:trials:24 - Trial = 2885/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.833 | DEBUG    | __main__:trials:29 - Trial = 2885/30000 | Total reward = 54.71
2022-01-26 14:16:37.837 | DEBUG    | __main__:trials:24 - Trial = 2886/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.838 | DEBUG    | __main__:trials:29 - Trial = 2886/30000 | Total reward = 46.47
2022-01-26 14:16:37.842 | DEBUG    | __main__:trials:24 - Trial = 2887/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.843 | DEBUG    | __main__:trials:29 - Trial = 2887/30000 | Total reward = 49.62
2022-01-26 14:16:37.847 | DEBUG    | __main__:trials:24 - Trial = 2888/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.849 | DEBUG    | __main__:trials:29 - Trial = 2888/30000 | Total reward = 48.52
2022-01-26 14:16:37.852 | DEBUG    | __main__:trials:24 - Trial = 2889/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.854 | DEBUG    | __main__:trials:29 - Trial = 2889/30000 | Total reward = 47.02
2022-01-26 14:16:37.857 | DEBUG    | __main__:trials:24 - Trial = 2890/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.859 | DEBUG    | __main__:trials:29 - Trial = 2890/30000 | Total reward = 23.29
2022-01-26 14:16:37.862 | DEBUG    | __main__:trials:24 - Trial = 2891/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.864 | DEBUG    | __main__:trials:29 - Trial = 2891/30000 | Total reward = 42.54
2022-01-26 14:16:37.867 | DEBUG    | __main__:trials:24 - Trial = 2892/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.869 | DEBUG    | __main__:trials:29 - Trial = 2892/30000 | Total reward = 48.32
2022-01-26 14:16:37.873 | DEBUG    | __main__:trials:24 - Trial = 2893/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.875 | DEBUG    | __main__:trials:29 - Trial = 2893/30000 | Total reward = 27.60
2022-01-26 14:16:37.878 | DEBUG    | __main__:trials:24 - Trial = 2894/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.880 | DEBUG    | __main__:trials:29 - Trial = 2894/30000 | Total reward = 41.68
2022-01-26 14:16:37.883 | DEBUG    | __main__:trials:24 - Trial = 2895/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.885 | DEBUG    | __main__:trials:29 - Trial = 2895/30000 | Total reward = 46.23
2022-01-26 14:16:37.888 | DEBUG    | __main__:trials:24 - Trial = 2896/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.890 | DEBUG    | __main__:trials:29 - Trial = 2896/30000 | Total reward = 56.84
2022-01-26 14:16:37.893 | DEBUG    | __main__:trials:24 - Trial = 2897/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.894 | DEBUG    | __main__:trials:29 - Trial = 2897/30000 | Total reward = 52.72
2022-01-26 14:16:37.898 | DEBUG    | __main__:trials:24 - Trial = 2898/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.900 | DEBUG    | __main__:trials:29 - Trial = 2898/30000 | Total reward = 46.09
2022-01-26 14:16:37.902 | DEBUG    | __main__:trials:26 - Trial = 2899/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.904 | DEBUG    | __main__:trials:29 - Trial = 2899/30000 | Total reward = 13.84
2022-01-26 14:16:37.908 | DEBUG    | __main__:trials:24 - Trial = 2900/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.909 | DEBUG    | __main__:trials:29 - Trial = 2900/30000 | Total reward = 49.35
2022-01-26 14:16:37.912 | DEBUG    | __main__:trials:24 - Trial = 2901/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.914 | DEBUG    | __main__:trials:29 - Trial = 2901/30000 | Total reward = 57.86
2022-01-26 14:16:37.918 | DEBUG    | __main__:trials:24 - Trial = 2902/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.919 | DEBUG    | __main__:trials:29 - Trial = 2902/30000 | Total reward = 51.18
2022-01-26 14:16:37.923 | DEBUG    | __main__:trials:24 - Trial = 2903/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.925 | DEBUG    | __main__:trials:29 - Trial = 2903/30000 | Total reward = 55.75
2022-01-26 14:16:37.928 | DEBUG    | __main__:trials:26 - Trial = 2904/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.928 | DEBUG    | __main__:trials:29 - Trial = 2904/30000 | Total reward = 18.51
2022-01-26 14:16:37.932 | DEBUG    | __main__:trials:24 - Trial = 2905/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.933 | DEBUG    | __main__:trials:29 - Trial = 2905/30000 | Total reward = 32.78
2022-01-26 14:16:37.937 | DEBUG    | __main__:trials:24 - Trial = 2906/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.938 | DEBUG    | __main__:trials:29 - Trial = 2906/30000 | Total reward = 61.73
2022-01-26 14:16:37.941 | DEBUG    | __main__:trials:24 - Trial = 2907/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.943 | DEBUG    | __main__:trials:29 - Trial = 2907/30000 | Total reward = 55.53
2022-01-26 14:16:37.947 | DEBUG    | __main__:trials:24 - Trial = 2908/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.947 | DEBUG    | __main__:trials:29 - Trial = 2908/30000 | Total reward = 54.80
2022-01-26 14:16:37.950 | DEBUG    | __main__:trials:26 - Trial = 2909/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.951 | DEBUG    | __main__:trials:29 - Trial = 2909/30000 | Total reward = 28.61
2022-01-26 14:16:37.955 | DEBUG    | __main__:trials:24 - Trial = 2910/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.956 | DEBUG    | __main__:trials:29 - Trial = 2910/30000 | Total reward = 51.50
2022-01-26 14:16:37.961 | DEBUG    | __main__:trials:24 - Trial = 2911/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.962 | DEBUG    | __main__:trials:29 - Trial = 2911/30000 | Total reward = 56.83
2022-01-26 14:16:37.965 | DEBUG    | __main__:trials:24 - Trial = 2912/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.966 | DEBUG    | __main__:trials:29 - Trial = 2912/30000 | Total reward = 45.47
2022-01-26 14:16:37.969 | DEBUG    | __main__:trials:26 - Trial = 2913/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.970 | DEBUG    | __main__:trials:29 - Trial = 2913/30000 | Total reward = 28.19
2022-01-26 14:16:37.973 | DEBUG    | __main__:trials:24 - Trial = 2914/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.974 | DEBUG    | __main__:trials:29 - Trial = 2914/30000 | Total reward = 55.01
2022-01-26 14:16:37.979 | DEBUG    | __main__:trials:24 - Trial = 2915/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.980 | DEBUG    | __main__:trials:29 - Trial = 2915/30000 | Total reward = 49.95
2022-01-26 14:16:37.984 | DEBUG    | __main__:trials:26 - Trial = 2916/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:37.985 | DEBUG    | __main__:trials:29 - Trial = 2916/30000 | Total reward = 36.58
2022-01-26 14:16:37.989 | DEBUG    | __main__:trials:24 - Trial = 2917/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.991 | DEBUG    | __main__:trials:29 - Trial = 2917/30000 | Total reward = 52.51
2022-01-26 14:16:37.995 | DEBUG    | __main__:trials:24 - Trial = 2918/30000 | Max number of steps (20) reached
2022-01-26 14:16:37.996 | DEBUG    | __main__:trials:29 - Trial = 2918/30000 | Total reward = 56.89
2022-01-26 14:16:38.000 | DEBUG    | __main__:trials:24 - Trial = 2919/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.001 | DEBUG    | __main__:trials:29 - Trial = 2919/30000 | Total reward = 47.43
2022-01-26 14:16:38.005 | DEBUG    | __main__:trials:24 - Trial = 2920/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.007 | DEBUG    | __main__:trials:29 - Trial = 2920/30000 | Total reward = 30.07
2022-01-26 14:16:38.010 | DEBUG    | __main__:trials:24 - Trial = 2921/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.012 | DEBUG    | __main__:trials:29 - Trial = 2921/30000 | Total reward = 45.53
2022-01-26 14:16:38.015 | DEBUG    | __main__:trials:24 - Trial = 2922/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.017 | DEBUG    | __main__:trials:29 - Trial = 2922/30000 | Total reward = 49.35
2022-01-26 14:16:38.020 | DEBUG    | __main__:trials:24 - Trial = 2923/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.022 | DEBUG    | __main__:trials:29 - Trial = 2923/30000 | Total reward = 47.18
2022-01-26 14:16:38.025 | DEBUG    | __main__:trials:24 - Trial = 2924/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.027 | DEBUG    | __main__:trials:29 - Trial = 2924/30000 | Total reward = 51.74
2022-01-26 14:16:38.030 | DEBUG    | __main__:trials:24 - Trial = 2925/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.032 | DEBUG    | __main__:trials:29 - Trial = 2925/30000 | Total reward = 44.82
2022-01-26 14:16:38.036 | DEBUG    | __main__:trials:24 - Trial = 2926/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.037 | DEBUG    | __main__:trials:29 - Trial = 2926/30000 | Total reward = 54.28
2022-01-26 14:16:38.041 | DEBUG    | __main__:trials:24 - Trial = 2927/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.041 | DEBUG    | __main__:trials:29 - Trial = 2927/30000 | Total reward = 63.30
2022-01-26 14:16:38.046 | DEBUG    | __main__:trials:24 - Trial = 2928/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.046 | DEBUG    | __main__:trials:29 - Trial = 2928/30000 | Total reward = 48.79
2022-01-26 14:16:38.051 | DEBUG    | __main__:trials:24 - Trial = 2929/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.052 | DEBUG    | __main__:trials:29 - Trial = 2929/30000 | Total reward = 27.90
2022-01-26 14:16:38.056 | DEBUG    | __main__:trials:24 - Trial = 2930/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.058 | DEBUG    | __main__:trials:29 - Trial = 2930/30000 | Total reward = 47.87
2022-01-26 14:16:38.061 | DEBUG    | __main__:trials:24 - Trial = 2931/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.062 | DEBUG    | __main__:trials:29 - Trial = 2931/30000 | Total reward = 49.56
2022-01-26 14:16:38.066 | DEBUG    | __main__:trials:24 - Trial = 2932/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.068 | DEBUG    | __main__:trials:29 - Trial = 2932/30000 | Total reward = 65.34
2022-01-26 14:16:38.071 | DEBUG    | __main__:trials:24 - Trial = 2933/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.073 | DEBUG    | __main__:trials:29 - Trial = 2933/30000 | Total reward = 50.15
2022-01-26 14:16:38.076 | DEBUG    | __main__:trials:24 - Trial = 2934/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.078 | DEBUG    | __main__:trials:29 - Trial = 2934/30000 | Total reward = 54.66
2022-01-26 14:16:38.081 | DEBUG    | __main__:trials:24 - Trial = 2935/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.082 | DEBUG    | __main__:trials:29 - Trial = 2935/30000 | Total reward = 61.37
2022-01-26 14:16:38.085 | DEBUG    | __main__:trials:24 - Trial = 2936/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.086 | DEBUG    | __main__:trials:29 - Trial = 2936/30000 | Total reward = 47.65
2022-01-26 14:16:38.089 | DEBUG    | __main__:trials:24 - Trial = 2937/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.091 | DEBUG    | __main__:trials:29 - Trial = 2937/30000 | Total reward = 41.11
2022-01-26 14:16:38.094 | DEBUG    | __main__:trials:24 - Trial = 2938/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.095 | DEBUG    | __main__:trials:29 - Trial = 2938/30000 | Total reward = 30.18
2022-01-26 14:16:38.098 | DEBUG    | __main__:trials:24 - Trial = 2939/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.100 | DEBUG    | __main__:trials:29 - Trial = 2939/30000 | Total reward = 38.42
2022-01-26 14:16:38.104 | DEBUG    | __main__:trials:24 - Trial = 2940/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.105 | DEBUG    | __main__:trials:29 - Trial = 2940/30000 | Total reward = 43.91
2022-01-26 14:16:38.108 | DEBUG    | __main__:trials:24 - Trial = 2941/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.110 | DEBUG    | __main__:trials:29 - Trial = 2941/30000 | Total reward = 50.60
2022-01-26 14:16:38.114 | DEBUG    | __main__:trials:24 - Trial = 2942/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.114 | DEBUG    | __main__:trials:29 - Trial = 2942/30000 | Total reward = 53.27
2022-01-26 14:16:38.118 | DEBUG    | __main__:trials:24 - Trial = 2943/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.120 | DEBUG    | __main__:trials:29 - Trial = 2943/30000 | Total reward = 50.11
2022-01-26 14:16:38.124 | DEBUG    | __main__:trials:24 - Trial = 2944/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.125 | DEBUG    | __main__:trials:29 - Trial = 2944/30000 | Total reward = 53.47
2022-01-26 14:16:38.129 | DEBUG    | __main__:trials:24 - Trial = 2945/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.130 | DEBUG    | __main__:trials:29 - Trial = 2945/30000 | Total reward = 63.97
2022-01-26 14:16:38.134 | DEBUG    | __main__:trials:24 - Trial = 2946/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.135 | DEBUG    | __main__:trials:29 - Trial = 2946/30000 | Total reward = 47.16
2022-01-26 14:16:38.138 | DEBUG    | __main__:trials:24 - Trial = 2947/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.140 | DEBUG    | __main__:trials:29 - Trial = 2947/30000 | Total reward = 59.73
2022-01-26 14:16:38.144 | DEBUG    | __main__:trials:24 - Trial = 2948/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.145 | DEBUG    | __main__:trials:29 - Trial = 2948/30000 | Total reward = 52.44
2022-01-26 14:16:38.149 | DEBUG    | __main__:trials:24 - Trial = 2949/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.150 | DEBUG    | __main__:trials:29 - Trial = 2949/30000 | Total reward = 53.02
2022-01-26 14:16:38.154 | DEBUG    | __main__:trials:24 - Trial = 2950/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.156 | DEBUG    | __main__:trials:29 - Trial = 2950/30000 | Total reward = 38.01
2022-01-26 14:16:38.160 | DEBUG    | __main__:trials:24 - Trial = 2951/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.160 | DEBUG    | __main__:trials:29 - Trial = 2951/30000 | Total reward = 43.10
2022-01-26 14:16:38.164 | DEBUG    | __main__:trials:24 - Trial = 2952/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.166 | DEBUG    | __main__:trials:29 - Trial = 2952/30000 | Total reward = 53.79
2022-01-26 14:16:38.170 | DEBUG    | __main__:trials:24 - Trial = 2953/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.171 | DEBUG    | __main__:trials:29 - Trial = 2953/30000 | Total reward = 53.47
2022-01-26 14:16:38.175 | DEBUG    | __main__:trials:24 - Trial = 2954/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.177 | DEBUG    | __main__:trials:29 - Trial = 2954/30000 | Total reward = 55.19
2022-01-26 14:16:38.180 | DEBUG    | __main__:trials:24 - Trial = 2955/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.182 | DEBUG    | __main__:trials:29 - Trial = 2955/30000 | Total reward = 50.27
2022-01-26 14:16:38.186 | DEBUG    | __main__:trials:24 - Trial = 2956/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.187 | DEBUG    | __main__:trials:29 - Trial = 2956/30000 | Total reward = 52.98
2022-01-26 14:16:38.190 | DEBUG    | __main__:trials:24 - Trial = 2957/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.192 | DEBUG    | __main__:trials:29 - Trial = 2957/30000 | Total reward = 11.56
2022-01-26 14:16:38.195 | DEBUG    | __main__:trials:24 - Trial = 2958/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.197 | DEBUG    | __main__:trials:29 - Trial = 2958/30000 | Total reward = 49.59
2022-01-26 14:16:38.201 | DEBUG    | __main__:trials:24 - Trial = 2959/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.202 | DEBUG    | __main__:trials:29 - Trial = 2959/30000 | Total reward = 17.21
2022-01-26 14:16:38.206 | DEBUG    | __main__:trials:24 - Trial = 2960/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.207 | DEBUG    | __main__:trials:29 - Trial = 2960/30000 | Total reward = 44.95
2022-01-26 14:16:38.211 | DEBUG    | __main__:trials:24 - Trial = 2961/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.213 | DEBUG    | __main__:trials:29 - Trial = 2961/30000 | Total reward = 50.61
2022-01-26 14:16:38.216 | DEBUG    | __main__:trials:24 - Trial = 2962/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.218 | DEBUG    | __main__:trials:29 - Trial = 2962/30000 | Total reward = 50.89
2022-01-26 14:16:38.221 | DEBUG    | __main__:trials:24 - Trial = 2963/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.223 | DEBUG    | __main__:trials:29 - Trial = 2963/30000 | Total reward = 41.92
2022-01-26 14:16:38.227 | DEBUG    | __main__:trials:24 - Trial = 2964/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.228 | DEBUG    | __main__:trials:29 - Trial = 2964/30000 | Total reward = 43.28
2022-01-26 14:16:38.230 | DEBUG    | __main__:trials:26 - Trial = 2965/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.232 | DEBUG    | __main__:trials:29 - Trial = 2965/30000 | Total reward = 13.84
2022-01-26 14:16:38.236 | DEBUG    | __main__:trials:24 - Trial = 2966/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.237 | DEBUG    | __main__:trials:29 - Trial = 2966/30000 | Total reward = 63.11
2022-01-26 14:16:38.241 | DEBUG    | __main__:trials:24 - Trial = 2967/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.242 | DEBUG    | __main__:trials:29 - Trial = 2967/30000 | Total reward = 53.51
2022-01-26 14:16:38.246 | DEBUG    | __main__:trials:24 - Trial = 2968/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.247 | DEBUG    | __main__:trials:29 - Trial = 2968/30000 | Total reward = 51.48
2022-01-26 14:16:38.251 | DEBUG    | __main__:trials:24 - Trial = 2969/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.253 | DEBUG    | __main__:trials:29 - Trial = 2969/30000 | Total reward = 47.82
2022-01-26 14:16:38.256 | DEBUG    | __main__:trials:26 - Trial = 2970/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.258 | DEBUG    | __main__:trials:29 - Trial = 2970/30000 | Total reward = 34.57
2022-01-26 14:16:38.261 | DEBUG    | __main__:trials:26 - Trial = 2971/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.263 | DEBUG    | __main__:trials:29 - Trial = 2971/30000 | Total reward = 15.17
2022-01-26 14:16:38.266 | DEBUG    | __main__:trials:26 - Trial = 2972/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.267 | DEBUG    | __main__:trials:29 - Trial = 2972/30000 | Total reward = 31.87
2022-01-26 14:16:38.271 | DEBUG    | __main__:trials:24 - Trial = 2973/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.273 | DEBUG    | __main__:trials:29 - Trial = 2973/30000 | Total reward = 49.32
2022-01-26 14:16:38.276 | DEBUG    | __main__:trials:24 - Trial = 2974/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.278 | DEBUG    | __main__:trials:29 - Trial = 2974/30000 | Total reward = 45.55
2022-01-26 14:16:38.282 | DEBUG    | __main__:trials:24 - Trial = 2975/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.283 | DEBUG    | __main__:trials:29 - Trial = 2975/30000 | Total reward = 61.36
2022-01-26 14:16:38.287 | DEBUG    | __main__:trials:24 - Trial = 2976/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.288 | DEBUG    | __main__:trials:29 - Trial = 2976/30000 | Total reward = 53.27
2022-01-26 14:16:38.292 | DEBUG    | __main__:trials:24 - Trial = 2977/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.293 | DEBUG    | __main__:trials:29 - Trial = 2977/30000 | Total reward = 29.86
2022-01-26 14:16:38.297 | DEBUG    | __main__:trials:24 - Trial = 2978/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.299 | DEBUG    | __main__:trials:29 - Trial = 2978/30000 | Total reward = 49.83
2022-01-26 14:16:38.302 | DEBUG    | __main__:trials:24 - Trial = 2979/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.303 | DEBUG    | __main__:trials:29 - Trial = 2979/30000 | Total reward = 39.33
2022-01-26 14:16:38.305 | DEBUG    | __main__:trials:26 - Trial = 2980/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.307 | DEBUG    | __main__:trials:29 - Trial = 2980/30000 | Total reward = 16.85
2022-01-26 14:16:38.310 | DEBUG    | __main__:trials:24 - Trial = 2981/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.312 | DEBUG    | __main__:trials:29 - Trial = 2981/30000 | Total reward = 62.57
2022-01-26 14:16:38.316 | DEBUG    | __main__:trials:24 - Trial = 2982/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.318 | DEBUG    | __main__:trials:29 - Trial = 2982/30000 | Total reward = 63.08
2022-01-26 14:16:38.321 | DEBUG    | __main__:trials:24 - Trial = 2983/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.322 | DEBUG    | __main__:trials:29 - Trial = 2983/30000 | Total reward = 47.01
2022-01-26 14:16:38.325 | DEBUG    | __main__:trials:24 - Trial = 2984/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.326 | DEBUG    | __main__:trials:29 - Trial = 2984/30000 | Total reward = 45.99
2022-01-26 14:16:38.329 | DEBUG    | __main__:trials:24 - Trial = 2985/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.331 | DEBUG    | __main__:trials:29 - Trial = 2985/30000 | Total reward = 45.39
2022-01-26 14:16:38.334 | DEBUG    | __main__:trials:24 - Trial = 2986/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.336 | DEBUG    | __main__:trials:29 - Trial = 2986/30000 | Total reward = 34.74
2022-01-26 14:16:38.338 | DEBUG    | __main__:trials:26 - Trial = 2987/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.340 | DEBUG    | __main__:trials:29 - Trial = 2987/30000 | Total reward = 20.46
2022-01-26 14:16:38.344 | DEBUG    | __main__:trials:24 - Trial = 2988/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.345 | DEBUG    | __main__:trials:29 - Trial = 2988/30000 | Total reward = 30.31
2022-01-26 14:16:38.348 | DEBUG    | __main__:trials:26 - Trial = 2989/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.350 | DEBUG    | __main__:trials:29 - Trial = 2989/30000 | Total reward = 27.49
2022-01-26 14:16:38.354 | DEBUG    | __main__:trials:24 - Trial = 2990/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.355 | DEBUG    | __main__:trials:29 - Trial = 2990/30000 | Total reward = 53.27
2022-01-26 14:16:38.359 | DEBUG    | __main__:trials:24 - Trial = 2991/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.361 | DEBUG    | __main__:trials:29 - Trial = 2991/30000 | Total reward = 53.85
2022-01-26 14:16:38.364 | DEBUG    | __main__:trials:24 - Trial = 2992/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.366 | DEBUG    | __main__:trials:29 - Trial = 2992/30000 | Total reward = 35.45
2022-01-26 14:16:38.370 | DEBUG    | __main__:trials:24 - Trial = 2993/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.371 | DEBUG    | __main__:trials:29 - Trial = 2993/30000 | Total reward = 53.02
2022-01-26 14:16:38.375 | DEBUG    | __main__:trials:24 - Trial = 2994/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.377 | DEBUG    | __main__:trials:29 - Trial = 2994/30000 | Total reward = 49.03
2022-01-26 14:16:38.380 | DEBUG    | __main__:trials:24 - Trial = 2995/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.382 | DEBUG    | __main__:trials:29 - Trial = 2995/30000 | Total reward = 54.12
2022-01-26 14:16:38.385 | DEBUG    | __main__:trials:26 - Trial = 2996/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.387 | DEBUG    | __main__:trials:29 - Trial = 2996/30000 | Total reward = 38.28
2022-01-26 14:16:38.390 | DEBUG    | __main__:trials:24 - Trial = 2997/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.392 | DEBUG    | __main__:trials:29 - Trial = 2997/30000 | Total reward = 57.52
2022-01-26 14:16:38.395 | DEBUG    | __main__:trials:24 - Trial = 2998/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.397 | DEBUG    | __main__:trials:29 - Trial = 2998/30000 | Total reward = 50.58
2022-01-26 14:16:38.400 | DEBUG    | __main__:trials:24 - Trial = 2999/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.401 | DEBUG    | __main__:trials:29 - Trial = 2999/30000 | Total reward = 51.44
2022-01-26 14:16:38.405 | DEBUG    | __main__:trials:24 - Trial = 3000/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.405 | DEBUG    | __main__:trials:29 - Trial = 3000/30000 | Total reward = 46.61
2022-01-26 14:16:38.409 | DEBUG    | __main__:trials:24 - Trial = 3001/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.411 | DEBUG    | __main__:trials:29 - Trial = 3001/30000 | Total reward = 45.83
2022-01-26 14:16:38.414 | DEBUG    | __main__:trials:24 - Trial = 3002/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.415 | DEBUG    | __main__:trials:29 - Trial = 3002/30000 | Total reward = 52.23
2022-01-26 14:16:38.419 | DEBUG    | __main__:trials:24 - Trial = 3003/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.420 | DEBUG    | __main__:trials:29 - Trial = 3003/30000 | Total reward = 50.38
2022-01-26 14:16:38.423 | DEBUG    | __main__:trials:24 - Trial = 3004/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.425 | DEBUG    | __main__:trials:29 - Trial = 3004/30000 | Total reward = 59.14
2022-01-26 14:16:38.428 | DEBUG    | __main__:trials:24 - Trial = 3005/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.430 | DEBUG    | __main__:trials:29 - Trial = 3005/30000 | Total reward = 52.36
2022-01-26 14:16:38.434 | DEBUG    | __main__:trials:24 - Trial = 3006/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.436 | DEBUG    | __main__:trials:29 - Trial = 3006/30000 | Total reward = 56.45
2022-01-26 14:16:38.440 | DEBUG    | __main__:trials:24 - Trial = 3007/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.441 | DEBUG    | __main__:trials:29 - Trial = 3007/30000 | Total reward = 51.57
2022-01-26 14:16:38.445 | DEBUG    | __main__:trials:24 - Trial = 3008/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.446 | DEBUG    | __main__:trials:29 - Trial = 3008/30000 | Total reward = 51.14
2022-01-26 14:16:38.449 | DEBUG    | __main__:trials:24 - Trial = 3009/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.451 | DEBUG    | __main__:trials:29 - Trial = 3009/30000 | Total reward = 48.01
2022-01-26 14:16:38.454 | DEBUG    | __main__:trials:24 - Trial = 3010/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.456 | DEBUG    | __main__:trials:29 - Trial = 3010/30000 | Total reward = 52.08
2022-01-26 14:16:38.460 | DEBUG    | __main__:trials:24 - Trial = 3011/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.462 | DEBUG    | __main__:trials:29 - Trial = 3011/30000 | Total reward = 47.11
2022-01-26 14:16:38.466 | DEBUG    | __main__:trials:24 - Trial = 3012/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.467 | DEBUG    | __main__:trials:29 - Trial = 3012/30000 | Total reward = 61.34
2022-01-26 14:16:38.471 | DEBUG    | __main__:trials:24 - Trial = 3013/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.472 | DEBUG    | __main__:trials:29 - Trial = 3013/30000 | Total reward = 47.78
2022-01-26 14:16:38.476 | DEBUG    | __main__:trials:24 - Trial = 3014/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.478 | DEBUG    | __main__:trials:29 - Trial = 3014/30000 | Total reward = 62.59
2022-01-26 14:16:38.481 | DEBUG    | __main__:trials:26 - Trial = 3015/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.483 | DEBUG    | __main__:trials:29 - Trial = 3015/30000 | Total reward = 26.84
2022-01-26 14:16:38.486 | DEBUG    | __main__:trials:24 - Trial = 3016/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.488 | DEBUG    | __main__:trials:29 - Trial = 3016/30000 | Total reward = 46.68
2022-01-26 14:16:38.491 | DEBUG    | __main__:trials:26 - Trial = 3017/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.492 | DEBUG    | __main__:trials:29 - Trial = 3017/30000 | Total reward = 14.60
2022-01-26 14:16:38.496 | DEBUG    | __main__:trials:24 - Trial = 3018/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.498 | DEBUG    | __main__:trials:29 - Trial = 3018/30000 | Total reward = 48.27
2022-01-26 14:16:38.502 | DEBUG    | __main__:trials:24 - Trial = 3019/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.502 | DEBUG    | __main__:trials:29 - Trial = 3019/30000 | Total reward = 57.82
2022-01-26 14:16:38.506 | DEBUG    | __main__:trials:24 - Trial = 3020/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.508 | DEBUG    | __main__:trials:29 - Trial = 3020/30000 | Total reward = 45.07
2022-01-26 14:16:38.511 | DEBUG    | __main__:trials:24 - Trial = 3021/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.513 | DEBUG    | __main__:trials:29 - Trial = 3021/30000 | Total reward = 48.63
2022-01-26 14:16:38.516 | DEBUG    | __main__:trials:24 - Trial = 3022/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.517 | DEBUG    | __main__:trials:29 - Trial = 3022/30000 | Total reward = 55.93
2022-01-26 14:16:38.520 | DEBUG    | __main__:trials:26 - Trial = 3023/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.522 | DEBUG    | __main__:trials:29 - Trial = 3023/30000 | Total reward = 34.36
2022-01-26 14:16:38.526 | DEBUG    | __main__:trials:24 - Trial = 3024/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.527 | DEBUG    | __main__:trials:29 - Trial = 3024/30000 | Total reward = 47.45
2022-01-26 14:16:38.531 | DEBUG    | __main__:trials:24 - Trial = 3025/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.532 | DEBUG    | __main__:trials:29 - Trial = 3025/30000 | Total reward = 46.88
2022-01-26 14:16:38.536 | DEBUG    | __main__:trials:24 - Trial = 3026/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.537 | DEBUG    | __main__:trials:29 - Trial = 3026/30000 | Total reward = 48.49
2022-01-26 14:16:38.541 | DEBUG    | __main__:trials:24 - Trial = 3027/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.543 | DEBUG    | __main__:trials:29 - Trial = 3027/30000 | Total reward = 34.17
2022-01-26 14:16:38.546 | DEBUG    | __main__:trials:24 - Trial = 3028/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.548 | DEBUG    | __main__:trials:29 - Trial = 3028/30000 | Total reward = 52.62
2022-01-26 14:16:38.552 | DEBUG    | __main__:trials:26 - Trial = 3029/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.552 | DEBUG    | __main__:trials:29 - Trial = 3029/30000 | Total reward = 21.69
2022-01-26 14:16:38.556 | DEBUG    | __main__:trials:24 - Trial = 3030/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.558 | DEBUG    | __main__:trials:29 - Trial = 3030/30000 | Total reward = 53.57
2022-01-26 14:16:38.562 | DEBUG    | __main__:trials:24 - Trial = 3031/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.563 | DEBUG    | __main__:trials:29 - Trial = 3031/30000 | Total reward = 44.06
2022-01-26 14:16:38.567 | DEBUG    | __main__:trials:24 - Trial = 3032/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.568 | DEBUG    | __main__:trials:29 - Trial = 3032/30000 | Total reward = 50.71
2022-01-26 14:16:38.572 | DEBUG    | __main__:trials:24 - Trial = 3033/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.574 | DEBUG    | __main__:trials:29 - Trial = 3033/30000 | Total reward = 60.12
2022-01-26 14:16:38.578 | DEBUG    | __main__:trials:24 - Trial = 3034/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.579 | DEBUG    | __main__:trials:29 - Trial = 3034/30000 | Total reward = 53.86
2022-01-26 14:16:38.583 | DEBUG    | __main__:trials:24 - Trial = 3035/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.584 | DEBUG    | __main__:trials:29 - Trial = 3035/30000 | Total reward = 56.44
2022-01-26 14:16:38.588 | DEBUG    | __main__:trials:24 - Trial = 3036/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.590 | DEBUG    | __main__:trials:29 - Trial = 3036/30000 | Total reward = 48.04
2022-01-26 14:16:38.593 | DEBUG    | __main__:trials:24 - Trial = 3037/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.595 | DEBUG    | __main__:trials:29 - Trial = 3037/30000 | Total reward = 48.56
2022-01-26 14:16:38.599 | DEBUG    | __main__:trials:24 - Trial = 3038/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.600 | DEBUG    | __main__:trials:29 - Trial = 3038/30000 | Total reward = 45.60
2022-01-26 14:16:38.604 | DEBUG    | __main__:trials:24 - Trial = 3039/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.606 | DEBUG    | __main__:trials:29 - Trial = 3039/30000 | Total reward = 61.77
2022-01-26 14:16:38.609 | DEBUG    | __main__:trials:24 - Trial = 3040/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.611 | DEBUG    | __main__:trials:29 - Trial = 3040/30000 | Total reward = 60.95
2022-01-26 14:16:38.614 | DEBUG    | __main__:trials:24 - Trial = 3041/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.616 | DEBUG    | __main__:trials:29 - Trial = 3041/30000 | Total reward = 43.91
2022-01-26 14:16:38.619 | DEBUG    | __main__:trials:24 - Trial = 3042/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.621 | DEBUG    | __main__:trials:29 - Trial = 3042/30000 | Total reward = 39.99
2022-01-26 14:16:38.625 | DEBUG    | __main__:trials:24 - Trial = 3043/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.626 | DEBUG    | __main__:trials:29 - Trial = 3043/30000 | Total reward = 62.80
2022-01-26 14:16:38.630 | DEBUG    | __main__:trials:24 - Trial = 3044/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.631 | DEBUG    | __main__:trials:29 - Trial = 3044/30000 | Total reward = 51.05
2022-01-26 14:16:38.635 | DEBUG    | __main__:trials:24 - Trial = 3045/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.637 | DEBUG    | __main__:trials:29 - Trial = 3045/30000 | Total reward = 52.57
2022-01-26 14:16:38.640 | DEBUG    | __main__:trials:24 - Trial = 3046/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.642 | DEBUG    | __main__:trials:29 - Trial = 3046/30000 | Total reward = 51.54
2022-01-26 14:16:38.644 | DEBUG    | __main__:trials:26 - Trial = 3047/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.646 | DEBUG    | __main__:trials:29 - Trial = 3047/30000 | Total reward = 10.21
2022-01-26 14:16:38.650 | DEBUG    | __main__:trials:24 - Trial = 3048/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.651 | DEBUG    | __main__:trials:29 - Trial = 3048/30000 | Total reward = 37.92
2022-01-26 14:16:38.655 | DEBUG    | __main__:trials:24 - Trial = 3049/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.656 | DEBUG    | __main__:trials:29 - Trial = 3049/30000 | Total reward = 58.44
2022-01-26 14:16:38.660 | DEBUG    | __main__:trials:24 - Trial = 3050/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.662 | DEBUG    | __main__:trials:29 - Trial = 3050/30000 | Total reward = 63.66
2022-01-26 14:16:38.666 | DEBUG    | __main__:trials:24 - Trial = 3051/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.668 | DEBUG    | __main__:trials:29 - Trial = 3051/30000 | Total reward = 57.21
2022-01-26 14:16:38.672 | DEBUG    | __main__:trials:24 - Trial = 3052/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.674 | DEBUG    | __main__:trials:29 - Trial = 3052/30000 | Total reward = 46.86
2022-01-26 14:16:38.677 | DEBUG    | __main__:trials:24 - Trial = 3053/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.679 | DEBUG    | __main__:trials:29 - Trial = 3053/30000 | Total reward = 32.72
2022-01-26 14:16:38.682 | DEBUG    | __main__:trials:24 - Trial = 3054/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.684 | DEBUG    | __main__:trials:29 - Trial = 3054/30000 | Total reward = 50.48
2022-01-26 14:16:38.688 | DEBUG    | __main__:trials:24 - Trial = 3055/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.689 | DEBUG    | __main__:trials:29 - Trial = 3055/30000 | Total reward = 45.76
2022-01-26 14:16:38.693 | DEBUG    | __main__:trials:24 - Trial = 3056/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.695 | DEBUG    | __main__:trials:29 - Trial = 3056/30000 | Total reward = 60.02
2022-01-26 14:16:38.697 | DEBUG    | __main__:trials:24 - Trial = 3057/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.699 | DEBUG    | __main__:trials:29 - Trial = 3057/30000 | Total reward = 59.12
2022-01-26 14:16:38.702 | DEBUG    | __main__:trials:24 - Trial = 3058/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.704 | DEBUG    | __main__:trials:29 - Trial = 3058/30000 | Total reward = 23.45
2022-01-26 14:16:38.707 | DEBUG    | __main__:trials:26 - Trial = 3059/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.708 | DEBUG    | __main__:trials:29 - Trial = 3059/30000 | Total reward = 17.31
2022-01-26 14:16:38.712 | DEBUG    | __main__:trials:24 - Trial = 3060/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.713 | DEBUG    | __main__:trials:29 - Trial = 3060/30000 | Total reward = 51.48
2022-01-26 14:16:38.717 | DEBUG    | __main__:trials:24 - Trial = 3061/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.718 | DEBUG    | __main__:trials:29 - Trial = 3061/30000 | Total reward = 46.10
2022-01-26 14:16:38.722 | DEBUG    | __main__:trials:24 - Trial = 3062/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.724 | DEBUG    | __main__:trials:29 - Trial = 3062/30000 | Total reward = 53.68
2022-01-26 14:16:38.728 | DEBUG    | __main__:trials:24 - Trial = 3063/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.729 | DEBUG    | __main__:trials:29 - Trial = 3063/30000 | Total reward = 59.47
2022-01-26 14:16:38.733 | DEBUG    | __main__:trials:24 - Trial = 3064/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.734 | DEBUG    | __main__:trials:29 - Trial = 3064/30000 | Total reward = 51.86
2022-01-26 14:16:38.737 | DEBUG    | __main__:trials:24 - Trial = 3065/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.739 | DEBUG    | __main__:trials:29 - Trial = 3065/30000 | Total reward = 51.64
2022-01-26 14:16:38.743 | DEBUG    | __main__:trials:24 - Trial = 3066/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.744 | DEBUG    | __main__:trials:29 - Trial = 3066/30000 | Total reward = 61.24
2022-01-26 14:16:38.749 | DEBUG    | __main__:trials:24 - Trial = 3067/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.749 | DEBUG    | __main__:trials:29 - Trial = 3067/30000 | Total reward = 48.71
2022-01-26 14:16:38.754 | DEBUG    | __main__:trials:24 - Trial = 3068/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.755 | DEBUG    | __main__:trials:29 - Trial = 3068/30000 | Total reward = 62.04
2022-01-26 14:16:38.759 | DEBUG    | __main__:trials:24 - Trial = 3069/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.761 | DEBUG    | __main__:trials:29 - Trial = 3069/30000 | Total reward = 62.51
2022-01-26 14:16:38.764 | DEBUG    | __main__:trials:24 - Trial = 3070/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.766 | DEBUG    | __main__:trials:29 - Trial = 3070/30000 | Total reward = 57.06
2022-01-26 14:16:38.769 | DEBUG    | __main__:trials:24 - Trial = 3071/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.771 | DEBUG    | __main__:trials:29 - Trial = 3071/30000 | Total reward = 60.29
2022-01-26 14:16:38.775 | DEBUG    | __main__:trials:24 - Trial = 3072/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.776 | DEBUG    | __main__:trials:29 - Trial = 3072/30000 | Total reward = 56.44
2022-01-26 14:16:38.780 | DEBUG    | __main__:trials:26 - Trial = 3073/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.780 | DEBUG    | __main__:trials:29 - Trial = 3073/30000 | Total reward = 10.40
2022-01-26 14:16:38.785 | DEBUG    | __main__:trials:24 - Trial = 3074/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.786 | DEBUG    | __main__:trials:29 - Trial = 3074/30000 | Total reward = 56.37
2022-01-26 14:16:38.790 | DEBUG    | __main__:trials:24 - Trial = 3075/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.791 | DEBUG    | __main__:trials:29 - Trial = 3075/30000 | Total reward = 43.81
2022-01-26 14:16:38.794 | DEBUG    | __main__:trials:24 - Trial = 3076/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.796 | DEBUG    | __main__:trials:29 - Trial = 3076/30000 | Total reward = 55.50
2022-01-26 14:16:38.799 | DEBUG    | __main__:trials:26 - Trial = 3077/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.800 | DEBUG    | __main__:trials:29 - Trial = 3077/30000 | Total reward = 12.91
2022-01-26 14:16:38.804 | DEBUG    | __main__:trials:24 - Trial = 3078/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.806 | DEBUG    | __main__:trials:29 - Trial = 3078/30000 | Total reward = 49.05
2022-01-26 14:16:38.808 | DEBUG    | __main__:trials:24 - Trial = 3079/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.810 | DEBUG    | __main__:trials:29 - Trial = 3079/30000 | Total reward = 57.98
2022-01-26 14:16:38.814 | DEBUG    | __main__:trials:24 - Trial = 3080/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.815 | DEBUG    | __main__:trials:29 - Trial = 3080/30000 | Total reward = 55.35
2022-01-26 14:16:38.819 | DEBUG    | __main__:trials:24 - Trial = 3081/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.821 | DEBUG    | __main__:trials:29 - Trial = 3081/30000 | Total reward = 58.68
2022-01-26 14:16:38.824 | DEBUG    | __main__:trials:24 - Trial = 3082/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.825 | DEBUG    | __main__:trials:29 - Trial = 3082/30000 | Total reward = 56.37
2022-01-26 14:16:38.829 | DEBUG    | __main__:trials:24 - Trial = 3083/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.829 | DEBUG    | __main__:trials:29 - Trial = 3083/30000 | Total reward = 56.37
2022-01-26 14:16:38.833 | DEBUG    | __main__:trials:24 - Trial = 3084/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.834 | DEBUG    | __main__:trials:29 - Trial = 3084/30000 | Total reward = 47.23
2022-01-26 14:16:38.837 | DEBUG    | __main__:trials:24 - Trial = 3085/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.838 | DEBUG    | __main__:trials:29 - Trial = 3085/30000 | Total reward = 37.28
2022-01-26 14:16:38.841 | DEBUG    | __main__:trials:24 - Trial = 3086/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.843 | DEBUG    | __main__:trials:29 - Trial = 3086/30000 | Total reward = 28.84
2022-01-26 14:16:38.846 | DEBUG    | __main__:trials:24 - Trial = 3087/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.847 | DEBUG    | __main__:trials:29 - Trial = 3087/30000 | Total reward = 27.92
2022-01-26 14:16:38.851 | DEBUG    | __main__:trials:24 - Trial = 3088/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.853 | DEBUG    | __main__:trials:29 - Trial = 3088/30000 | Total reward = 56.27
2022-01-26 14:16:38.855 | DEBUG    | __main__:trials:24 - Trial = 3089/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.857 | DEBUG    | __main__:trials:29 - Trial = 3089/30000 | Total reward = 54.15
2022-01-26 14:16:38.860 | DEBUG    | __main__:trials:24 - Trial = 3090/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.862 | DEBUG    | __main__:trials:29 - Trial = 3090/30000 | Total reward = 56.40
2022-01-26 14:16:38.866 | DEBUG    | __main__:trials:24 - Trial = 3091/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.867 | DEBUG    | __main__:trials:29 - Trial = 3091/30000 | Total reward = 49.90
2022-01-26 14:16:38.871 | DEBUG    | __main__:trials:26 - Trial = 3092/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.873 | DEBUG    | __main__:trials:29 - Trial = 3092/30000 | Total reward = 36.00
2022-01-26 14:16:38.876 | DEBUG    | __main__:trials:24 - Trial = 3093/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.878 | DEBUG    | __main__:trials:29 - Trial = 3093/30000 | Total reward = 44.01
2022-01-26 14:16:38.881 | DEBUG    | __main__:trials:24 - Trial = 3094/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.883 | DEBUG    | __main__:trials:29 - Trial = 3094/30000 | Total reward = 54.43
2022-01-26 14:16:38.887 | DEBUG    | __main__:trials:24 - Trial = 3095/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.888 | DEBUG    | __main__:trials:29 - Trial = 3095/30000 | Total reward = 51.56
2022-01-26 14:16:38.892 | DEBUG    | __main__:trials:24 - Trial = 3096/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.894 | DEBUG    | __main__:trials:29 - Trial = 3096/30000 | Total reward = 48.10
2022-01-26 14:16:38.896 | DEBUG    | __main__:trials:26 - Trial = 3097/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.898 | DEBUG    | __main__:trials:29 - Trial = 3097/30000 | Total reward = 16.82
2022-01-26 14:16:38.901 | DEBUG    | __main__:trials:24 - Trial = 3098/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.903 | DEBUG    | __main__:trials:29 - Trial = 3098/30000 | Total reward = 46.18
2022-01-26 14:16:38.907 | DEBUG    | __main__:trials:24 - Trial = 3099/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.908 | DEBUG    | __main__:trials:29 - Trial = 3099/30000 | Total reward = 53.26
2022-01-26 14:16:38.912 | DEBUG    | __main__:trials:26 - Trial = 3100/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.913 | DEBUG    | __main__:trials:29 - Trial = 3100/30000 | Total reward = 20.85
2022-01-26 14:16:38.917 | DEBUG    | __main__:trials:24 - Trial = 3101/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.917 | DEBUG    | __main__:trials:29 - Trial = 3101/30000 | Total reward = 60.94
2022-01-26 14:16:38.921 | DEBUG    | __main__:trials:24 - Trial = 3102/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.922 | DEBUG    | __main__:trials:29 - Trial = 3102/30000 | Total reward = 54.06
2022-01-26 14:16:38.926 | DEBUG    | __main__:trials:24 - Trial = 3103/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.928 | DEBUG    | __main__:trials:29 - Trial = 3103/30000 | Total reward = 55.98
2022-01-26 14:16:38.932 | DEBUG    | __main__:trials:24 - Trial = 3104/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.933 | DEBUG    | __main__:trials:29 - Trial = 3104/30000 | Total reward = 49.21
2022-01-26 14:16:38.937 | DEBUG    | __main__:trials:24 - Trial = 3105/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.938 | DEBUG    | __main__:trials:29 - Trial = 3105/30000 | Total reward = 50.16
2022-01-26 14:16:38.941 | DEBUG    | __main__:trials:24 - Trial = 3106/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.942 | DEBUG    | __main__:trials:29 - Trial = 3106/30000 | Total reward = 58.31
2022-01-26 14:16:38.945 | DEBUG    | __main__:trials:26 - Trial = 3107/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:38.946 | DEBUG    | __main__:trials:29 - Trial = 3107/30000 | Total reward = 22.50
2022-01-26 14:16:38.950 | DEBUG    | __main__:trials:24 - Trial = 3108/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.952 | DEBUG    | __main__:trials:29 - Trial = 3108/30000 | Total reward = 57.55
2022-01-26 14:16:38.955 | DEBUG    | __main__:trials:24 - Trial = 3109/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.957 | DEBUG    | __main__:trials:29 - Trial = 3109/30000 | Total reward = 51.93
2022-01-26 14:16:38.960 | DEBUG    | __main__:trials:24 - Trial = 3110/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.961 | DEBUG    | __main__:trials:29 - Trial = 3110/30000 | Total reward = 49.43
2022-01-26 14:16:38.964 | DEBUG    | __main__:trials:24 - Trial = 3111/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.966 | DEBUG    | __main__:trials:29 - Trial = 3111/30000 | Total reward = 56.19
2022-01-26 14:16:38.970 | DEBUG    | __main__:trials:24 - Trial = 3112/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.971 | DEBUG    | __main__:trials:29 - Trial = 3112/30000 | Total reward = 57.63
2022-01-26 14:16:38.975 | DEBUG    | __main__:trials:24 - Trial = 3113/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.977 | DEBUG    | __main__:trials:29 - Trial = 3113/30000 | Total reward = 47.38
2022-01-26 14:16:38.980 | DEBUG    | __main__:trials:24 - Trial = 3114/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.982 | DEBUG    | __main__:trials:29 - Trial = 3114/30000 | Total reward = 34.46
2022-01-26 14:16:38.986 | DEBUG    | __main__:trials:24 - Trial = 3115/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.987 | DEBUG    | __main__:trials:29 - Trial = 3115/30000 | Total reward = 16.36
2022-01-26 14:16:38.991 | DEBUG    | __main__:trials:24 - Trial = 3116/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.993 | DEBUG    | __main__:trials:29 - Trial = 3116/30000 | Total reward = 56.34
2022-01-26 14:16:38.996 | DEBUG    | __main__:trials:24 - Trial = 3117/30000 | Max number of steps (20) reached
2022-01-26 14:16:38.997 | DEBUG    | __main__:trials:29 - Trial = 3117/30000 | Total reward = 41.43
2022-01-26 14:16:39.001 | DEBUG    | __main__:trials:24 - Trial = 3118/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.003 | DEBUG    | __main__:trials:29 - Trial = 3118/30000 | Total reward = 41.61
2022-01-26 14:16:39.006 | DEBUG    | __main__:trials:24 - Trial = 3119/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.008 | DEBUG    | __main__:trials:29 - Trial = 3119/30000 | Total reward = 56.30
2022-01-26 14:16:39.012 | DEBUG    | __main__:trials:24 - Trial = 3120/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.013 | DEBUG    | __main__:trials:29 - Trial = 3120/30000 | Total reward = 56.13
2022-01-26 14:16:39.016 | DEBUG    | __main__:trials:24 - Trial = 3121/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.018 | DEBUG    | __main__:trials:29 - Trial = 3121/30000 | Total reward = 56.19
2022-01-26 14:16:39.021 | DEBUG    | __main__:trials:24 - Trial = 3122/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.023 | DEBUG    | __main__:trials:29 - Trial = 3122/30000 | Total reward = 33.49
2022-01-26 14:16:39.027 | DEBUG    | __main__:trials:24 - Trial = 3123/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.028 | DEBUG    | __main__:trials:29 - Trial = 3123/30000 | Total reward = 56.53
2022-01-26 14:16:39.032 | DEBUG    | __main__:trials:24 - Trial = 3124/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.034 | DEBUG    | __main__:trials:29 - Trial = 3124/30000 | Total reward = 56.19
2022-01-26 14:16:39.037 | DEBUG    | __main__:trials:24 - Trial = 3125/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.039 | DEBUG    | __main__:trials:29 - Trial = 3125/30000 | Total reward = 33.71
2022-01-26 14:16:39.043 | DEBUG    | __main__:trials:24 - Trial = 3126/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.044 | DEBUG    | __main__:trials:29 - Trial = 3126/30000 | Total reward = 32.96
2022-01-26 14:16:39.048 | DEBUG    | __main__:trials:24 - Trial = 3127/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.049 | DEBUG    | __main__:trials:29 - Trial = 3127/30000 | Total reward = 52.52
2022-01-26 14:16:39.053 | DEBUG    | __main__:trials:24 - Trial = 3128/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.055 | DEBUG    | __main__:trials:29 - Trial = 3128/30000 | Total reward = 37.39
2022-01-26 14:16:39.058 | DEBUG    | __main__:trials:24 - Trial = 3129/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.060 | DEBUG    | __main__:trials:29 - Trial = 3129/30000 | Total reward = 51.84
2022-01-26 14:16:39.063 | DEBUG    | __main__:trials:24 - Trial = 3130/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.065 | DEBUG    | __main__:trials:29 - Trial = 3130/30000 | Total reward = 54.96
2022-01-26 14:16:39.068 | DEBUG    | __main__:trials:24 - Trial = 3131/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.070 | DEBUG    | __main__:trials:29 - Trial = 3131/30000 | Total reward = 64.84
2022-01-26 14:16:39.073 | DEBUG    | __main__:trials:24 - Trial = 3132/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.074 | DEBUG    | __main__:trials:29 - Trial = 3132/30000 | Total reward = 58.88
2022-01-26 14:16:39.077 | DEBUG    | __main__:trials:24 - Trial = 3133/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.078 | DEBUG    | __main__:trials:29 - Trial = 3133/30000 | Total reward = 56.44
2022-01-26 14:16:39.081 | DEBUG    | __main__:trials:24 - Trial = 3134/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.083 | DEBUG    | __main__:trials:29 - Trial = 3134/30000 | Total reward = 63.90
2022-01-26 14:16:39.087 | DEBUG    | __main__:trials:24 - Trial = 3135/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.088 | DEBUG    | __main__:trials:29 - Trial = 3135/30000 | Total reward = 56.65
2022-01-26 14:16:39.091 | DEBUG    | __main__:trials:24 - Trial = 3136/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.092 | DEBUG    | __main__:trials:29 - Trial = 3136/30000 | Total reward = 56.84
2022-01-26 14:16:39.096 | DEBUG    | __main__:trials:24 - Trial = 3137/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.098 | DEBUG    | __main__:trials:29 - Trial = 3137/30000 | Total reward = 43.22
2022-01-26 14:16:39.101 | DEBUG    | __main__:trials:24 - Trial = 3138/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.102 | DEBUG    | __main__:trials:29 - Trial = 3138/30000 | Total reward = 50.14
2022-01-26 14:16:39.106 | DEBUG    | __main__:trials:24 - Trial = 3139/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.107 | DEBUG    | __main__:trials:29 - Trial = 3139/30000 | Total reward = 59.82
2022-01-26 14:16:39.111 | DEBUG    | __main__:trials:24 - Trial = 3140/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.113 | DEBUG    | __main__:trials:29 - Trial = 3140/30000 | Total reward = 55.24
2022-01-26 14:16:39.116 | DEBUG    | __main__:trials:24 - Trial = 3141/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.117 | DEBUG    | __main__:trials:29 - Trial = 3141/30000 | Total reward = 56.10
2022-01-26 14:16:39.121 | DEBUG    | __main__:trials:24 - Trial = 3142/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.122 | DEBUG    | __main__:trials:29 - Trial = 3142/30000 | Total reward = 24.37
2022-01-26 14:16:39.125 | DEBUG    | __main__:trials:24 - Trial = 3143/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.127 | DEBUG    | __main__:trials:29 - Trial = 3143/30000 | Total reward = 49.49
2022-01-26 14:16:39.131 | DEBUG    | __main__:trials:24 - Trial = 3144/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.132 | DEBUG    | __main__:trials:29 - Trial = 3144/30000 | Total reward = 41.89
2022-01-26 14:16:39.136 | DEBUG    | __main__:trials:24 - Trial = 3145/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.138 | DEBUG    | __main__:trials:29 - Trial = 3145/30000 | Total reward = 65.56
2022-01-26 14:16:39.141 | DEBUG    | __main__:trials:24 - Trial = 3146/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.143 | DEBUG    | __main__:trials:29 - Trial = 3146/30000 | Total reward = 51.24
2022-01-26 14:16:39.147 | DEBUG    | __main__:trials:24 - Trial = 3147/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.148 | DEBUG    | __main__:trials:29 - Trial = 3147/30000 | Total reward = 56.44
2022-01-26 14:16:39.151 | DEBUG    | __main__:trials:24 - Trial = 3148/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.153 | DEBUG    | __main__:trials:29 - Trial = 3148/30000 | Total reward = 47.40
2022-01-26 14:16:39.156 | DEBUG    | __main__:trials:24 - Trial = 3149/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.158 | DEBUG    | __main__:trials:29 - Trial = 3149/30000 | Total reward = 48.79
2022-01-26 14:16:39.161 | DEBUG    | __main__:trials:24 - Trial = 3150/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.163 | DEBUG    | __main__:trials:29 - Trial = 3150/30000 | Total reward = 58.51
2022-01-26 14:16:39.165 | DEBUG    | __main__:trials:24 - Trial = 3151/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.167 | DEBUG    | __main__:trials:29 - Trial = 3151/30000 | Total reward = 63.19
2022-01-26 14:16:39.170 | DEBUG    | __main__:trials:26 - Trial = 3152/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.171 | DEBUG    | __main__:trials:29 - Trial = 3152/30000 | Total reward = 17.64
2022-01-26 14:16:39.175 | DEBUG    | __main__:trials:24 - Trial = 3153/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.176 | DEBUG    | __main__:trials:29 - Trial = 3153/30000 | Total reward = 56.44
2022-01-26 14:16:39.180 | DEBUG    | __main__:trials:26 - Trial = 3154/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.182 | DEBUG    | __main__:trials:29 - Trial = 3154/30000 | Total reward = 35.50
2022-01-26 14:16:39.185 | DEBUG    | __main__:trials:24 - Trial = 3155/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.187 | DEBUG    | __main__:trials:29 - Trial = 3155/30000 | Total reward = 28.06
2022-01-26 14:16:39.191 | DEBUG    | __main__:trials:24 - Trial = 3156/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.192 | DEBUG    | __main__:trials:29 - Trial = 3156/30000 | Total reward = 55.16
2022-01-26 14:16:39.196 | DEBUG    | __main__:trials:24 - Trial = 3157/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.197 | DEBUG    | __main__:trials:29 - Trial = 3157/30000 | Total reward = 45.14
2022-01-26 14:16:39.200 | DEBUG    | __main__:trials:24 - Trial = 3158/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.203 | DEBUG    | __main__:trials:29 - Trial = 3158/30000 | Total reward = 55.46
2022-01-26 14:16:39.206 | DEBUG    | __main__:trials:24 - Trial = 3159/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.208 | DEBUG    | __main__:trials:29 - Trial = 3159/30000 | Total reward = 45.71
2022-01-26 14:16:39.211 | DEBUG    | __main__:trials:24 - Trial = 3160/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.213 | DEBUG    | __main__:trials:29 - Trial = 3160/30000 | Total reward = 56.82
2022-01-26 14:16:39.217 | DEBUG    | __main__:trials:24 - Trial = 3161/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.218 | DEBUG    | __main__:trials:29 - Trial = 3161/30000 | Total reward = 46.08
2022-01-26 14:16:39.222 | DEBUG    | __main__:trials:24 - Trial = 3162/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.223 | DEBUG    | __main__:trials:29 - Trial = 3162/30000 | Total reward = 58.28
2022-01-26 14:16:39.227 | DEBUG    | __main__:trials:24 - Trial = 3163/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.228 | DEBUG    | __main__:trials:29 - Trial = 3163/30000 | Total reward = 55.49
2022-01-26 14:16:39.232 | DEBUG    | __main__:trials:24 - Trial = 3164/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.233 | DEBUG    | __main__:trials:29 - Trial = 3164/30000 | Total reward = 28.52
2022-01-26 14:16:39.236 | DEBUG    | __main__:trials:24 - Trial = 3165/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.238 | DEBUG    | __main__:trials:29 - Trial = 3165/30000 | Total reward = 43.56
2022-01-26 14:16:39.242 | DEBUG    | __main__:trials:24 - Trial = 3166/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.244 | DEBUG    | __main__:trials:29 - Trial = 3166/30000 | Total reward = 56.19
2022-01-26 14:16:39.247 | DEBUG    | __main__:trials:24 - Trial = 3167/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.249 | DEBUG    | __main__:trials:29 - Trial = 3167/30000 | Total reward = 57.01
2022-01-26 14:16:39.253 | DEBUG    | __main__:trials:24 - Trial = 3168/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.254 | DEBUG    | __main__:trials:29 - Trial = 3168/30000 | Total reward = 56.60
2022-01-26 14:16:39.258 | DEBUG    | __main__:trials:24 - Trial = 3169/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.259 | DEBUG    | __main__:trials:29 - Trial = 3169/30000 | Total reward = 29.46
2022-01-26 14:16:39.263 | DEBUG    | __main__:trials:24 - Trial = 3170/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.264 | DEBUG    | __main__:trials:29 - Trial = 3170/30000 | Total reward = 53.38
2022-01-26 14:16:39.268 | DEBUG    | __main__:trials:24 - Trial = 3171/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.269 | DEBUG    | __main__:trials:29 - Trial = 3171/30000 | Total reward = 58.16
2022-01-26 14:16:39.273 | DEBUG    | __main__:trials:24 - Trial = 3172/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.274 | DEBUG    | __main__:trials:29 - Trial = 3172/30000 | Total reward = 56.30
2022-01-26 14:16:39.278 | DEBUG    | __main__:trials:24 - Trial = 3173/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.280 | DEBUG    | __main__:trials:29 - Trial = 3173/30000 | Total reward = 51.15
2022-01-26 14:16:39.283 | DEBUG    | __main__:trials:26 - Trial = 3174/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.284 | DEBUG    | __main__:trials:29 - Trial = 3174/30000 | Total reward = 19.54
2022-01-26 14:16:39.288 | DEBUG    | __main__:trials:24 - Trial = 3175/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.290 | DEBUG    | __main__:trials:29 - Trial = 3175/30000 | Total reward = 47.97
2022-01-26 14:16:39.293 | DEBUG    | __main__:trials:24 - Trial = 3176/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.295 | DEBUG    | __main__:trials:29 - Trial = 3176/30000 | Total reward = 53.92
2022-01-26 14:16:39.299 | DEBUG    | __main__:trials:24 - Trial = 3177/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.301 | DEBUG    | __main__:trials:29 - Trial = 3177/30000 | Total reward = 56.44
2022-01-26 14:16:39.304 | DEBUG    | __main__:trials:24 - Trial = 3178/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.306 | DEBUG    | __main__:trials:29 - Trial = 3178/30000 | Total reward = 34.80
2022-01-26 14:16:39.309 | DEBUG    | __main__:trials:26 - Trial = 3179/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.311 | DEBUG    | __main__:trials:29 - Trial = 3179/30000 | Total reward = 25.11
2022-01-26 14:16:39.314 | DEBUG    | __main__:trials:26 - Trial = 3180/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.316 | DEBUG    | __main__:trials:29 - Trial = 3180/30000 | Total reward = 17.61
2022-01-26 14:16:39.319 | DEBUG    | __main__:trials:24 - Trial = 3181/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.321 | DEBUG    | __main__:trials:29 - Trial = 3181/30000 | Total reward = 56.44
2022-01-26 14:16:39.324 | DEBUG    | __main__:trials:26 - Trial = 3182/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.325 | DEBUG    | __main__:trials:29 - Trial = 3182/30000 | Total reward = 22.57
2022-01-26 14:16:39.328 | DEBUG    | __main__:trials:24 - Trial = 3183/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.329 | DEBUG    | __main__:trials:29 - Trial = 3183/30000 | Total reward = 37.70
2022-01-26 14:16:39.333 | DEBUG    | __main__:trials:24 - Trial = 3184/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.334 | DEBUG    | __main__:trials:29 - Trial = 3184/30000 | Total reward = 58.36
2022-01-26 14:16:39.337 | DEBUG    | __main__:trials:26 - Trial = 3185/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.338 | DEBUG    | __main__:trials:29 - Trial = 3185/30000 | Total reward = 16.77
2022-01-26 14:16:39.342 | DEBUG    | __main__:trials:24 - Trial = 3186/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.343 | DEBUG    | __main__:trials:29 - Trial = 3186/30000 | Total reward = 47.90
2022-01-26 14:16:39.346 | DEBUG    | __main__:trials:26 - Trial = 3187/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.348 | DEBUG    | __main__:trials:29 - Trial = 3187/30000 | Total reward = 26.03
2022-01-26 14:16:39.351 | DEBUG    | __main__:trials:24 - Trial = 3188/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.353 | DEBUG    | __main__:trials:29 - Trial = 3188/30000 | Total reward = 56.44
2022-01-26 14:16:39.356 | DEBUG    | __main__:trials:24 - Trial = 3189/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.358 | DEBUG    | __main__:trials:29 - Trial = 3189/30000 | Total reward = 56.41
2022-01-26 14:16:39.362 | DEBUG    | __main__:trials:24 - Trial = 3190/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.363 | DEBUG    | __main__:trials:29 - Trial = 3190/30000 | Total reward = 49.84
2022-01-26 14:16:39.366 | DEBUG    | __main__:trials:24 - Trial = 3191/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.368 | DEBUG    | __main__:trials:29 - Trial = 3191/30000 | Total reward = 41.49
2022-01-26 14:16:39.372 | DEBUG    | __main__:trials:24 - Trial = 3192/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.373 | DEBUG    | __main__:trials:29 - Trial = 3192/30000 | Total reward = 46.82
2022-01-26 14:16:39.377 | DEBUG    | __main__:trials:24 - Trial = 3193/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.378 | DEBUG    | __main__:trials:29 - Trial = 3193/30000 | Total reward = 48.39
2022-01-26 14:16:39.382 | DEBUG    | __main__:trials:24 - Trial = 3194/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.383 | DEBUG    | __main__:trials:29 - Trial = 3194/30000 | Total reward = 56.55
2022-01-26 14:16:39.387 | DEBUG    | __main__:trials:24 - Trial = 3195/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.388 | DEBUG    | __main__:trials:29 - Trial = 3195/30000 | Total reward = 55.00
2022-01-26 14:16:39.392 | DEBUG    | __main__:trials:24 - Trial = 3196/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.394 | DEBUG    | __main__:trials:29 - Trial = 3196/30000 | Total reward = 38.92
2022-01-26 14:16:39.397 | DEBUG    | __main__:trials:24 - Trial = 3197/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.399 | DEBUG    | __main__:trials:29 - Trial = 3197/30000 | Total reward = 48.60
2022-01-26 14:16:39.402 | DEBUG    | __main__:trials:24 - Trial = 3198/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.404 | DEBUG    | __main__:trials:29 - Trial = 3198/30000 | Total reward = 56.58
2022-01-26 14:16:39.407 | DEBUG    | __main__:trials:24 - Trial = 3199/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.409 | DEBUG    | __main__:trials:29 - Trial = 3199/30000 | Total reward = 44.99
2022-01-26 14:16:39.413 | DEBUG    | __main__:trials:24 - Trial = 3200/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.413 | DEBUG    | __main__:trials:29 - Trial = 3200/30000 | Total reward = 43.85
2022-01-26 14:16:39.418 | DEBUG    | __main__:trials:24 - Trial = 3201/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.420 | DEBUG    | __main__:trials:29 - Trial = 3201/30000 | Total reward = 46.73
2022-01-26 14:16:39.423 | DEBUG    | __main__:trials:24 - Trial = 3202/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.425 | DEBUG    | __main__:trials:29 - Trial = 3202/30000 | Total reward = 55.78
2022-01-26 14:16:39.429 | DEBUG    | __main__:trials:26 - Trial = 3203/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.430 | DEBUG    | __main__:trials:29 - Trial = 3203/30000 | Total reward = 33.50
2022-01-26 14:16:39.434 | DEBUG    | __main__:trials:24 - Trial = 3204/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.436 | DEBUG    | __main__:trials:29 - Trial = 3204/30000 | Total reward = 27.25
2022-01-26 14:16:39.439 | DEBUG    | __main__:trials:24 - Trial = 3205/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.441 | DEBUG    | __main__:trials:29 - Trial = 3205/30000 | Total reward = 42.98
2022-01-26 14:16:39.444 | DEBUG    | __main__:trials:24 - Trial = 3206/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.446 | DEBUG    | __main__:trials:29 - Trial = 3206/30000 | Total reward = 45.45
2022-01-26 14:16:39.450 | DEBUG    | __main__:trials:24 - Trial = 3207/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.451 | DEBUG    | __main__:trials:29 - Trial = 3207/30000 | Total reward = 55.92
2022-01-26 14:16:39.454 | DEBUG    | __main__:trials:24 - Trial = 3208/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.456 | DEBUG    | __main__:trials:29 - Trial = 3208/30000 | Total reward = 57.06
2022-01-26 14:16:39.460 | DEBUG    | __main__:trials:24 - Trial = 3209/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.461 | DEBUG    | __main__:trials:29 - Trial = 3209/30000 | Total reward = 23.61
2022-01-26 14:16:39.465 | DEBUG    | __main__:trials:24 - Trial = 3210/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.467 | DEBUG    | __main__:trials:29 - Trial = 3210/30000 | Total reward = 50.32
2022-01-26 14:16:39.471 | DEBUG    | __main__:trials:24 - Trial = 3211/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.472 | DEBUG    | __main__:trials:29 - Trial = 3211/30000 | Total reward = 46.45
2022-01-26 14:16:39.476 | DEBUG    | __main__:trials:24 - Trial = 3212/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.477 | DEBUG    | __main__:trials:29 - Trial = 3212/30000 | Total reward = 52.89
2022-01-26 14:16:39.481 | DEBUG    | __main__:trials:24 - Trial = 3213/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.482 | DEBUG    | __main__:trials:29 - Trial = 3213/30000 | Total reward = 56.19
2022-01-26 14:16:39.486 | DEBUG    | __main__:trials:24 - Trial = 3214/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.488 | DEBUG    | __main__:trials:29 - Trial = 3214/30000 | Total reward = 43.64
2022-01-26 14:16:39.491 | DEBUG    | __main__:trials:24 - Trial = 3215/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.493 | DEBUG    | __main__:trials:29 - Trial = 3215/30000 | Total reward = 50.44
2022-01-26 14:16:39.496 | DEBUG    | __main__:trials:24 - Trial = 3216/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.498 | DEBUG    | __main__:trials:29 - Trial = 3216/30000 | Total reward = 40.35
2022-01-26 14:16:39.501 | DEBUG    | __main__:trials:24 - Trial = 3217/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.503 | DEBUG    | __main__:trials:29 - Trial = 3217/30000 | Total reward = 55.02
2022-01-26 14:16:39.506 | DEBUG    | __main__:trials:24 - Trial = 3218/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.508 | DEBUG    | __main__:trials:29 - Trial = 3218/30000 | Total reward = 34.84
2022-01-26 14:16:39.511 | DEBUG    | __main__:trials:24 - Trial = 3219/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.513 | DEBUG    | __main__:trials:29 - Trial = 3219/30000 | Total reward = 44.26
2022-01-26 14:16:39.516 | DEBUG    | __main__:trials:24 - Trial = 3220/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.518 | DEBUG    | __main__:trials:29 - Trial = 3220/30000 | Total reward = 33.67
2022-01-26 14:16:39.522 | DEBUG    | __main__:trials:24 - Trial = 3221/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.523 | DEBUG    | __main__:trials:29 - Trial = 3221/30000 | Total reward = 51.56
2022-01-26 14:16:39.527 | DEBUG    | __main__:trials:24 - Trial = 3222/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.529 | DEBUG    | __main__:trials:29 - Trial = 3222/30000 | Total reward = 61.78
2022-01-26 14:16:39.533 | DEBUG    | __main__:trials:24 - Trial = 3223/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.533 | DEBUG    | __main__:trials:29 - Trial = 3223/30000 | Total reward = 51.20
2022-01-26 14:16:39.537 | DEBUG    | __main__:trials:24 - Trial = 3224/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.538 | DEBUG    | __main__:trials:29 - Trial = 3224/30000 | Total reward = 57.95
2022-01-26 14:16:39.541 | DEBUG    | __main__:trials:26 - Trial = 3225/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.541 | DEBUG    | __main__:trials:29 - Trial = 3225/30000 | Total reward = 15.51
2022-01-26 14:16:39.545 | DEBUG    | __main__:trials:24 - Trial = 3226/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.546 | DEBUG    | __main__:trials:29 - Trial = 3226/30000 | Total reward = 54.93
2022-01-26 14:16:39.550 | DEBUG    | __main__:trials:24 - Trial = 3227/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.552 | DEBUG    | __main__:trials:29 - Trial = 3227/30000 | Total reward = 56.65
2022-01-26 14:16:39.555 | DEBUG    | __main__:trials:24 - Trial = 3228/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.556 | DEBUG    | __main__:trials:29 - Trial = 3228/30000 | Total reward = 51.28
2022-01-26 14:16:39.559 | DEBUG    | __main__:trials:24 - Trial = 3229/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.561 | DEBUG    | __main__:trials:29 - Trial = 3229/30000 | Total reward = 47.78
2022-01-26 14:16:39.565 | DEBUG    | __main__:trials:24 - Trial = 3230/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.567 | DEBUG    | __main__:trials:29 - Trial = 3230/30000 | Total reward = 57.27
2022-01-26 14:16:39.570 | DEBUG    | __main__:trials:24 - Trial = 3231/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.572 | DEBUG    | __main__:trials:29 - Trial = 3231/30000 | Total reward = 15.72
2022-01-26 14:16:39.574 | DEBUG    | __main__:trials:26 - Trial = 3232/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.577 | DEBUG    | __main__:trials:29 - Trial = 3232/30000 | Total reward = 20.13
2022-01-26 14:16:39.580 | DEBUG    | __main__:trials:24 - Trial = 3233/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.582 | DEBUG    | __main__:trials:29 - Trial = 3233/30000 | Total reward = 40.51
2022-01-26 14:16:39.586 | DEBUG    | __main__:trials:24 - Trial = 3234/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.587 | DEBUG    | __main__:trials:29 - Trial = 3234/30000 | Total reward = 51.22
2022-01-26 14:16:39.591 | DEBUG    | __main__:trials:24 - Trial = 3235/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.593 | DEBUG    | __main__:trials:29 - Trial = 3235/30000 | Total reward = 35.36
2022-01-26 14:16:39.596 | DEBUG    | __main__:trials:24 - Trial = 3236/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.597 | DEBUG    | __main__:trials:29 - Trial = 3236/30000 | Total reward = 64.26
2022-01-26 14:16:39.601 | DEBUG    | __main__:trials:24 - Trial = 3237/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.603 | DEBUG    | __main__:trials:29 - Trial = 3237/30000 | Total reward = 56.03
2022-01-26 14:16:39.606 | DEBUG    | __main__:trials:24 - Trial = 3238/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.608 | DEBUG    | __main__:trials:29 - Trial = 3238/30000 | Total reward = 38.23
2022-01-26 14:16:39.611 | DEBUG    | __main__:trials:24 - Trial = 3239/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.613 | DEBUG    | __main__:trials:29 - Trial = 3239/30000 | Total reward = 54.73
2022-01-26 14:16:39.616 | DEBUG    | __main__:trials:24 - Trial = 3240/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.618 | DEBUG    | __main__:trials:29 - Trial = 3240/30000 | Total reward = 47.06
2022-01-26 14:16:39.622 | DEBUG    | __main__:trials:24 - Trial = 3241/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.623 | DEBUG    | __main__:trials:29 - Trial = 3241/30000 | Total reward = 56.05
2022-01-26 14:16:39.627 | DEBUG    | __main__:trials:24 - Trial = 3242/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.629 | DEBUG    | __main__:trials:29 - Trial = 3242/30000 | Total reward = 55.24
2022-01-26 14:16:39.632 | DEBUG    | __main__:trials:24 - Trial = 3243/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.634 | DEBUG    | __main__:trials:29 - Trial = 3243/30000 | Total reward = 55.29
2022-01-26 14:16:39.638 | DEBUG    | __main__:trials:24 - Trial = 3244/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.639 | DEBUG    | __main__:trials:29 - Trial = 3244/30000 | Total reward = 58.34
2022-01-26 14:16:39.643 | DEBUG    | __main__:trials:24 - Trial = 3245/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.645 | DEBUG    | __main__:trials:29 - Trial = 3245/30000 | Total reward = 61.49
2022-01-26 14:16:39.648 | DEBUG    | __main__:trials:24 - Trial = 3246/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.650 | DEBUG    | __main__:trials:29 - Trial = 3246/30000 | Total reward = 50.70
2022-01-26 14:16:39.654 | DEBUG    | __main__:trials:24 - Trial = 3247/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.655 | DEBUG    | __main__:trials:29 - Trial = 3247/30000 | Total reward = 64.46
2022-01-26 14:16:39.658 | DEBUG    | __main__:trials:24 - Trial = 3248/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.660 | DEBUG    | __main__:trials:29 - Trial = 3248/30000 | Total reward = 39.27
2022-01-26 14:16:39.664 | DEBUG    | __main__:trials:24 - Trial = 3249/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.665 | DEBUG    | __main__:trials:29 - Trial = 3249/30000 | Total reward = 53.83
2022-01-26 14:16:39.669 | DEBUG    | __main__:trials:24 - Trial = 3250/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.671 | DEBUG    | __main__:trials:29 - Trial = 3250/30000 | Total reward = 59.36
2022-01-26 14:16:39.675 | DEBUG    | __main__:trials:24 - Trial = 3251/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.676 | DEBUG    | __main__:trials:29 - Trial = 3251/30000 | Total reward = 40.34
2022-01-26 14:16:39.680 | DEBUG    | __main__:trials:24 - Trial = 3252/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.682 | DEBUG    | __main__:trials:29 - Trial = 3252/30000 | Total reward = 59.04
2022-01-26 14:16:39.685 | DEBUG    | __main__:trials:24 - Trial = 3253/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.687 | DEBUG    | __main__:trials:29 - Trial = 3253/30000 | Total reward = 55.91
2022-01-26 14:16:39.690 | DEBUG    | __main__:trials:24 - Trial = 3254/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.692 | DEBUG    | __main__:trials:29 - Trial = 3254/30000 | Total reward = 53.80
2022-01-26 14:16:39.696 | DEBUG    | __main__:trials:24 - Trial = 3255/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.697 | DEBUG    | __main__:trials:29 - Trial = 3255/30000 | Total reward = 60.91
2022-01-26 14:16:39.700 | DEBUG    | __main__:trials:26 - Trial = 3256/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.702 | DEBUG    | __main__:trials:29 - Trial = 3256/30000 | Total reward = 19.17
2022-01-26 14:16:39.705 | DEBUG    | __main__:trials:24 - Trial = 3257/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.707 | DEBUG    | __main__:trials:29 - Trial = 3257/30000 | Total reward = 46.13
2022-01-26 14:16:39.711 | DEBUG    | __main__:trials:24 - Trial = 3258/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.712 | DEBUG    | __main__:trials:29 - Trial = 3258/30000 | Total reward = 56.68
2022-01-26 14:16:39.716 | DEBUG    | __main__:trials:24 - Trial = 3259/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.717 | DEBUG    | __main__:trials:29 - Trial = 3259/30000 | Total reward = 55.01
2022-01-26 14:16:39.721 | DEBUG    | __main__:trials:24 - Trial = 3260/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.723 | DEBUG    | __main__:trials:29 - Trial = 3260/30000 | Total reward = 63.65
2022-01-26 14:16:39.726 | DEBUG    | __main__:trials:24 - Trial = 3261/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.728 | DEBUG    | __main__:trials:29 - Trial = 3261/30000 | Total reward = 52.20
2022-01-26 14:16:39.732 | DEBUG    | __main__:trials:24 - Trial = 3262/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.733 | DEBUG    | __main__:trials:29 - Trial = 3262/30000 | Total reward = 36.46
2022-01-26 14:16:39.735 | DEBUG    | __main__:trials:26 - Trial = 3263/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.737 | DEBUG    | __main__:trials:29 - Trial = 3263/30000 | Total reward = 17.69
2022-01-26 14:16:39.740 | DEBUG    | __main__:trials:24 - Trial = 3264/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.742 | DEBUG    | __main__:trials:29 - Trial = 3264/30000 | Total reward = 61.03
2022-01-26 14:16:39.745 | DEBUG    | __main__:trials:24 - Trial = 3265/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.747 | DEBUG    | __main__:trials:29 - Trial = 3265/30000 | Total reward = 51.38
2022-01-26 14:16:39.751 | DEBUG    | __main__:trials:24 - Trial = 3266/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.753 | DEBUG    | __main__:trials:29 - Trial = 3266/30000 | Total reward = 42.43
2022-01-26 14:16:39.757 | DEBUG    | __main__:trials:24 - Trial = 3267/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.758 | DEBUG    | __main__:trials:29 - Trial = 3267/30000 | Total reward = 59.12
2022-01-26 14:16:39.761 | DEBUG    | __main__:trials:24 - Trial = 3268/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.762 | DEBUG    | __main__:trials:29 - Trial = 3268/30000 | Total reward = 33.19
2022-01-26 14:16:39.765 | DEBUG    | __main__:trials:24 - Trial = 3269/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.766 | DEBUG    | __main__:trials:29 - Trial = 3269/30000 | Total reward = 43.69
2022-01-26 14:16:39.769 | DEBUG    | __main__:trials:24 - Trial = 3270/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.770 | DEBUG    | __main__:trials:29 - Trial = 3270/30000 | Total reward = 20.92
2022-01-26 14:16:39.773 | DEBUG    | __main__:trials:24 - Trial = 3271/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.775 | DEBUG    | __main__:trials:29 - Trial = 3271/30000 | Total reward = 55.77
2022-01-26 14:16:39.779 | DEBUG    | __main__:trials:24 - Trial = 3272/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.779 | DEBUG    | __main__:trials:29 - Trial = 3272/30000 | Total reward = 57.01
2022-01-26 14:16:39.784 | DEBUG    | __main__:trials:24 - Trial = 3273/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.785 | DEBUG    | __main__:trials:29 - Trial = 3273/30000 | Total reward = 62.93
2022-01-26 14:16:39.789 | DEBUG    | __main__:trials:24 - Trial = 3274/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.791 | DEBUG    | __main__:trials:29 - Trial = 3274/30000 | Total reward = 56.03
2022-01-26 14:16:39.795 | DEBUG    | __main__:trials:24 - Trial = 3275/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.796 | DEBUG    | __main__:trials:29 - Trial = 3275/30000 | Total reward = 31.53
2022-01-26 14:16:39.799 | DEBUG    | __main__:trials:24 - Trial = 3276/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.801 | DEBUG    | __main__:trials:29 - Trial = 3276/30000 | Total reward = 59.72
2022-01-26 14:16:39.805 | DEBUG    | __main__:trials:24 - Trial = 3277/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.806 | DEBUG    | __main__:trials:29 - Trial = 3277/30000 | Total reward = 57.12
2022-01-26 14:16:39.809 | DEBUG    | __main__:trials:24 - Trial = 3278/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.810 | DEBUG    | __main__:trials:29 - Trial = 3278/30000 | Total reward = 46.30
2022-01-26 14:16:39.814 | DEBUG    | __main__:trials:24 - Trial = 3279/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.814 | DEBUG    | __main__:trials:29 - Trial = 3279/30000 | Total reward = 60.04
2022-01-26 14:16:39.818 | DEBUG    | __main__:trials:24 - Trial = 3280/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.820 | DEBUG    | __main__:trials:29 - Trial = 3280/30000 | Total reward = 57.11
2022-01-26 14:16:39.824 | DEBUG    | __main__:trials:24 - Trial = 3281/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.825 | DEBUG    | __main__:trials:29 - Trial = 3281/30000 | Total reward = 56.37
2022-01-26 14:16:39.829 | DEBUG    | __main__:trials:24 - Trial = 3282/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.831 | DEBUG    | __main__:trials:29 - Trial = 3282/30000 | Total reward = 54.21
2022-01-26 14:16:39.835 | DEBUG    | __main__:trials:24 - Trial = 3283/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.837 | DEBUG    | __main__:trials:29 - Trial = 3283/30000 | Total reward = 38.76
2022-01-26 14:16:39.841 | DEBUG    | __main__:trials:24 - Trial = 3284/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.843 | DEBUG    | __main__:trials:29 - Trial = 3284/30000 | Total reward = 53.33
2022-01-26 14:16:39.847 | DEBUG    | __main__:trials:24 - Trial = 3285/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.848 | DEBUG    | __main__:trials:29 - Trial = 3285/30000 | Total reward = 48.90
2022-01-26 14:16:39.852 | DEBUG    | __main__:trials:24 - Trial = 3286/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.854 | DEBUG    | __main__:trials:29 - Trial = 3286/30000 | Total reward = 37.03
2022-01-26 14:16:39.858 | DEBUG    | __main__:trials:24 - Trial = 3287/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.859 | DEBUG    | __main__:trials:29 - Trial = 3287/30000 | Total reward = 52.36
2022-01-26 14:16:39.863 | DEBUG    | __main__:trials:24 - Trial = 3288/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.864 | DEBUG    | __main__:trials:29 - Trial = 3288/30000 | Total reward = 37.78
2022-01-26 14:16:39.868 | DEBUG    | __main__:trials:24 - Trial = 3289/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.870 | DEBUG    | __main__:trials:29 - Trial = 3289/30000 | Total reward = 45.72
2022-01-26 14:16:39.874 | DEBUG    | __main__:trials:24 - Trial = 3290/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.875 | DEBUG    | __main__:trials:29 - Trial = 3290/30000 | Total reward = 49.06
2022-01-26 14:16:39.879 | DEBUG    | __main__:trials:24 - Trial = 3291/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.881 | DEBUG    | __main__:trials:29 - Trial = 3291/30000 | Total reward = 36.54
2022-01-26 14:16:39.885 | DEBUG    | __main__:trials:24 - Trial = 3292/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.886 | DEBUG    | __main__:trials:29 - Trial = 3292/30000 | Total reward = 39.15
2022-01-26 14:16:39.890 | DEBUG    | __main__:trials:24 - Trial = 3293/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.892 | DEBUG    | __main__:trials:29 - Trial = 3293/30000 | Total reward = 30.21
2022-01-26 14:16:39.894 | DEBUG    | __main__:trials:26 - Trial = 3294/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:39.896 | DEBUG    | __main__:trials:29 - Trial = 3294/30000 | Total reward = 18.51
2022-01-26 14:16:39.900 | DEBUG    | __main__:trials:24 - Trial = 3295/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.901 | DEBUG    | __main__:trials:29 - Trial = 3295/30000 | Total reward = 56.44
2022-01-26 14:16:39.904 | DEBUG    | __main__:trials:24 - Trial = 3296/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.905 | DEBUG    | __main__:trials:29 - Trial = 3296/30000 | Total reward = 35.16
2022-01-26 14:16:39.909 | DEBUG    | __main__:trials:24 - Trial = 3297/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.909 | DEBUG    | __main__:trials:29 - Trial = 3297/30000 | Total reward = 51.99
2022-01-26 14:16:39.914 | DEBUG    | __main__:trials:24 - Trial = 3298/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.916 | DEBUG    | __main__:trials:29 - Trial = 3298/30000 | Total reward = 52.92
2022-01-26 14:16:39.919 | DEBUG    | __main__:trials:24 - Trial = 3299/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.921 | DEBUG    | __main__:trials:29 - Trial = 3299/30000 | Total reward = 45.92
2022-01-26 14:16:39.924 | DEBUG    | __main__:trials:24 - Trial = 3300/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.926 | DEBUG    | __main__:trials:29 - Trial = 3300/30000 | Total reward = 55.49
2022-01-26 14:16:39.929 | DEBUG    | __main__:trials:24 - Trial = 3301/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.930 | DEBUG    | __main__:trials:29 - Trial = 3301/30000 | Total reward = 40.30
2022-01-26 14:16:39.933 | DEBUG    | __main__:trials:24 - Trial = 3302/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.935 | DEBUG    | __main__:trials:29 - Trial = 3302/30000 | Total reward = 41.15
2022-01-26 14:16:39.938 | DEBUG    | __main__:trials:24 - Trial = 3303/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.940 | DEBUG    | __main__:trials:29 - Trial = 3303/30000 | Total reward = 53.96
2022-01-26 14:16:39.943 | DEBUG    | __main__:trials:24 - Trial = 3304/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.945 | DEBUG    | __main__:trials:29 - Trial = 3304/30000 | Total reward = 59.13
2022-01-26 14:16:39.948 | DEBUG    | __main__:trials:24 - Trial = 3305/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.950 | DEBUG    | __main__:trials:29 - Trial = 3305/30000 | Total reward = 35.85
2022-01-26 14:16:39.954 | DEBUG    | __main__:trials:24 - Trial = 3306/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.955 | DEBUG    | __main__:trials:29 - Trial = 3306/30000 | Total reward = 35.06
2022-01-26 14:16:39.959 | DEBUG    | __main__:trials:24 - Trial = 3307/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.960 | DEBUG    | __main__:trials:29 - Trial = 3307/30000 | Total reward = 40.15
2022-01-26 14:16:39.963 | DEBUG    | __main__:trials:24 - Trial = 3308/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.965 | DEBUG    | __main__:trials:29 - Trial = 3308/30000 | Total reward = 56.13
2022-01-26 14:16:39.969 | DEBUG    | __main__:trials:24 - Trial = 3309/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.975 | DEBUG    | __main__:trials:29 - Trial = 3309/30000 | Total reward = 57.00
2022-01-26 14:16:39.984 | DEBUG    | __main__:trials:24 - Trial = 3310/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.984 | DEBUG    | __main__:trials:29 - Trial = 3310/30000 | Total reward = 6.49
2022-01-26 14:16:39.988 | DEBUG    | __main__:trials:24 - Trial = 3311/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.989 | DEBUG    | __main__:trials:29 - Trial = 3311/30000 | Total reward = 52.25
2022-01-26 14:16:39.993 | DEBUG    | __main__:trials:24 - Trial = 3312/30000 | Max number of steps (20) reached
2022-01-26 14:16:39.993 | DEBUG    | __main__:trials:29 - Trial = 3312/30000 | Total reward = 55.84
2022-01-26 14:16:39.998 | DEBUG    | __main__:trials:24 - Trial = 3313/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.000 | DEBUG    | __main__:trials:29 - Trial = 3313/30000 | Total reward = 52.37
2022-01-26 14:16:40.003 | DEBUG    | __main__:trials:26 - Trial = 3314/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.004 | DEBUG    | __main__:trials:29 - Trial = 3314/30000 | Total reward = 17.22
2022-01-26 14:16:40.008 | DEBUG    | __main__:trials:24 - Trial = 3315/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.010 | DEBUG    | __main__:trials:29 - Trial = 3315/30000 | Total reward = 39.80
2022-01-26 14:16:40.013 | DEBUG    | __main__:trials:26 - Trial = 3316/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.013 | DEBUG    | __main__:trials:29 - Trial = 3316/30000 | Total reward = 13.84
2022-01-26 14:16:40.017 | DEBUG    | __main__:trials:24 - Trial = 3317/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.017 | DEBUG    | __main__:trials:29 - Trial = 3317/30000 | Total reward = 45.72
2022-01-26 14:16:40.022 | DEBUG    | __main__:trials:24 - Trial = 3318/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.023 | DEBUG    | __main__:trials:29 - Trial = 3318/30000 | Total reward = 46.98
2022-01-26 14:16:40.026 | DEBUG    | __main__:trials:24 - Trial = 3319/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.028 | DEBUG    | __main__:trials:29 - Trial = 3319/30000 | Total reward = 32.91
2022-01-26 14:16:40.032 | DEBUG    | __main__:trials:24 - Trial = 3320/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.034 | DEBUG    | __main__:trials:29 - Trial = 3320/30000 | Total reward = 40.18
2022-01-26 14:16:40.038 | DEBUG    | __main__:trials:24 - Trial = 3321/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.039 | DEBUG    | __main__:trials:29 - Trial = 3321/30000 | Total reward = 57.22
2022-01-26 14:16:40.043 | DEBUG    | __main__:trials:24 - Trial = 3322/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.044 | DEBUG    | __main__:trials:29 - Trial = 3322/30000 | Total reward = 30.13
2022-01-26 14:16:40.048 | DEBUG    | __main__:trials:24 - Trial = 3323/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.049 | DEBUG    | __main__:trials:29 - Trial = 3323/30000 | Total reward = 60.90
2022-01-26 14:16:40.052 | DEBUG    | __main__:trials:24 - Trial = 3324/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.053 | DEBUG    | __main__:trials:29 - Trial = 3324/30000 | Total reward = 51.48
2022-01-26 14:16:40.056 | DEBUG    | __main__:trials:26 - Trial = 3325/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.058 | DEBUG    | __main__:trials:29 - Trial = 3325/30000 | Total reward = 17.39
2022-01-26 14:16:40.062 | DEBUG    | __main__:trials:24 - Trial = 3326/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.063 | DEBUG    | __main__:trials:29 - Trial = 3326/30000 | Total reward = 55.33
2022-01-26 14:16:40.066 | DEBUG    | __main__:trials:24 - Trial = 3327/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.068 | DEBUG    | __main__:trials:29 - Trial = 3327/30000 | Total reward = 49.70
2022-01-26 14:16:40.073 | DEBUG    | __main__:trials:24 - Trial = 3328/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.074 | DEBUG    | __main__:trials:29 - Trial = 3328/30000 | Total reward = 58.49
2022-01-26 14:16:40.078 | DEBUG    | __main__:trials:24 - Trial = 3329/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.080 | DEBUG    | __main__:trials:29 - Trial = 3329/30000 | Total reward = 56.37
2022-01-26 14:16:40.083 | DEBUG    | __main__:trials:24 - Trial = 3330/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.084 | DEBUG    | __main__:trials:29 - Trial = 3330/30000 | Total reward = 40.29
2022-01-26 14:16:40.089 | DEBUG    | __main__:trials:24 - Trial = 3331/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.089 | DEBUG    | __main__:trials:29 - Trial = 3331/30000 | Total reward = 44.12
2022-01-26 14:16:40.093 | DEBUG    | __main__:trials:24 - Trial = 3332/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.093 | DEBUG    | __main__:trials:29 - Trial = 3332/30000 | Total reward = 49.50
2022-01-26 14:16:40.097 | DEBUG    | __main__:trials:24 - Trial = 3333/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.099 | DEBUG    | __main__:trials:29 - Trial = 3333/30000 | Total reward = 48.02
2022-01-26 14:16:40.102 | DEBUG    | __main__:trials:26 - Trial = 3334/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.103 | DEBUG    | __main__:trials:29 - Trial = 3334/30000 | Total reward = 31.61
2022-01-26 14:16:40.107 | DEBUG    | __main__:trials:24 - Trial = 3335/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.109 | DEBUG    | __main__:trials:29 - Trial = 3335/30000 | Total reward = 50.77
2022-01-26 14:16:40.112 | DEBUG    | __main__:trials:24 - Trial = 3336/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.114 | DEBUG    | __main__:trials:29 - Trial = 3336/30000 | Total reward = 44.62
2022-01-26 14:16:40.118 | DEBUG    | __main__:trials:24 - Trial = 3337/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.119 | DEBUG    | __main__:trials:29 - Trial = 3337/30000 | Total reward = 55.09
2022-01-26 14:16:40.123 | DEBUG    | __main__:trials:24 - Trial = 3338/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.124 | DEBUG    | __main__:trials:29 - Trial = 3338/30000 | Total reward = 50.22
2022-01-26 14:16:40.126 | DEBUG    | __main__:trials:26 - Trial = 3339/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.128 | DEBUG    | __main__:trials:29 - Trial = 3339/30000 | Total reward = 13.84
2022-01-26 14:16:40.131 | DEBUG    | __main__:trials:24 - Trial = 3340/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.133 | DEBUG    | __main__:trials:29 - Trial = 3340/30000 | Total reward = 50.45
2022-01-26 14:16:40.137 | DEBUG    | __main__:trials:24 - Trial = 3341/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.138 | DEBUG    | __main__:trials:29 - Trial = 3341/30000 | Total reward = 45.98
2022-01-26 14:16:40.142 | DEBUG    | __main__:trials:24 - Trial = 3342/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.144 | DEBUG    | __main__:trials:29 - Trial = 3342/30000 | Total reward = 48.22
2022-01-26 14:16:40.147 | DEBUG    | __main__:trials:24 - Trial = 3343/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.149 | DEBUG    | __main__:trials:29 - Trial = 3343/30000 | Total reward = 50.99
2022-01-26 14:16:40.152 | DEBUG    | __main__:trials:24 - Trial = 3344/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.153 | DEBUG    | __main__:trials:29 - Trial = 3344/30000 | Total reward = 35.09
2022-01-26 14:16:40.156 | DEBUG    | __main__:trials:24 - Trial = 3345/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.157 | DEBUG    | __main__:trials:29 - Trial = 3345/30000 | Total reward = 57.42
2022-01-26 14:16:40.161 | DEBUG    | __main__:trials:24 - Trial = 3346/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.161 | DEBUG    | __main__:trials:29 - Trial = 3346/30000 | Total reward = 48.45
2022-01-26 14:16:40.166 | DEBUG    | __main__:trials:24 - Trial = 3347/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.166 | DEBUG    | __main__:trials:29 - Trial = 3347/30000 | Total reward = 51.20
2022-01-26 14:16:40.170 | DEBUG    | __main__:trials:24 - Trial = 3348/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.172 | DEBUG    | __main__:trials:29 - Trial = 3348/30000 | Total reward = 45.52
2022-01-26 14:16:40.176 | DEBUG    | __main__:trials:24 - Trial = 3349/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.177 | DEBUG    | __main__:trials:29 - Trial = 3349/30000 | Total reward = 50.25
2022-01-26 14:16:40.181 | DEBUG    | __main__:trials:24 - Trial = 3350/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.182 | DEBUG    | __main__:trials:29 - Trial = 3350/30000 | Total reward = 36.12
2022-01-26 14:16:40.185 | DEBUG    | __main__:trials:24 - Trial = 3351/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.187 | DEBUG    | __main__:trials:29 - Trial = 3351/30000 | Total reward = 60.45
2022-01-26 14:16:40.190 | DEBUG    | __main__:trials:24 - Trial = 3352/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.191 | DEBUG    | __main__:trials:29 - Trial = 3352/30000 | Total reward = 61.09
2022-01-26 14:16:40.194 | DEBUG    | __main__:trials:26 - Trial = 3353/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.196 | DEBUG    | __main__:trials:29 - Trial = 3353/30000 | Total reward = 19.94
2022-01-26 14:16:40.200 | DEBUG    | __main__:trials:24 - Trial = 3354/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.201 | DEBUG    | __main__:trials:29 - Trial = 3354/30000 | Total reward = 60.04
2022-01-26 14:16:40.204 | DEBUG    | __main__:trials:24 - Trial = 3355/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.206 | DEBUG    | __main__:trials:29 - Trial = 3355/30000 | Total reward = 50.09
2022-01-26 14:16:40.209 | DEBUG    | __main__:trials:24 - Trial = 3356/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.212 | DEBUG    | __main__:trials:29 - Trial = 3356/30000 | Total reward = 58.33
2022-01-26 14:16:40.216 | DEBUG    | __main__:trials:24 - Trial = 3357/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.217 | DEBUG    | __main__:trials:29 - Trial = 3357/30000 | Total reward = 54.76
2022-01-26 14:16:40.221 | DEBUG    | __main__:trials:24 - Trial = 3358/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.223 | DEBUG    | __main__:trials:29 - Trial = 3358/30000 | Total reward = 45.34
2022-01-26 14:16:40.227 | DEBUG    | __main__:trials:24 - Trial = 3359/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.228 | DEBUG    | __main__:trials:29 - Trial = 3359/30000 | Total reward = 56.03
2022-01-26 14:16:40.231 | DEBUG    | __main__:trials:24 - Trial = 3360/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.233 | DEBUG    | __main__:trials:29 - Trial = 3360/30000 | Total reward = 26.06
2022-01-26 14:16:40.236 | DEBUG    | __main__:trials:24 - Trial = 3361/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.238 | DEBUG    | __main__:trials:29 - Trial = 3361/30000 | Total reward = 31.72
2022-01-26 14:16:40.242 | DEBUG    | __main__:trials:24 - Trial = 3362/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.244 | DEBUG    | __main__:trials:29 - Trial = 3362/30000 | Total reward = 48.00
2022-01-26 14:16:40.246 | DEBUG    | __main__:trials:24 - Trial = 3363/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.248 | DEBUG    | __main__:trials:29 - Trial = 3363/30000 | Total reward = 50.03
2022-01-26 14:16:40.252 | DEBUG    | __main__:trials:24 - Trial = 3364/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.253 | DEBUG    | __main__:trials:29 - Trial = 3364/30000 | Total reward = 50.79
2022-01-26 14:16:40.257 | DEBUG    | __main__:trials:24 - Trial = 3365/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.258 | DEBUG    | __main__:trials:29 - Trial = 3365/30000 | Total reward = 44.99
2022-01-26 14:16:40.262 | DEBUG    | __main__:trials:24 - Trial = 3366/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.263 | DEBUG    | __main__:trials:29 - Trial = 3366/30000 | Total reward = 46.92
2022-01-26 14:16:40.267 | DEBUG    | __main__:trials:24 - Trial = 3367/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.269 | DEBUG    | __main__:trials:29 - Trial = 3367/30000 | Total reward = 52.49
2022-01-26 14:16:40.272 | DEBUG    | __main__:trials:24 - Trial = 3368/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.274 | DEBUG    | __main__:trials:29 - Trial = 3368/30000 | Total reward = 30.75
2022-01-26 14:16:40.278 | DEBUG    | __main__:trials:24 - Trial = 3369/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.279 | DEBUG    | __main__:trials:29 - Trial = 3369/30000 | Total reward = 52.09
2022-01-26 14:16:40.283 | DEBUG    | __main__:trials:24 - Trial = 3370/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.284 | DEBUG    | __main__:trials:29 - Trial = 3370/30000 | Total reward = 50.96
2022-01-26 14:16:40.288 | DEBUG    | __main__:trials:24 - Trial = 3371/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.289 | DEBUG    | __main__:trials:29 - Trial = 3371/30000 | Total reward = 52.39
2022-01-26 14:16:40.293 | DEBUG    | __main__:trials:24 - Trial = 3372/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.294 | DEBUG    | __main__:trials:29 - Trial = 3372/30000 | Total reward = 47.31
2022-01-26 14:16:40.297 | DEBUG    | __main__:trials:26 - Trial = 3373/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.299 | DEBUG    | __main__:trials:29 - Trial = 3373/30000 | Total reward = 21.69
2022-01-26 14:16:40.303 | DEBUG    | __main__:trials:24 - Trial = 3374/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.304 | DEBUG    | __main__:trials:29 - Trial = 3374/30000 | Total reward = 58.36
2022-01-26 14:16:40.308 | DEBUG    | __main__:trials:24 - Trial = 3375/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.310 | DEBUG    | __main__:trials:29 - Trial = 3375/30000 | Total reward = 56.74
2022-01-26 14:16:40.314 | DEBUG    | __main__:trials:24 - Trial = 3376/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.315 | DEBUG    | __main__:trials:29 - Trial = 3376/30000 | Total reward = 52.45
2022-01-26 14:16:40.319 | DEBUG    | __main__:trials:24 - Trial = 3377/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.321 | DEBUG    | __main__:trials:29 - Trial = 3377/30000 | Total reward = 10.11
2022-01-26 14:16:40.324 | DEBUG    | __main__:trials:24 - Trial = 3378/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.326 | DEBUG    | __main__:trials:29 - Trial = 3378/30000 | Total reward = 45.90
2022-01-26 14:16:40.330 | DEBUG    | __main__:trials:24 - Trial = 3379/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.331 | DEBUG    | __main__:trials:29 - Trial = 3379/30000 | Total reward = 44.56
2022-01-26 14:16:40.335 | DEBUG    | __main__:trials:24 - Trial = 3380/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.336 | DEBUG    | __main__:trials:29 - Trial = 3380/30000 | Total reward = 38.75
2022-01-26 14:16:40.340 | DEBUG    | __main__:trials:24 - Trial = 3381/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.342 | DEBUG    | __main__:trials:29 - Trial = 3381/30000 | Total reward = 53.25
2022-01-26 14:16:40.345 | DEBUG    | __main__:trials:24 - Trial = 3382/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.346 | DEBUG    | __main__:trials:29 - Trial = 3382/30000 | Total reward = 57.44
2022-01-26 14:16:40.351 | DEBUG    | __main__:trials:24 - Trial = 3383/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.353 | DEBUG    | __main__:trials:29 - Trial = 3383/30000 | Total reward = 55.42
2022-01-26 14:16:40.357 | DEBUG    | __main__:trials:24 - Trial = 3384/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.357 | DEBUG    | __main__:trials:29 - Trial = 3384/30000 | Total reward = 39.53
2022-01-26 14:16:40.362 | DEBUG    | __main__:trials:24 - Trial = 3385/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.363 | DEBUG    | __main__:trials:29 - Trial = 3385/30000 | Total reward = 40.05
2022-01-26 14:16:40.367 | DEBUG    | __main__:trials:24 - Trial = 3386/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.368 | DEBUG    | __main__:trials:29 - Trial = 3386/30000 | Total reward = 56.55
2022-01-26 14:16:40.372 | DEBUG    | __main__:trials:24 - Trial = 3387/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.374 | DEBUG    | __main__:trials:29 - Trial = 3387/30000 | Total reward = 51.55
2022-01-26 14:16:40.377 | DEBUG    | __main__:trials:26 - Trial = 3388/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.379 | DEBUG    | __main__:trials:29 - Trial = 3388/30000 | Total reward = 20.81
2022-01-26 14:16:40.383 | DEBUG    | __main__:trials:24 - Trial = 3389/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.384 | DEBUG    | __main__:trials:29 - Trial = 3389/30000 | Total reward = 33.35
2022-01-26 14:16:40.388 | DEBUG    | __main__:trials:24 - Trial = 3390/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.390 | DEBUG    | __main__:trials:29 - Trial = 3390/30000 | Total reward = 53.39
2022-01-26 14:16:40.393 | DEBUG    | __main__:trials:24 - Trial = 3391/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.394 | DEBUG    | __main__:trials:29 - Trial = 3391/30000 | Total reward = 51.57
2022-01-26 14:16:40.397 | DEBUG    | __main__:trials:26 - Trial = 3392/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.398 | DEBUG    | __main__:trials:29 - Trial = 3392/30000 | Total reward = 22.44
2022-01-26 14:16:40.402 | DEBUG    | __main__:trials:24 - Trial = 3393/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.403 | DEBUG    | __main__:trials:29 - Trial = 3393/30000 | Total reward = 48.69
2022-01-26 14:16:40.407 | DEBUG    | __main__:trials:24 - Trial = 3394/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.407 | DEBUG    | __main__:trials:29 - Trial = 3394/30000 | Total reward = 50.83
2022-01-26 14:16:40.412 | DEBUG    | __main__:trials:24 - Trial = 3395/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.413 | DEBUG    | __main__:trials:29 - Trial = 3395/30000 | Total reward = 52.02
2022-01-26 14:16:40.416 | DEBUG    | __main__:trials:24 - Trial = 3396/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.417 | DEBUG    | __main__:trials:29 - Trial = 3396/30000 | Total reward = 36.05
2022-01-26 14:16:40.421 | DEBUG    | __main__:trials:24 - Trial = 3397/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.421 | DEBUG    | __main__:trials:29 - Trial = 3397/30000 | Total reward = 28.82
2022-01-26 14:16:40.426 | DEBUG    | __main__:trials:24 - Trial = 3398/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.427 | DEBUG    | __main__:trials:29 - Trial = 3398/30000 | Total reward = 41.01
2022-01-26 14:16:40.431 | DEBUG    | __main__:trials:24 - Trial = 3399/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.433 | DEBUG    | __main__:trials:29 - Trial = 3399/30000 | Total reward = 47.96
2022-01-26 14:16:40.436 | DEBUG    | __main__:trials:24 - Trial = 3400/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.438 | DEBUG    | __main__:trials:29 - Trial = 3400/30000 | Total reward = 47.52
2022-01-26 14:16:40.442 | DEBUG    | __main__:trials:24 - Trial = 3401/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.443 | DEBUG    | __main__:trials:29 - Trial = 3401/30000 | Total reward = 41.78
2022-01-26 14:16:40.447 | DEBUG    | __main__:trials:24 - Trial = 3402/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.448 | DEBUG    | __main__:trials:29 - Trial = 3402/30000 | Total reward = 46.85
2022-01-26 14:16:40.452 | DEBUG    | __main__:trials:24 - Trial = 3403/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.453 | DEBUG    | __main__:trials:29 - Trial = 3403/30000 | Total reward = 43.90
2022-01-26 14:16:40.456 | DEBUG    | __main__:trials:24 - Trial = 3404/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.458 | DEBUG    | __main__:trials:29 - Trial = 3404/30000 | Total reward = 42.53
2022-01-26 14:16:40.462 | DEBUG    | __main__:trials:24 - Trial = 3405/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.463 | DEBUG    | __main__:trials:29 - Trial = 3405/30000 | Total reward = 27.84
2022-01-26 14:16:40.466 | DEBUG    | __main__:trials:24 - Trial = 3406/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.467 | DEBUG    | __main__:trials:29 - Trial = 3406/30000 | Total reward = 40.81
2022-01-26 14:16:40.471 | DEBUG    | __main__:trials:24 - Trial = 3407/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.472 | DEBUG    | __main__:trials:29 - Trial = 3407/30000 | Total reward = 46.55
2022-01-26 14:16:40.475 | DEBUG    | __main__:trials:24 - Trial = 3408/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.477 | DEBUG    | __main__:trials:29 - Trial = 3408/30000 | Total reward = 33.77
2022-01-26 14:16:40.481 | DEBUG    | __main__:trials:24 - Trial = 3409/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.483 | DEBUG    | __main__:trials:29 - Trial = 3409/30000 | Total reward = 49.54
2022-01-26 14:16:40.487 | DEBUG    | __main__:trials:24 - Trial = 3410/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.487 | DEBUG    | __main__:trials:29 - Trial = 3410/30000 | Total reward = 54.47
2022-01-26 14:16:40.492 | DEBUG    | __main__:trials:24 - Trial = 3411/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.493 | DEBUG    | __main__:trials:29 - Trial = 3411/30000 | Total reward = 59.06
2022-01-26 14:16:40.497 | DEBUG    | __main__:trials:24 - Trial = 3412/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.498 | DEBUG    | __main__:trials:29 - Trial = 3412/30000 | Total reward = 50.69
2022-01-26 14:16:40.501 | DEBUG    | __main__:trials:24 - Trial = 3413/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.502 | DEBUG    | __main__:trials:29 - Trial = 3413/30000 | Total reward = 48.39
2022-01-26 14:16:40.506 | DEBUG    | __main__:trials:24 - Trial = 3414/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.507 | DEBUG    | __main__:trials:29 - Trial = 3414/30000 | Total reward = 32.48
2022-01-26 14:16:40.511 | DEBUG    | __main__:trials:26 - Trial = 3415/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.512 | DEBUG    | __main__:trials:29 - Trial = 3415/30000 | Total reward = 27.49
2022-01-26 14:16:40.516 | DEBUG    | __main__:trials:24 - Trial = 3416/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.518 | DEBUG    | __main__:trials:29 - Trial = 3416/30000 | Total reward = 38.52
2022-01-26 14:16:40.522 | DEBUG    | __main__:trials:24 - Trial = 3417/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.523 | DEBUG    | __main__:trials:29 - Trial = 3417/30000 | Total reward = 40.67
2022-01-26 14:16:40.527 | DEBUG    | __main__:trials:24 - Trial = 3418/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.528 | DEBUG    | __main__:trials:29 - Trial = 3418/30000 | Total reward = 40.83
2022-01-26 14:16:40.532 | DEBUG    | __main__:trials:24 - Trial = 3419/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.533 | DEBUG    | __main__:trials:29 - Trial = 3419/30000 | Total reward = 42.49
2022-01-26 14:16:40.536 | DEBUG    | __main__:trials:26 - Trial = 3420/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.538 | DEBUG    | __main__:trials:29 - Trial = 3420/30000 | Total reward = 13.11
2022-01-26 14:16:40.541 | DEBUG    | __main__:trials:24 - Trial = 3421/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.543 | DEBUG    | __main__:trials:29 - Trial = 3421/30000 | Total reward = 42.24
2022-01-26 14:16:40.547 | DEBUG    | __main__:trials:24 - Trial = 3422/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.548 | DEBUG    | __main__:trials:29 - Trial = 3422/30000 | Total reward = 45.96
2022-01-26 14:16:40.552 | DEBUG    | __main__:trials:24 - Trial = 3423/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.554 | DEBUG    | __main__:trials:29 - Trial = 3423/30000 | Total reward = 30.23
2022-01-26 14:16:40.557 | DEBUG    | __main__:trials:26 - Trial = 3424/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.557 | DEBUG    | __main__:trials:29 - Trial = 3424/30000 | Total reward = 22.22
2022-01-26 14:16:40.561 | DEBUG    | __main__:trials:24 - Trial = 3425/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.563 | DEBUG    | __main__:trials:29 - Trial = 3425/30000 | Total reward = 49.40
2022-01-26 14:16:40.566 | DEBUG    | __main__:trials:24 - Trial = 3426/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.568 | DEBUG    | __main__:trials:29 - Trial = 3426/30000 | Total reward = 46.90
2022-01-26 14:16:40.571 | DEBUG    | __main__:trials:24 - Trial = 3427/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.573 | DEBUG    | __main__:trials:29 - Trial = 3427/30000 | Total reward = 32.57
2022-01-26 14:16:40.577 | DEBUG    | __main__:trials:24 - Trial = 3428/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.578 | DEBUG    | __main__:trials:29 - Trial = 3428/30000 | Total reward = 57.88
2022-01-26 14:16:40.581 | DEBUG    | __main__:trials:24 - Trial = 3429/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.582 | DEBUG    | __main__:trials:29 - Trial = 3429/30000 | Total reward = 49.36
2022-01-26 14:16:40.586 | DEBUG    | __main__:trials:26 - Trial = 3430/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.587 | DEBUG    | __main__:trials:29 - Trial = 3430/30000 | Total reward = 22.30
2022-01-26 14:16:40.589 | DEBUG    | __main__:trials:26 - Trial = 3431/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.590 | DEBUG    | __main__:trials:29 - Trial = 3431/30000 | Total reward = 18.36
2022-01-26 14:16:40.593 | DEBUG    | __main__:trials:26 - Trial = 3432/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.594 | DEBUG    | __main__:trials:29 - Trial = 3432/30000 | Total reward = 15.49
2022-01-26 14:16:40.598 | DEBUG    | __main__:trials:24 - Trial = 3433/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.599 | DEBUG    | __main__:trials:29 - Trial = 3433/30000 | Total reward = 38.61
2022-01-26 14:16:40.603 | DEBUG    | __main__:trials:24 - Trial = 3434/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.605 | DEBUG    | __main__:trials:29 - Trial = 3434/30000 | Total reward = 33.76
2022-01-26 14:16:40.608 | DEBUG    | __main__:trials:26 - Trial = 3435/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.610 | DEBUG    | __main__:trials:29 - Trial = 3435/30000 | Total reward = 27.49
2022-01-26 14:16:40.613 | DEBUG    | __main__:trials:24 - Trial = 3436/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.613 | DEBUG    | __main__:trials:29 - Trial = 3436/30000 | Total reward = 42.03
2022-01-26 14:16:40.618 | DEBUG    | __main__:trials:24 - Trial = 3437/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.619 | DEBUG    | __main__:trials:29 - Trial = 3437/30000 | Total reward = 38.13
2022-01-26 14:16:40.622 | DEBUG    | __main__:trials:24 - Trial = 3438/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.624 | DEBUG    | __main__:trials:29 - Trial = 3438/30000 | Total reward = 40.49
2022-01-26 14:16:40.628 | DEBUG    | __main__:trials:26 - Trial = 3439/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.629 | DEBUG    | __main__:trials:29 - Trial = 3439/30000 | Total reward = 25.14
2022-01-26 14:16:40.632 | DEBUG    | __main__:trials:26 - Trial = 3440/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.633 | DEBUG    | __main__:trials:29 - Trial = 3440/30000 | Total reward = 17.10
2022-01-26 14:16:40.636 | DEBUG    | __main__:trials:24 - Trial = 3441/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.638 | DEBUG    | __main__:trials:29 - Trial = 3441/30000 | Total reward = 42.40
2022-01-26 14:16:40.642 | DEBUG    | __main__:trials:24 - Trial = 3442/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.643 | DEBUG    | __main__:trials:29 - Trial = 3442/30000 | Total reward = 42.53
2022-01-26 14:16:40.647 | DEBUG    | __main__:trials:24 - Trial = 3443/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.648 | DEBUG    | __main__:trials:29 - Trial = 3443/30000 | Total reward = 49.92
2022-01-26 14:16:40.652 | DEBUG    | __main__:trials:24 - Trial = 3444/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.654 | DEBUG    | __main__:trials:29 - Trial = 3444/30000 | Total reward = 47.16
2022-01-26 14:16:40.658 | DEBUG    | __main__:trials:24 - Trial = 3445/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.659 | DEBUG    | __main__:trials:29 - Trial = 3445/30000 | Total reward = 46.51
2022-01-26 14:16:40.663 | DEBUG    | __main__:trials:24 - Trial = 3446/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.665 | DEBUG    | __main__:trials:29 - Trial = 3446/30000 | Total reward = 36.55
2022-01-26 14:16:40.668 | DEBUG    | __main__:trials:24 - Trial = 3447/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.670 | DEBUG    | __main__:trials:29 - Trial = 3447/30000 | Total reward = 40.76
2022-01-26 14:16:40.673 | DEBUG    | __main__:trials:24 - Trial = 3448/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.674 | DEBUG    | __main__:trials:29 - Trial = 3448/30000 | Total reward = 42.53
2022-01-26 14:16:40.678 | DEBUG    | __main__:trials:24 - Trial = 3449/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.680 | DEBUG    | __main__:trials:29 - Trial = 3449/30000 | Total reward = 37.12
2022-01-26 14:16:40.683 | DEBUG    | __main__:trials:24 - Trial = 3450/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.685 | DEBUG    | __main__:trials:29 - Trial = 3450/30000 | Total reward = 20.95
2022-01-26 14:16:40.688 | DEBUG    | __main__:trials:24 - Trial = 3451/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.689 | DEBUG    | __main__:trials:29 - Trial = 3451/30000 | Total reward = 42.67
2022-01-26 14:16:40.693 | DEBUG    | __main__:trials:24 - Trial = 3452/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.694 | DEBUG    | __main__:trials:29 - Trial = 3452/30000 | Total reward = 42.54
2022-01-26 14:16:40.697 | DEBUG    | __main__:trials:24 - Trial = 3453/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.699 | DEBUG    | __main__:trials:29 - Trial = 3453/30000 | Total reward = 34.78
2022-01-26 14:16:40.701 | DEBUG    | __main__:trials:24 - Trial = 3454/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.703 | DEBUG    | __main__:trials:29 - Trial = 3454/30000 | Total reward = 43.26
2022-01-26 14:16:40.706 | DEBUG    | __main__:trials:26 - Trial = 3455/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.707 | DEBUG    | __main__:trials:29 - Trial = 3455/30000 | Total reward = 19.14
2022-01-26 14:16:40.711 | DEBUG    | __main__:trials:24 - Trial = 3456/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.712 | DEBUG    | __main__:trials:29 - Trial = 3456/30000 | Total reward = 39.00
2022-01-26 14:16:40.715 | DEBUG    | __main__:trials:24 - Trial = 3457/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.717 | DEBUG    | __main__:trials:29 - Trial = 3457/30000 | Total reward = 43.33
2022-01-26 14:16:40.721 | DEBUG    | __main__:trials:24 - Trial = 3458/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.723 | DEBUG    | __main__:trials:29 - Trial = 3458/30000 | Total reward = 18.22
2022-01-26 14:16:40.726 | DEBUG    | __main__:trials:24 - Trial = 3459/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.727 | DEBUG    | __main__:trials:29 - Trial = 3459/30000 | Total reward = 41.32
2022-01-26 14:16:40.732 | DEBUG    | __main__:trials:24 - Trial = 3460/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.733 | DEBUG    | __main__:trials:29 - Trial = 3460/30000 | Total reward = 38.70
2022-01-26 14:16:40.736 | DEBUG    | __main__:trials:24 - Trial = 3461/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.738 | DEBUG    | __main__:trials:29 - Trial = 3461/30000 | Total reward = 45.32
2022-01-26 14:16:40.741 | DEBUG    | __main__:trials:24 - Trial = 3462/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.742 | DEBUG    | __main__:trials:29 - Trial = 3462/30000 | Total reward = 44.27
2022-01-26 14:16:40.745 | DEBUG    | __main__:trials:24 - Trial = 3463/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.746 | DEBUG    | __main__:trials:29 - Trial = 3463/30000 | Total reward = 48.96
2022-01-26 14:16:40.750 | DEBUG    | __main__:trials:24 - Trial = 3464/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.751 | DEBUG    | __main__:trials:29 - Trial = 3464/30000 | Total reward = 51.94
2022-01-26 14:16:40.755 | DEBUG    | __main__:trials:24 - Trial = 3465/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.757 | DEBUG    | __main__:trials:29 - Trial = 3465/30000 | Total reward = 46.40
2022-01-26 14:16:40.760 | DEBUG    | __main__:trials:24 - Trial = 3466/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.762 | DEBUG    | __main__:trials:29 - Trial = 3466/30000 | Total reward = 41.20
2022-01-26 14:16:40.767 | DEBUG    | __main__:trials:24 - Trial = 3467/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.768 | DEBUG    | __main__:trials:29 - Trial = 3467/30000 | Total reward = 43.61
2022-01-26 14:16:40.772 | DEBUG    | __main__:trials:24 - Trial = 3468/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.773 | DEBUG    | __main__:trials:29 - Trial = 3468/30000 | Total reward = 28.62
2022-01-26 14:16:40.777 | DEBUG    | __main__:trials:26 - Trial = 3469/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.778 | DEBUG    | __main__:trials:29 - Trial = 3469/30000 | Total reward = 29.31
2022-01-26 14:16:40.782 | DEBUG    | __main__:trials:24 - Trial = 3470/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.782 | DEBUG    | __main__:trials:29 - Trial = 3470/30000 | Total reward = 42.91
2022-01-26 14:16:40.787 | DEBUG    | __main__:trials:24 - Trial = 3471/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.788 | DEBUG    | __main__:trials:29 - Trial = 3471/30000 | Total reward = 48.68
2022-01-26 14:16:40.792 | DEBUG    | __main__:trials:24 - Trial = 3472/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.794 | DEBUG    | __main__:trials:29 - Trial = 3472/30000 | Total reward = 47.61
2022-01-26 14:16:40.797 | DEBUG    | __main__:trials:24 - Trial = 3473/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.799 | DEBUG    | __main__:trials:29 - Trial = 3473/30000 | Total reward = 35.11
2022-01-26 14:16:40.802 | DEBUG    | __main__:trials:24 - Trial = 3474/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.804 | DEBUG    | __main__:trials:29 - Trial = 3474/30000 | Total reward = 43.15
2022-01-26 14:16:40.807 | DEBUG    | __main__:trials:24 - Trial = 3475/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.808 | DEBUG    | __main__:trials:29 - Trial = 3475/30000 | Total reward = 40.20
2022-01-26 14:16:40.812 | DEBUG    | __main__:trials:24 - Trial = 3476/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.813 | DEBUG    | __main__:trials:29 - Trial = 3476/30000 | Total reward = 48.75
2022-01-26 14:16:40.816 | DEBUG    | __main__:trials:26 - Trial = 3477/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.818 | DEBUG    | __main__:trials:29 - Trial = 3477/30000 | Total reward = 18.80
2022-01-26 14:16:40.821 | DEBUG    | __main__:trials:24 - Trial = 3478/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.822 | DEBUG    | __main__:trials:29 - Trial = 3478/30000 | Total reward = 45.27
2022-01-26 14:16:40.827 | DEBUG    | __main__:trials:24 - Trial = 3479/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.828 | DEBUG    | __main__:trials:29 - Trial = 3479/30000 | Total reward = 43.07
2022-01-26 14:16:40.832 | DEBUG    | __main__:trials:24 - Trial = 3480/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.834 | DEBUG    | __main__:trials:29 - Trial = 3480/30000 | Total reward = 28.57
2022-01-26 14:16:40.838 | DEBUG    | __main__:trials:24 - Trial = 3481/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.838 | DEBUG    | __main__:trials:29 - Trial = 3481/30000 | Total reward = 43.08
2022-01-26 14:16:40.842 | DEBUG    | __main__:trials:24 - Trial = 3482/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.844 | DEBUG    | __main__:trials:29 - Trial = 3482/30000 | Total reward = 47.03
2022-01-26 14:16:40.847 | DEBUG    | __main__:trials:24 - Trial = 3483/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.849 | DEBUG    | __main__:trials:29 - Trial = 3483/30000 | Total reward = 31.27
2022-01-26 14:16:40.852 | DEBUG    | __main__:trials:24 - Trial = 3484/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.853 | DEBUG    | __main__:trials:29 - Trial = 3484/30000 | Total reward = 35.95
2022-01-26 14:16:40.857 | DEBUG    | __main__:trials:24 - Trial = 3485/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.859 | DEBUG    | __main__:trials:29 - Trial = 3485/30000 | Total reward = 35.48
2022-01-26 14:16:40.862 | DEBUG    | __main__:trials:24 - Trial = 3486/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.864 | DEBUG    | __main__:trials:29 - Trial = 3486/30000 | Total reward = 50.23
2022-01-26 14:16:40.867 | DEBUG    | __main__:trials:24 - Trial = 3487/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.869 | DEBUG    | __main__:trials:29 - Trial = 3487/30000 | Total reward = 49.61
2022-01-26 14:16:40.872 | DEBUG    | __main__:trials:24 - Trial = 3488/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.874 | DEBUG    | __main__:trials:29 - Trial = 3488/30000 | Total reward = 44.35
2022-01-26 14:16:40.877 | DEBUG    | __main__:trials:24 - Trial = 3489/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.878 | DEBUG    | __main__:trials:29 - Trial = 3489/30000 | Total reward = 34.78
2022-01-26 14:16:40.883 | DEBUG    | __main__:trials:24 - Trial = 3490/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.884 | DEBUG    | __main__:trials:29 - Trial = 3490/30000 | Total reward = 41.53
2022-01-26 14:16:40.888 | DEBUG    | __main__:trials:24 - Trial = 3491/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.889 | DEBUG    | __main__:trials:29 - Trial = 3491/30000 | Total reward = 39.24
2022-01-26 14:16:40.893 | DEBUG    | __main__:trials:24 - Trial = 3492/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.894 | DEBUG    | __main__:trials:29 - Trial = 3492/30000 | Total reward = 55.16
2022-01-26 14:16:40.898 | DEBUG    | __main__:trials:24 - Trial = 3493/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.900 | DEBUG    | __main__:trials:29 - Trial = 3493/30000 | Total reward = 44.18
2022-01-26 14:16:40.903 | DEBUG    | __main__:trials:26 - Trial = 3494/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.904 | DEBUG    | __main__:trials:29 - Trial = 3494/30000 | Total reward = 20.81
2022-01-26 14:16:40.907 | DEBUG    | __main__:trials:24 - Trial = 3495/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.909 | DEBUG    | __main__:trials:29 - Trial = 3495/30000 | Total reward = 47.06
2022-01-26 14:16:40.912 | DEBUG    | __main__:trials:24 - Trial = 3496/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.914 | DEBUG    | __main__:trials:29 - Trial = 3496/30000 | Total reward = 39.97
2022-01-26 14:16:40.918 | DEBUG    | __main__:trials:24 - Trial = 3497/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.919 | DEBUG    | __main__:trials:29 - Trial = 3497/30000 | Total reward = 47.34
2022-01-26 14:16:40.923 | DEBUG    | __main__:trials:24 - Trial = 3498/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.924 | DEBUG    | __main__:trials:29 - Trial = 3498/30000 | Total reward = 43.86
2022-01-26 14:16:40.928 | DEBUG    | __main__:trials:24 - Trial = 3499/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.930 | DEBUG    | __main__:trials:29 - Trial = 3499/30000 | Total reward = 34.09
2022-01-26 14:16:40.932 | DEBUG    | __main__:trials:26 - Trial = 3500/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.934 | DEBUG    | __main__:trials:29 - Trial = 3500/30000 | Total reward = 17.12
2022-01-26 14:16:40.938 | DEBUG    | __main__:trials:24 - Trial = 3501/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.938 | DEBUG    | __main__:trials:29 - Trial = 3501/30000 | Total reward = 43.94
2022-01-26 14:16:40.943 | DEBUG    | __main__:trials:24 - Trial = 3502/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.944 | DEBUG    | __main__:trials:29 - Trial = 3502/30000 | Total reward = 40.10
2022-01-26 14:16:40.947 | DEBUG    | __main__:trials:24 - Trial = 3503/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.949 | DEBUG    | __main__:trials:29 - Trial = 3503/30000 | Total reward = 45.34
2022-01-26 14:16:40.952 | DEBUG    | __main__:trials:24 - Trial = 3504/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.954 | DEBUG    | __main__:trials:29 - Trial = 3504/30000 | Total reward = 43.45
2022-01-26 14:16:40.957 | DEBUG    | __main__:trials:24 - Trial = 3505/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.958 | DEBUG    | __main__:trials:29 - Trial = 3505/30000 | Total reward = 47.75
2022-01-26 14:16:40.960 | DEBUG    | __main__:trials:26 - Trial = 3506/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.962 | DEBUG    | __main__:trials:29 - Trial = 3506/30000 | Total reward = 17.07
2022-01-26 14:16:40.966 | DEBUG    | __main__:trials:24 - Trial = 3507/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.967 | DEBUG    | __main__:trials:29 - Trial = 3507/30000 | Total reward = 49.20
2022-01-26 14:16:40.970 | DEBUG    | __main__:trials:24 - Trial = 3508/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.972 | DEBUG    | __main__:trials:29 - Trial = 3508/30000 | Total reward = 43.45
2022-01-26 14:16:40.975 | DEBUG    | __main__:trials:24 - Trial = 3509/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.977 | DEBUG    | __main__:trials:29 - Trial = 3509/30000 | Total reward = 49.70
2022-01-26 14:16:40.981 | DEBUG    | __main__:trials:24 - Trial = 3510/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.982 | DEBUG    | __main__:trials:29 - Trial = 3510/30000 | Total reward = 41.99
2022-01-26 14:16:40.986 | DEBUG    | __main__:trials:26 - Trial = 3511/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:40.987 | DEBUG    | __main__:trials:29 - Trial = 3511/30000 | Total reward = 19.73
2022-01-26 14:16:40.991 | DEBUG    | __main__:trials:24 - Trial = 3512/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.993 | DEBUG    | __main__:trials:29 - Trial = 3512/30000 | Total reward = 47.81
2022-01-26 14:16:40.996 | DEBUG    | __main__:trials:24 - Trial = 3513/30000 | Max number of steps (20) reached
2022-01-26 14:16:40.997 | DEBUG    | __main__:trials:29 - Trial = 3513/30000 | Total reward = 44.01
2022-01-26 14:16:41.000 | DEBUG    | __main__:trials:26 - Trial = 3514/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.000 | DEBUG    | __main__:trials:29 - Trial = 3514/30000 | Total reward = 18.51
2022-01-26 14:16:41.004 | DEBUG    | __main__:trials:24 - Trial = 3515/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.005 | DEBUG    | __main__:trials:29 - Trial = 3515/30000 | Total reward = 54.98
2022-01-26 14:16:41.008 | DEBUG    | __main__:trials:24 - Trial = 3516/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.010 | DEBUG    | __main__:trials:29 - Trial = 3516/30000 | Total reward = 47.57
2022-01-26 14:16:41.014 | DEBUG    | __main__:trials:24 - Trial = 3517/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.015 | DEBUG    | __main__:trials:29 - Trial = 3517/30000 | Total reward = 47.71
2022-01-26 14:16:41.018 | DEBUG    | __main__:trials:24 - Trial = 3518/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.020 | DEBUG    | __main__:trials:29 - Trial = 3518/30000 | Total reward = 42.69
2022-01-26 14:16:41.023 | DEBUG    | __main__:trials:24 - Trial = 3519/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.025 | DEBUG    | __main__:trials:29 - Trial = 3519/30000 | Total reward = 39.64
2022-01-26 14:16:41.028 | DEBUG    | __main__:trials:24 - Trial = 3520/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.029 | DEBUG    | __main__:trials:29 - Trial = 3520/30000 | Total reward = 58.11
2022-01-26 14:16:41.034 | DEBUG    | __main__:trials:24 - Trial = 3521/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.035 | DEBUG    | __main__:trials:29 - Trial = 3521/30000 | Total reward = 43.65
2022-01-26 14:16:41.039 | DEBUG    | __main__:trials:24 - Trial = 3522/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.040 | DEBUG    | __main__:trials:29 - Trial = 3522/30000 | Total reward = 48.72
2022-01-26 14:16:41.044 | DEBUG    | __main__:trials:26 - Trial = 3523/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.045 | DEBUG    | __main__:trials:29 - Trial = 3523/30000 | Total reward = 32.23
2022-01-26 14:16:41.048 | DEBUG    | __main__:trials:24 - Trial = 3524/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.050 | DEBUG    | __main__:trials:29 - Trial = 3524/30000 | Total reward = 55.21
2022-01-26 14:16:41.053 | DEBUG    | __main__:trials:24 - Trial = 3525/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.054 | DEBUG    | __main__:trials:29 - Trial = 3525/30000 | Total reward = 57.59
2022-01-26 14:16:41.057 | DEBUG    | __main__:trials:24 - Trial = 3526/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.058 | DEBUG    | __main__:trials:29 - Trial = 3526/30000 | Total reward = 48.80
2022-01-26 14:16:41.061 | DEBUG    | __main__:trials:26 - Trial = 3527/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.063 | DEBUG    | __main__:trials:29 - Trial = 3527/30000 | Total reward = 26.41
2022-01-26 14:16:41.066 | DEBUG    | __main__:trials:24 - Trial = 3528/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.067 | DEBUG    | __main__:trials:29 - Trial = 3528/30000 | Total reward = 40.05
2022-01-26 14:16:41.070 | DEBUG    | __main__:trials:26 - Trial = 3529/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.070 | DEBUG    | __main__:trials:29 - Trial = 3529/30000 | Total reward = 20.17
2022-01-26 14:16:41.073 | DEBUG    | __main__:trials:26 - Trial = 3530/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.075 | DEBUG    | __main__:trials:29 - Trial = 3530/30000 | Total reward = 23.40
2022-01-26 14:16:41.079 | DEBUG    | __main__:trials:24 - Trial = 3531/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.080 | DEBUG    | __main__:trials:29 - Trial = 3531/30000 | Total reward = 44.46
2022-01-26 14:16:41.083 | DEBUG    | __main__:trials:26 - Trial = 3532/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.085 | DEBUG    | __main__:trials:29 - Trial = 3532/30000 | Total reward = 12.51
2022-01-26 14:16:41.088 | DEBUG    | __main__:trials:26 - Trial = 3533/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.090 | DEBUG    | __main__:trials:29 - Trial = 3533/30000 | Total reward = 35.45
2022-01-26 14:16:41.093 | DEBUG    | __main__:trials:24 - Trial = 3534/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.094 | DEBUG    | __main__:trials:29 - Trial = 3534/30000 | Total reward = 32.58
2022-01-26 14:16:41.097 | DEBUG    | __main__:trials:24 - Trial = 3535/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.098 | DEBUG    | __main__:trials:29 - Trial = 3535/30000 | Total reward = 28.65
2022-01-26 14:16:41.101 | DEBUG    | __main__:trials:24 - Trial = 3536/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.103 | DEBUG    | __main__:trials:29 - Trial = 3536/30000 | Total reward = 49.91
2022-01-26 14:16:41.106 | DEBUG    | __main__:trials:24 - Trial = 3537/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.107 | DEBUG    | __main__:trials:29 - Trial = 3537/30000 | Total reward = 32.41
2022-01-26 14:16:41.111 | DEBUG    | __main__:trials:24 - Trial = 3538/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.112 | DEBUG    | __main__:trials:29 - Trial = 3538/30000 | Total reward = 36.58
2022-01-26 14:16:41.115 | DEBUG    | __main__:trials:24 - Trial = 3539/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.117 | DEBUG    | __main__:trials:29 - Trial = 3539/30000 | Total reward = 51.52
2022-01-26 14:16:41.121 | DEBUG    | __main__:trials:24 - Trial = 3540/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.122 | DEBUG    | __main__:trials:29 - Trial = 3540/30000 | Total reward = 54.16
2022-01-26 14:16:41.125 | DEBUG    | __main__:trials:26 - Trial = 3541/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.126 | DEBUG    | __main__:trials:29 - Trial = 3541/30000 | Total reward = 26.41
2022-01-26 14:16:41.130 | DEBUG    | __main__:trials:24 - Trial = 3542/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.131 | DEBUG    | __main__:trials:29 - Trial = 3542/30000 | Total reward = 46.54
2022-01-26 14:16:41.134 | DEBUG    | __main__:trials:24 - Trial = 3543/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.135 | DEBUG    | __main__:trials:29 - Trial = 3543/30000 | Total reward = 48.93
2022-01-26 14:16:41.138 | DEBUG    | __main__:trials:24 - Trial = 3544/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.140 | DEBUG    | __main__:trials:29 - Trial = 3544/30000 | Total reward = 40.38
2022-01-26 14:16:41.144 | DEBUG    | __main__:trials:24 - Trial = 3545/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.144 | DEBUG    | __main__:trials:29 - Trial = 3545/30000 | Total reward = 43.42
2022-01-26 14:16:41.149 | DEBUG    | __main__:trials:24 - Trial = 3546/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.150 | DEBUG    | __main__:trials:29 - Trial = 3546/30000 | Total reward = 40.54
2022-01-26 14:16:41.154 | DEBUG    | __main__:trials:24 - Trial = 3547/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.156 | DEBUG    | __main__:trials:29 - Trial = 3547/30000 | Total reward = 44.10
2022-01-26 14:16:41.159 | DEBUG    | __main__:trials:24 - Trial = 3548/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.161 | DEBUG    | __main__:trials:29 - Trial = 3548/30000 | Total reward = 54.86
2022-01-26 14:16:41.164 | DEBUG    | __main__:trials:24 - Trial = 3549/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.165 | DEBUG    | __main__:trials:29 - Trial = 3549/30000 | Total reward = 35.84
2022-01-26 14:16:41.169 | DEBUG    | __main__:trials:26 - Trial = 3550/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.169 | DEBUG    | __main__:trials:29 - Trial = 3550/30000 | Total reward = 29.30
2022-01-26 14:16:41.173 | DEBUG    | __main__:trials:24 - Trial = 3551/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.174 | DEBUG    | __main__:trials:29 - Trial = 3551/30000 | Total reward = 32.74
2022-01-26 14:16:41.177 | DEBUG    | __main__:trials:26 - Trial = 3552/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.178 | DEBUG    | __main__:trials:29 - Trial = 3552/30000 | Total reward = 14.90
2022-01-26 14:16:41.182 | DEBUG    | __main__:trials:24 - Trial = 3553/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.183 | DEBUG    | __main__:trials:29 - Trial = 3553/30000 | Total reward = 24.68
2022-01-26 14:16:41.187 | DEBUG    | __main__:trials:24 - Trial = 3554/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.189 | DEBUG    | __main__:trials:29 - Trial = 3554/30000 | Total reward = 54.08
2022-01-26 14:16:41.192 | DEBUG    | __main__:trials:24 - Trial = 3555/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.193 | DEBUG    | __main__:trials:29 - Trial = 3555/30000 | Total reward = 42.58
2022-01-26 14:16:41.196 | DEBUG    | __main__:trials:24 - Trial = 3556/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.198 | DEBUG    | __main__:trials:29 - Trial = 3556/30000 | Total reward = 48.48
2022-01-26 14:16:41.200 | DEBUG    | __main__:trials:26 - Trial = 3557/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.200 | DEBUG    | __main__:trials:29 - Trial = 3557/30000 | Total reward = 13.84
2022-01-26 14:16:41.204 | DEBUG    | __main__:trials:24 - Trial = 3558/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.206 | DEBUG    | __main__:trials:29 - Trial = 3558/30000 | Total reward = 43.85
2022-01-26 14:16:41.209 | DEBUG    | __main__:trials:24 - Trial = 3559/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.210 | DEBUG    | __main__:trials:29 - Trial = 3559/30000 | Total reward = 45.01
2022-01-26 14:16:41.214 | DEBUG    | __main__:trials:24 - Trial = 3560/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.215 | DEBUG    | __main__:trials:29 - Trial = 3560/30000 | Total reward = 44.01
2022-01-26 14:16:41.218 | DEBUG    | __main__:trials:24 - Trial = 3561/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.220 | DEBUG    | __main__:trials:29 - Trial = 3561/30000 | Total reward = 43.79
2022-01-26 14:16:41.223 | DEBUG    | __main__:trials:24 - Trial = 3562/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.225 | DEBUG    | __main__:trials:29 - Trial = 3562/30000 | Total reward = 38.48
2022-01-26 14:16:41.228 | DEBUG    | __main__:trials:26 - Trial = 3563/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.229 | DEBUG    | __main__:trials:29 - Trial = 3563/30000 | Total reward = 32.94
2022-01-26 14:16:41.232 | DEBUG    | __main__:trials:26 - Trial = 3564/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.233 | DEBUG    | __main__:trials:29 - Trial = 3564/30000 | Total reward = 25.13
2022-01-26 14:16:41.236 | DEBUG    | __main__:trials:24 - Trial = 3565/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.237 | DEBUG    | __main__:trials:29 - Trial = 3565/30000 | Total reward = 43.65
2022-01-26 14:16:41.240 | DEBUG    | __main__:trials:24 - Trial = 3566/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.241 | DEBUG    | __main__:trials:29 - Trial = 3566/30000 | Total reward = 44.90
2022-01-26 14:16:41.244 | DEBUG    | __main__:trials:24 - Trial = 3567/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.245 | DEBUG    | __main__:trials:29 - Trial = 3567/30000 | Total reward = 33.30
2022-01-26 14:16:41.249 | DEBUG    | __main__:trials:24 - Trial = 3568/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.250 | DEBUG    | __main__:trials:29 - Trial = 3568/30000 | Total reward = 46.90
2022-01-26 14:16:41.253 | DEBUG    | __main__:trials:24 - Trial = 3569/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.254 | DEBUG    | __main__:trials:29 - Trial = 3569/30000 | Total reward = 46.85
2022-01-26 14:16:41.258 | DEBUG    | __main__:trials:24 - Trial = 3570/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.260 | DEBUG    | __main__:trials:29 - Trial = 3570/30000 | Total reward = 45.66
2022-01-26 14:16:41.263 | DEBUG    | __main__:trials:24 - Trial = 3571/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.264 | DEBUG    | __main__:trials:29 - Trial = 3571/30000 | Total reward = 30.42
2022-01-26 14:16:41.268 | DEBUG    | __main__:trials:24 - Trial = 3572/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.270 | DEBUG    | __main__:trials:29 - Trial = 3572/30000 | Total reward = 35.94
2022-01-26 14:16:41.274 | DEBUG    | __main__:trials:24 - Trial = 3573/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.274 | DEBUG    | __main__:trials:29 - Trial = 3573/30000 | Total reward = 47.92
2022-01-26 14:16:41.278 | DEBUG    | __main__:trials:24 - Trial = 3574/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.279 | DEBUG    | __main__:trials:29 - Trial = 3574/30000 | Total reward = 51.05
2022-01-26 14:16:41.283 | DEBUG    | __main__:trials:24 - Trial = 3575/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.285 | DEBUG    | __main__:trials:29 - Trial = 3575/30000 | Total reward = 45.53
2022-01-26 14:16:41.288 | DEBUG    | __main__:trials:24 - Trial = 3576/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.290 | DEBUG    | __main__:trials:29 - Trial = 3576/30000 | Total reward = 46.14
2022-01-26 14:16:41.293 | DEBUG    | __main__:trials:24 - Trial = 3577/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.294 | DEBUG    | __main__:trials:29 - Trial = 3577/30000 | Total reward = 40.58
2022-01-26 14:16:41.298 | DEBUG    | __main__:trials:24 - Trial = 3578/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.300 | DEBUG    | __main__:trials:29 - Trial = 3578/30000 | Total reward = 52.51
2022-01-26 14:16:41.303 | DEBUG    | __main__:trials:24 - Trial = 3579/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.304 | DEBUG    | __main__:trials:29 - Trial = 3579/30000 | Total reward = 40.17
2022-01-26 14:16:41.306 | DEBUG    | __main__:trials:26 - Trial = 3580/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.308 | DEBUG    | __main__:trials:29 - Trial = 3580/30000 | Total reward = 17.46
2022-01-26 14:16:41.312 | DEBUG    | __main__:trials:24 - Trial = 3581/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.312 | DEBUG    | __main__:trials:29 - Trial = 3581/30000 | Total reward = 52.51
2022-01-26 14:16:41.317 | DEBUG    | __main__:trials:24 - Trial = 3582/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.318 | DEBUG    | __main__:trials:29 - Trial = 3582/30000 | Total reward = 42.85
2022-01-26 14:16:41.322 | DEBUG    | __main__:trials:24 - Trial = 3583/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.323 | DEBUG    | __main__:trials:29 - Trial = 3583/30000 | Total reward = 36.40
2022-01-26 14:16:41.327 | DEBUG    | __main__:trials:24 - Trial = 3584/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.329 | DEBUG    | __main__:trials:29 - Trial = 3584/30000 | Total reward = 49.27
2022-01-26 14:16:41.332 | DEBUG    | __main__:trials:24 - Trial = 3585/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.334 | DEBUG    | __main__:trials:29 - Trial = 3585/30000 | Total reward = 47.06
2022-01-26 14:16:41.338 | DEBUG    | __main__:trials:24 - Trial = 3586/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.339 | DEBUG    | __main__:trials:29 - Trial = 3586/30000 | Total reward = 31.51
2022-01-26 14:16:41.343 | DEBUG    | __main__:trials:26 - Trial = 3587/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.344 | DEBUG    | __main__:trials:29 - Trial = 3587/30000 | Total reward = 34.89
2022-01-26 14:16:41.348 | DEBUG    | __main__:trials:24 - Trial = 3588/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.350 | DEBUG    | __main__:trials:29 - Trial = 3588/30000 | Total reward = 35.00
2022-01-26 14:16:41.353 | DEBUG    | __main__:trials:24 - Trial = 3589/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.355 | DEBUG    | __main__:trials:29 - Trial = 3589/30000 | Total reward = 34.40
2022-01-26 14:16:41.359 | DEBUG    | __main__:trials:24 - Trial = 3590/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.360 | DEBUG    | __main__:trials:29 - Trial = 3590/30000 | Total reward = 31.33
2022-01-26 14:16:41.363 | DEBUG    | __main__:trials:24 - Trial = 3591/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.365 | DEBUG    | __main__:trials:29 - Trial = 3591/30000 | Total reward = 46.80
2022-01-26 14:16:41.368 | DEBUG    | __main__:trials:24 - Trial = 3592/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.369 | DEBUG    | __main__:trials:29 - Trial = 3592/30000 | Total reward = 41.74
2022-01-26 14:16:41.374 | DEBUG    | __main__:trials:24 - Trial = 3593/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.375 | DEBUG    | __main__:trials:29 - Trial = 3593/30000 | Total reward = 49.98
2022-01-26 14:16:41.379 | DEBUG    | __main__:trials:24 - Trial = 3594/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.380 | DEBUG    | __main__:trials:29 - Trial = 3594/30000 | Total reward = 45.60
2022-01-26 14:16:41.384 | DEBUG    | __main__:trials:24 - Trial = 3595/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.386 | DEBUG    | __main__:trials:29 - Trial = 3595/30000 | Total reward = 45.68
2022-01-26 14:16:41.390 | DEBUG    | __main__:trials:24 - Trial = 3596/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.390 | DEBUG    | __main__:trials:29 - Trial = 3596/30000 | Total reward = 47.15
2022-01-26 14:16:41.393 | DEBUG    | __main__:trials:26 - Trial = 3597/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.395 | DEBUG    | __main__:trials:29 - Trial = 3597/30000 | Total reward = 13.84
2022-01-26 14:16:41.399 | DEBUG    | __main__:trials:24 - Trial = 3598/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.399 | DEBUG    | __main__:trials:29 - Trial = 3598/30000 | Total reward = 31.53
2022-01-26 14:16:41.404 | DEBUG    | __main__:trials:24 - Trial = 3599/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.405 | DEBUG    | __main__:trials:29 - Trial = 3599/30000 | Total reward = 43.16
2022-01-26 14:16:41.408 | DEBUG    | __main__:trials:24 - Trial = 3600/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.410 | DEBUG    | __main__:trials:29 - Trial = 3600/30000 | Total reward = 50.96
2022-01-26 14:16:41.413 | DEBUG    | __main__:trials:24 - Trial = 3601/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.415 | DEBUG    | __main__:trials:29 - Trial = 3601/30000 | Total reward = 45.96
2022-01-26 14:16:41.418 | DEBUG    | __main__:trials:24 - Trial = 3602/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.420 | DEBUG    | __main__:trials:29 - Trial = 3602/30000 | Total reward = 41.67
2022-01-26 14:16:41.423 | DEBUG    | __main__:trials:24 - Trial = 3603/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.425 | DEBUG    | __main__:trials:29 - Trial = 3603/30000 | Total reward = 27.02
2022-01-26 14:16:41.428 | DEBUG    | __main__:trials:24 - Trial = 3604/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.430 | DEBUG    | __main__:trials:29 - Trial = 3604/30000 | Total reward = 45.32
2022-01-26 14:16:41.433 | DEBUG    | __main__:trials:24 - Trial = 3605/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.434 | DEBUG    | __main__:trials:29 - Trial = 3605/30000 | Total reward = 44.98
2022-01-26 14:16:41.438 | DEBUG    | __main__:trials:24 - Trial = 3606/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.440 | DEBUG    | __main__:trials:29 - Trial = 3606/30000 | Total reward = 39.07
2022-01-26 14:16:41.444 | DEBUG    | __main__:trials:24 - Trial = 3607/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.444 | DEBUG    | __main__:trials:29 - Trial = 3607/30000 | Total reward = 43.69
2022-01-26 14:16:41.449 | DEBUG    | __main__:trials:24 - Trial = 3608/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.451 | DEBUG    | __main__:trials:29 - Trial = 3608/30000 | Total reward = 44.37
2022-01-26 14:16:41.454 | DEBUG    | __main__:trials:24 - Trial = 3609/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.455 | DEBUG    | __main__:trials:29 - Trial = 3609/30000 | Total reward = 42.39
2022-01-26 14:16:41.459 | DEBUG    | __main__:trials:24 - Trial = 3610/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.460 | DEBUG    | __main__:trials:29 - Trial = 3610/30000 | Total reward = 52.51
2022-01-26 14:16:41.464 | DEBUG    | __main__:trials:24 - Trial = 3611/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.466 | DEBUG    | __main__:trials:29 - Trial = 3611/30000 | Total reward = 29.39
2022-01-26 14:16:41.469 | DEBUG    | __main__:trials:24 - Trial = 3612/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.470 | DEBUG    | __main__:trials:29 - Trial = 3612/30000 | Total reward = 46.40
2022-01-26 14:16:41.475 | DEBUG    | __main__:trials:24 - Trial = 3613/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.475 | DEBUG    | __main__:trials:29 - Trial = 3613/30000 | Total reward = 49.32
2022-01-26 14:16:41.479 | DEBUG    | __main__:trials:24 - Trial = 3614/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.481 | DEBUG    | __main__:trials:29 - Trial = 3614/30000 | Total reward = 60.83
2022-01-26 14:16:41.484 | DEBUG    | __main__:trials:24 - Trial = 3615/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.485 | DEBUG    | __main__:trials:29 - Trial = 3615/30000 | Total reward = 56.48
2022-01-26 14:16:41.489 | DEBUG    | __main__:trials:24 - Trial = 3616/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.491 | DEBUG    | __main__:trials:29 - Trial = 3616/30000 | Total reward = 53.40
2022-01-26 14:16:41.494 | DEBUG    | __main__:trials:24 - Trial = 3617/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.495 | DEBUG    | __main__:trials:29 - Trial = 3617/30000 | Total reward = 26.91
2022-01-26 14:16:41.499 | DEBUG    | __main__:trials:24 - Trial = 3618/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.501 | DEBUG    | __main__:trials:29 - Trial = 3618/30000 | Total reward = 49.18
2022-01-26 14:16:41.504 | DEBUG    | __main__:trials:24 - Trial = 3619/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.506 | DEBUG    | __main__:trials:29 - Trial = 3619/30000 | Total reward = 50.32
2022-01-26 14:16:41.510 | DEBUG    | __main__:trials:24 - Trial = 3620/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.510 | DEBUG    | __main__:trials:29 - Trial = 3620/30000 | Total reward = 38.01
2022-01-26 14:16:41.514 | DEBUG    | __main__:trials:24 - Trial = 3621/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.516 | DEBUG    | __main__:trials:29 - Trial = 3621/30000 | Total reward = 48.64
2022-01-26 14:16:41.518 | DEBUG    | __main__:trials:26 - Trial = 3622/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.520 | DEBUG    | __main__:trials:29 - Trial = 3622/30000 | Total reward = 29.85
2022-01-26 14:16:41.524 | DEBUG    | __main__:trials:24 - Trial = 3623/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.525 | DEBUG    | __main__:trials:29 - Trial = 3623/30000 | Total reward = 52.76
2022-01-26 14:16:41.529 | DEBUG    | __main__:trials:24 - Trial = 3624/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.530 | DEBUG    | __main__:trials:29 - Trial = 3624/30000 | Total reward = 40.04
2022-01-26 14:16:41.533 | DEBUG    | __main__:trials:24 - Trial = 3625/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.535 | DEBUG    | __main__:trials:29 - Trial = 3625/30000 | Total reward = 33.92
2022-01-26 14:16:41.539 | DEBUG    | __main__:trials:24 - Trial = 3626/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.540 | DEBUG    | __main__:trials:29 - Trial = 3626/30000 | Total reward = 41.24
2022-01-26 14:16:41.544 | DEBUG    | __main__:trials:24 - Trial = 3627/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.546 | DEBUG    | __main__:trials:29 - Trial = 3627/30000 | Total reward = 44.33
2022-01-26 14:16:41.549 | DEBUG    | __main__:trials:24 - Trial = 3628/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.551 | DEBUG    | __main__:trials:29 - Trial = 3628/30000 | Total reward = 48.58
2022-01-26 14:16:41.554 | DEBUG    | __main__:trials:24 - Trial = 3629/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.556 | DEBUG    | __main__:trials:29 - Trial = 3629/30000 | Total reward = 47.89
2022-01-26 14:16:41.560 | DEBUG    | __main__:trials:24 - Trial = 3630/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.561 | DEBUG    | __main__:trials:29 - Trial = 3630/30000 | Total reward = 49.88
2022-01-26 14:16:41.564 | DEBUG    | __main__:trials:24 - Trial = 3631/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.566 | DEBUG    | __main__:trials:29 - Trial = 3631/30000 | Total reward = 41.65
2022-01-26 14:16:41.570 | DEBUG    | __main__:trials:24 - Trial = 3632/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.570 | DEBUG    | __main__:trials:29 - Trial = 3632/30000 | Total reward = 27.47
2022-01-26 14:16:41.574 | DEBUG    | __main__:trials:24 - Trial = 3633/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.576 | DEBUG    | __main__:trials:29 - Trial = 3633/30000 | Total reward = 59.51
2022-01-26 14:16:41.580 | DEBUG    | __main__:trials:24 - Trial = 3634/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.581 | DEBUG    | __main__:trials:29 - Trial = 3634/30000 | Total reward = 57.20
2022-01-26 14:16:41.585 | DEBUG    | __main__:trials:24 - Trial = 3635/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.586 | DEBUG    | __main__:trials:29 - Trial = 3635/30000 | Total reward = 44.30
2022-01-26 14:16:41.590 | DEBUG    | __main__:trials:24 - Trial = 3636/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.590 | DEBUG    | __main__:trials:29 - Trial = 3636/30000 | Total reward = 58.86
2022-01-26 14:16:41.595 | DEBUG    | __main__:trials:24 - Trial = 3637/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.596 | DEBUG    | __main__:trials:29 - Trial = 3637/30000 | Total reward = 28.91
2022-01-26 14:16:41.600 | DEBUG    | __main__:trials:24 - Trial = 3638/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.602 | DEBUG    | __main__:trials:29 - Trial = 3638/30000 | Total reward = 44.95
2022-01-26 14:16:41.605 | DEBUG    | __main__:trials:26 - Trial = 3639/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.606 | DEBUG    | __main__:trials:29 - Trial = 3639/30000 | Total reward = 18.71
2022-01-26 14:16:41.610 | DEBUG    | __main__:trials:24 - Trial = 3640/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.612 | DEBUG    | __main__:trials:29 - Trial = 3640/30000 | Total reward = 41.83
2022-01-26 14:16:41.615 | DEBUG    | __main__:trials:24 - Trial = 3641/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.617 | DEBUG    | __main__:trials:29 - Trial = 3641/30000 | Total reward = 54.15
2022-01-26 14:16:41.620 | DEBUG    | __main__:trials:26 - Trial = 3642/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.621 | DEBUG    | __main__:trials:29 - Trial = 3642/30000 | Total reward = 19.33
2022-01-26 14:16:41.625 | DEBUG    | __main__:trials:24 - Trial = 3643/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.626 | DEBUG    | __main__:trials:29 - Trial = 3643/30000 | Total reward = 56.54
2022-01-26 14:16:41.630 | DEBUG    | __main__:trials:24 - Trial = 3644/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.632 | DEBUG    | __main__:trials:29 - Trial = 3644/30000 | Total reward = 56.02
2022-01-26 14:16:41.635 | DEBUG    | __main__:trials:24 - Trial = 3645/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.637 | DEBUG    | __main__:trials:29 - Trial = 3645/30000 | Total reward = 46.37
2022-01-26 14:16:41.639 | DEBUG    | __main__:trials:26 - Trial = 3646/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.641 | DEBUG    | __main__:trials:29 - Trial = 3646/30000 | Total reward = 16.93
2022-01-26 14:16:41.644 | DEBUG    | __main__:trials:24 - Trial = 3647/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.645 | DEBUG    | __main__:trials:29 - Trial = 3647/30000 | Total reward = 47.18
2022-01-26 14:16:41.648 | DEBUG    | __main__:trials:24 - Trial = 3648/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.650 | DEBUG    | __main__:trials:29 - Trial = 3648/30000 | Total reward = 42.80
2022-01-26 14:16:41.654 | DEBUG    | __main__:trials:24 - Trial = 3649/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.654 | DEBUG    | __main__:trials:29 - Trial = 3649/30000 | Total reward = 47.15
2022-01-26 14:16:41.658 | DEBUG    | __main__:trials:26 - Trial = 3650/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.659 | DEBUG    | __main__:trials:29 - Trial = 3650/30000 | Total reward = 19.14
2022-01-26 14:16:41.663 | DEBUG    | __main__:trials:26 - Trial = 3651/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.664 | DEBUG    | __main__:trials:29 - Trial = 3651/30000 | Total reward = 18.80
2022-01-26 14:16:41.668 | DEBUG    | __main__:trials:24 - Trial = 3652/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.669 | DEBUG    | __main__:trials:29 - Trial = 3652/30000 | Total reward = 37.11
2022-01-26 14:16:41.673 | DEBUG    | __main__:trials:24 - Trial = 3653/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.674 | DEBUG    | __main__:trials:29 - Trial = 3653/30000 | Total reward = 34.54
2022-01-26 14:16:41.677 | DEBUG    | __main__:trials:24 - Trial = 3654/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.679 | DEBUG    | __main__:trials:29 - Trial = 3654/30000 | Total reward = 32.67
2022-01-26 14:16:41.683 | DEBUG    | __main__:trials:24 - Trial = 3655/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.685 | DEBUG    | __main__:trials:29 - Trial = 3655/30000 | Total reward = 49.67
2022-01-26 14:16:41.688 | DEBUG    | __main__:trials:24 - Trial = 3656/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.688 | DEBUG    | __main__:trials:29 - Trial = 3656/30000 | Total reward = 40.98
2022-01-26 14:16:41.692 | DEBUG    | __main__:trials:24 - Trial = 3657/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.693 | DEBUG    | __main__:trials:29 - Trial = 3657/30000 | Total reward = 53.13
2022-01-26 14:16:41.697 | DEBUG    | __main__:trials:24 - Trial = 3658/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.698 | DEBUG    | __main__:trials:29 - Trial = 3658/30000 | Total reward = 52.02
2022-01-26 14:16:41.701 | DEBUG    | __main__:trials:24 - Trial = 3659/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.703 | DEBUG    | __main__:trials:29 - Trial = 3659/30000 | Total reward = 44.10
2022-01-26 14:16:41.705 | DEBUG    | __main__:trials:26 - Trial = 3660/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.707 | DEBUG    | __main__:trials:29 - Trial = 3660/30000 | Total reward = 18.36
2022-01-26 14:16:41.710 | DEBUG    | __main__:trials:24 - Trial = 3661/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.712 | DEBUG    | __main__:trials:29 - Trial = 3661/30000 | Total reward = 43.02
2022-01-26 14:16:41.715 | DEBUG    | __main__:trials:24 - Trial = 3662/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.717 | DEBUG    | __main__:trials:29 - Trial = 3662/30000 | Total reward = 39.03
2022-01-26 14:16:41.720 | DEBUG    | __main__:trials:24 - Trial = 3663/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.722 | DEBUG    | __main__:trials:29 - Trial = 3663/30000 | Total reward = 43.66
2022-01-26 14:16:41.725 | DEBUG    | __main__:trials:24 - Trial = 3664/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.725 | DEBUG    | __main__:trials:29 - Trial = 3664/30000 | Total reward = 44.51
2022-01-26 14:16:41.729 | DEBUG    | __main__:trials:24 - Trial = 3665/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.730 | DEBUG    | __main__:trials:29 - Trial = 3665/30000 | Total reward = 29.37
2022-01-26 14:16:41.733 | DEBUG    | __main__:trials:24 - Trial = 3666/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.734 | DEBUG    | __main__:trials:29 - Trial = 3666/30000 | Total reward = 44.77
2022-01-26 14:16:41.737 | DEBUG    | __main__:trials:24 - Trial = 3667/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.738 | DEBUG    | __main__:trials:29 - Trial = 3667/30000 | Total reward = 55.02
2022-01-26 14:16:41.742 | DEBUG    | __main__:trials:24 - Trial = 3668/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.742 | DEBUG    | __main__:trials:29 - Trial = 3668/30000 | Total reward = 48.90
2022-01-26 14:16:41.746 | DEBUG    | __main__:trials:26 - Trial = 3669/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.748 | DEBUG    | __main__:trials:29 - Trial = 3669/30000 | Total reward = 23.13
2022-01-26 14:16:41.751 | DEBUG    | __main__:trials:24 - Trial = 3670/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.753 | DEBUG    | __main__:trials:29 - Trial = 3670/30000 | Total reward = 52.79
2022-01-26 14:16:41.756 | DEBUG    | __main__:trials:24 - Trial = 3671/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.757 | DEBUG    | __main__:trials:29 - Trial = 3671/30000 | Total reward = 43.11
2022-01-26 14:16:41.760 | DEBUG    | __main__:trials:24 - Trial = 3672/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.762 | DEBUG    | __main__:trials:29 - Trial = 3672/30000 | Total reward = 50.74
2022-01-26 14:16:41.766 | DEBUG    | __main__:trials:24 - Trial = 3673/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.766 | DEBUG    | __main__:trials:29 - Trial = 3673/30000 | Total reward = 44.38
2022-01-26 14:16:41.771 | DEBUG    | __main__:trials:24 - Trial = 3674/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.771 | DEBUG    | __main__:trials:29 - Trial = 3674/30000 | Total reward = 21.24
2022-01-26 14:16:41.776 | DEBUG    | __main__:trials:26 - Trial = 3675/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.778 | DEBUG    | __main__:trials:29 - Trial = 3675/30000 | Total reward = 27.99
2022-01-26 14:16:41.781 | DEBUG    | __main__:trials:24 - Trial = 3676/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.784 | DEBUG    | __main__:trials:29 - Trial = 3676/30000 | Total reward = 34.59
2022-01-26 14:16:41.788 | DEBUG    | __main__:trials:24 - Trial = 3677/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.790 | DEBUG    | __main__:trials:29 - Trial = 3677/30000 | Total reward = 44.74
2022-01-26 14:16:41.793 | DEBUG    | __main__:trials:24 - Trial = 3678/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.795 | DEBUG    | __main__:trials:29 - Trial = 3678/30000 | Total reward = 53.10
2022-01-26 14:16:41.798 | DEBUG    | __main__:trials:24 - Trial = 3679/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.800 | DEBUG    | __main__:trials:29 - Trial = 3679/30000 | Total reward = 43.52
2022-01-26 14:16:41.803 | DEBUG    | __main__:trials:26 - Trial = 3680/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.805 | DEBUG    | __main__:trials:29 - Trial = 3680/30000 | Total reward = 22.88
2022-01-26 14:16:41.808 | DEBUG    | __main__:trials:24 - Trial = 3681/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.809 | DEBUG    | __main__:trials:29 - Trial = 3681/30000 | Total reward = 49.10
2022-01-26 14:16:41.813 | DEBUG    | __main__:trials:24 - Trial = 3682/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.814 | DEBUG    | __main__:trials:29 - Trial = 3682/30000 | Total reward = 39.60
2022-01-26 14:16:41.817 | DEBUG    | __main__:trials:24 - Trial = 3683/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.817 | DEBUG    | __main__:trials:29 - Trial = 3683/30000 | Total reward = 41.55
2022-01-26 14:16:41.821 | DEBUG    | __main__:trials:26 - Trial = 3684/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.822 | DEBUG    | __main__:trials:29 - Trial = 3684/30000 | Total reward = 9.56
2022-01-26 14:16:41.826 | DEBUG    | __main__:trials:24 - Trial = 3685/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.826 | DEBUG    | __main__:trials:29 - Trial = 3685/30000 | Total reward = 41.08
2022-01-26 14:16:41.831 | DEBUG    | __main__:trials:24 - Trial = 3686/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.832 | DEBUG    | __main__:trials:29 - Trial = 3686/30000 | Total reward = 36.12
2022-01-26 14:16:41.835 | DEBUG    | __main__:trials:24 - Trial = 3687/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.837 | DEBUG    | __main__:trials:29 - Trial = 3687/30000 | Total reward = 42.20
2022-01-26 14:16:41.840 | DEBUG    | __main__:trials:24 - Trial = 3688/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.842 | DEBUG    | __main__:trials:29 - Trial = 3688/30000 | Total reward = 37.02
2022-01-26 14:16:41.845 | DEBUG    | __main__:trials:24 - Trial = 3689/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.846 | DEBUG    | __main__:trials:29 - Trial = 3689/30000 | Total reward = 9.27
2022-01-26 14:16:41.849 | DEBUG    | __main__:trials:24 - Trial = 3690/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.850 | DEBUG    | __main__:trials:29 - Trial = 3690/30000 | Total reward = 46.73
2022-01-26 14:16:41.854 | DEBUG    | __main__:trials:24 - Trial = 3691/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.856 | DEBUG    | __main__:trials:29 - Trial = 3691/30000 | Total reward = 49.11
2022-01-26 14:16:41.859 | DEBUG    | __main__:trials:24 - Trial = 3692/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.861 | DEBUG    | __main__:trials:29 - Trial = 3692/30000 | Total reward = 49.77
2022-01-26 14:16:41.864 | DEBUG    | __main__:trials:24 - Trial = 3693/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.866 | DEBUG    | __main__:trials:29 - Trial = 3693/30000 | Total reward = 46.66
2022-01-26 14:16:41.869 | DEBUG    | __main__:trials:24 - Trial = 3694/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.871 | DEBUG    | __main__:trials:29 - Trial = 3694/30000 | Total reward = 29.24
2022-01-26 14:16:41.874 | DEBUG    | __main__:trials:24 - Trial = 3695/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.876 | DEBUG    | __main__:trials:29 - Trial = 3695/30000 | Total reward = 53.44
2022-01-26 14:16:41.879 | DEBUG    | __main__:trials:24 - Trial = 3696/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.881 | DEBUG    | __main__:trials:29 - Trial = 3696/30000 | Total reward = 36.30
2022-01-26 14:16:41.884 | DEBUG    | __main__:trials:24 - Trial = 3697/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.886 | DEBUG    | __main__:trials:29 - Trial = 3697/30000 | Total reward = 48.13
2022-01-26 14:16:41.889 | DEBUG    | __main__:trials:26 - Trial = 3698/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:41.891 | DEBUG    | __main__:trials:29 - Trial = 3698/30000 | Total reward = 21.20
2022-01-26 14:16:41.894 | DEBUG    | __main__:trials:24 - Trial = 3699/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.896 | DEBUG    | __main__:trials:29 - Trial = 3699/30000 | Total reward = 43.14
2022-01-26 14:16:41.899 | DEBUG    | __main__:trials:24 - Trial = 3700/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.901 | DEBUG    | __main__:trials:29 - Trial = 3700/30000 | Total reward = 36.34
2022-01-26 14:16:41.905 | DEBUG    | __main__:trials:24 - Trial = 3701/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.906 | DEBUG    | __main__:trials:29 - Trial = 3701/30000 | Total reward = 35.28
2022-01-26 14:16:41.910 | DEBUG    | __main__:trials:24 - Trial = 3702/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.911 | DEBUG    | __main__:trials:29 - Trial = 3702/30000 | Total reward = 47.33
2022-01-26 14:16:41.915 | DEBUG    | __main__:trials:24 - Trial = 3703/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.916 | DEBUG    | __main__:trials:29 - Trial = 3703/30000 | Total reward = 43.65
2022-01-26 14:16:41.919 | DEBUG    | __main__:trials:24 - Trial = 3704/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.921 | DEBUG    | __main__:trials:29 - Trial = 3704/30000 | Total reward = 34.77
2022-01-26 14:16:41.925 | DEBUG    | __main__:trials:24 - Trial = 3705/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.927 | DEBUG    | __main__:trials:29 - Trial = 3705/30000 | Total reward = 28.56
2022-01-26 14:16:41.931 | DEBUG    | __main__:trials:24 - Trial = 3706/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.932 | DEBUG    | __main__:trials:29 - Trial = 3706/30000 | Total reward = 36.50
2022-01-26 14:16:41.936 | DEBUG    | __main__:trials:24 - Trial = 3707/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.938 | DEBUG    | __main__:trials:29 - Trial = 3707/30000 | Total reward = 45.91
2022-01-26 14:16:41.942 | DEBUG    | __main__:trials:24 - Trial = 3708/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.943 | DEBUG    | __main__:trials:29 - Trial = 3708/30000 | Total reward = 43.65
2022-01-26 14:16:41.947 | DEBUG    | __main__:trials:24 - Trial = 3709/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.949 | DEBUG    | __main__:trials:29 - Trial = 3709/30000 | Total reward = 50.74
2022-01-26 14:16:41.952 | DEBUG    | __main__:trials:24 - Trial = 3710/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.954 | DEBUG    | __main__:trials:29 - Trial = 3710/30000 | Total reward = 42.74
2022-01-26 14:16:41.958 | DEBUG    | __main__:trials:24 - Trial = 3711/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.960 | DEBUG    | __main__:trials:29 - Trial = 3711/30000 | Total reward = 52.84
2022-01-26 14:16:41.964 | DEBUG    | __main__:trials:24 - Trial = 3712/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.965 | DEBUG    | __main__:trials:29 - Trial = 3712/30000 | Total reward = 34.16
2022-01-26 14:16:41.969 | DEBUG    | __main__:trials:24 - Trial = 3713/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.970 | DEBUG    | __main__:trials:29 - Trial = 3713/30000 | Total reward = 49.98
2022-01-26 14:16:41.974 | DEBUG    | __main__:trials:24 - Trial = 3714/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.976 | DEBUG    | __main__:trials:29 - Trial = 3714/30000 | Total reward = 45.74
2022-01-26 14:16:41.979 | DEBUG    | __main__:trials:24 - Trial = 3715/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.981 | DEBUG    | __main__:trials:29 - Trial = 3715/30000 | Total reward = 43.68
2022-01-26 14:16:41.985 | DEBUG    | __main__:trials:24 - Trial = 3716/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.986 | DEBUG    | __main__:trials:29 - Trial = 3716/30000 | Total reward = 49.01
2022-01-26 14:16:41.990 | DEBUG    | __main__:trials:24 - Trial = 3717/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.992 | DEBUG    | __main__:trials:29 - Trial = 3717/30000 | Total reward = 27.12
2022-01-26 14:16:41.996 | DEBUG    | __main__:trials:24 - Trial = 3718/30000 | Max number of steps (20) reached
2022-01-26 14:16:41.998 | DEBUG    | __main__:trials:29 - Trial = 3718/30000 | Total reward = 13.75
2022-01-26 14:16:42.002 | DEBUG    | __main__:trials:24 - Trial = 3719/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.004 | DEBUG    | __main__:trials:29 - Trial = 3719/30000 | Total reward = 36.99
2022-01-26 14:16:42.008 | DEBUG    | __main__:trials:24 - Trial = 3720/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.010 | DEBUG    | __main__:trials:29 - Trial = 3720/30000 | Total reward = 61.77
2022-01-26 14:16:42.014 | DEBUG    | __main__:trials:24 - Trial = 3721/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.017 | DEBUG    | __main__:trials:29 - Trial = 3721/30000 | Total reward = 36.17
2022-01-26 14:16:42.020 | DEBUG    | __main__:trials:24 - Trial = 3722/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.022 | DEBUG    | __main__:trials:29 - Trial = 3722/30000 | Total reward = 43.85
2022-01-26 14:16:42.026 | DEBUG    | __main__:trials:24 - Trial = 3723/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.028 | DEBUG    | __main__:trials:29 - Trial = 3723/30000 | Total reward = 48.29
2022-01-26 14:16:42.032 | DEBUG    | __main__:trials:24 - Trial = 3724/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.033 | DEBUG    | __main__:trials:29 - Trial = 3724/30000 | Total reward = 47.66
2022-01-26 14:16:42.037 | DEBUG    | __main__:trials:24 - Trial = 3725/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.038 | DEBUG    | __main__:trials:29 - Trial = 3725/30000 | Total reward = 47.37
2022-01-26 14:16:42.042 | DEBUG    | __main__:trials:24 - Trial = 3726/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.046 | DEBUG    | __main__:trials:29 - Trial = 3726/30000 | Total reward = 39.06
2022-01-26 14:16:42.050 | DEBUG    | __main__:trials:24 - Trial = 3727/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.051 | DEBUG    | __main__:trials:29 - Trial = 3727/30000 | Total reward = 37.22
2022-01-26 14:16:42.056 | DEBUG    | __main__:trials:24 - Trial = 3728/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.058 | DEBUG    | __main__:trials:29 - Trial = 3728/30000 | Total reward = 36.36
2022-01-26 14:16:42.062 | DEBUG    | __main__:trials:24 - Trial = 3729/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.063 | DEBUG    | __main__:trials:29 - Trial = 3729/30000 | Total reward = 50.14
2022-01-26 14:16:42.067 | DEBUG    | __main__:trials:24 - Trial = 3730/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.069 | DEBUG    | __main__:trials:29 - Trial = 3730/30000 | Total reward = 43.51
2022-01-26 14:16:42.072 | DEBUG    | __main__:trials:24 - Trial = 3731/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.073 | DEBUG    | __main__:trials:29 - Trial = 3731/30000 | Total reward = 47.40
2022-01-26 14:16:42.076 | DEBUG    | __main__:trials:26 - Trial = 3732/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.077 | DEBUG    | __main__:trials:29 - Trial = 3732/30000 | Total reward = 17.75
2022-01-26 14:16:42.081 | DEBUG    | __main__:trials:24 - Trial = 3733/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.081 | DEBUG    | __main__:trials:29 - Trial = 3733/30000 | Total reward = 42.05
2022-01-26 14:16:42.088 | DEBUG    | __main__:trials:24 - Trial = 3734/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.089 | DEBUG    | __main__:trials:29 - Trial = 3734/30000 | Total reward = 52.28
2022-01-26 14:16:42.095 | DEBUG    | __main__:trials:24 - Trial = 3735/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.097 | DEBUG    | __main__:trials:29 - Trial = 3735/30000 | Total reward = 48.50
2022-01-26 14:16:42.100 | DEBUG    | __main__:trials:24 - Trial = 3736/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.102 | DEBUG    | __main__:trials:29 - Trial = 3736/30000 | Total reward = 38.50
2022-01-26 14:16:42.105 | DEBUG    | __main__:trials:24 - Trial = 3737/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.105 | DEBUG    | __main__:trials:29 - Trial = 3737/30000 | Total reward = 37.10
2022-01-26 14:16:42.108 | DEBUG    | __main__:trials:26 - Trial = 3738/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.109 | DEBUG    | __main__:trials:29 - Trial = 3738/30000 | Total reward = 16.08
2022-01-26 14:16:42.114 | DEBUG    | __main__:trials:24 - Trial = 3739/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.115 | DEBUG    | __main__:trials:29 - Trial = 3739/30000 | Total reward = 44.28
2022-01-26 14:16:42.118 | DEBUG    | __main__:trials:24 - Trial = 3740/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.120 | DEBUG    | __main__:trials:29 - Trial = 3740/30000 | Total reward = 32.41
2022-01-26 14:16:42.124 | DEBUG    | __main__:trials:24 - Trial = 3741/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.125 | DEBUG    | __main__:trials:29 - Trial = 3741/30000 | Total reward = 43.45
2022-01-26 14:16:42.128 | DEBUG    | __main__:trials:24 - Trial = 3742/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.130 | DEBUG    | __main__:trials:29 - Trial = 3742/30000 | Total reward = 26.36
2022-01-26 14:16:42.133 | DEBUG    | __main__:trials:24 - Trial = 3743/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.135 | DEBUG    | __main__:trials:29 - Trial = 3743/30000 | Total reward = 56.30
2022-01-26 14:16:42.138 | DEBUG    | __main__:trials:26 - Trial = 3744/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.140 | DEBUG    | __main__:trials:29 - Trial = 3744/30000 | Total reward = 23.48
2022-01-26 14:16:42.143 | DEBUG    | __main__:trials:24 - Trial = 3745/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.144 | DEBUG    | __main__:trials:29 - Trial = 3745/30000 | Total reward = 28.29
2022-01-26 14:16:42.148 | DEBUG    | __main__:trials:24 - Trial = 3746/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.150 | DEBUG    | __main__:trials:29 - Trial = 3746/30000 | Total reward = 37.32
2022-01-26 14:16:42.154 | DEBUG    | __main__:trials:24 - Trial = 3747/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.156 | DEBUG    | __main__:trials:29 - Trial = 3747/30000 | Total reward = 48.74
2022-01-26 14:16:42.160 | DEBUG    | __main__:trials:24 - Trial = 3748/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.162 | DEBUG    | __main__:trials:29 - Trial = 3748/30000 | Total reward = 39.62
2022-01-26 14:16:42.165 | DEBUG    | __main__:trials:24 - Trial = 3749/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.167 | DEBUG    | __main__:trials:29 - Trial = 3749/30000 | Total reward = 48.81
2022-01-26 14:16:42.170 | DEBUG    | __main__:trials:24 - Trial = 3750/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.172 | DEBUG    | __main__:trials:29 - Trial = 3750/30000 | Total reward = 46.01
2022-01-26 14:16:42.175 | DEBUG    | __main__:trials:24 - Trial = 3751/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.177 | DEBUG    | __main__:trials:29 - Trial = 3751/30000 | Total reward = 43.65
2022-01-26 14:16:42.180 | DEBUG    | __main__:trials:24 - Trial = 3752/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.182 | DEBUG    | __main__:trials:29 - Trial = 3752/30000 | Total reward = 57.57
2022-01-26 14:16:42.185 | DEBUG    | __main__:trials:24 - Trial = 3753/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.187 | DEBUG    | __main__:trials:29 - Trial = 3753/30000 | Total reward = 39.70
2022-01-26 14:16:42.191 | DEBUG    | __main__:trials:24 - Trial = 3754/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.192 | DEBUG    | __main__:trials:29 - Trial = 3754/30000 | Total reward = 51.87
2022-01-26 14:16:42.195 | DEBUG    | __main__:trials:24 - Trial = 3755/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.197 | DEBUG    | __main__:trials:29 - Trial = 3755/30000 | Total reward = 43.09
2022-01-26 14:16:42.200 | DEBUG    | __main__:trials:24 - Trial = 3756/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.202 | DEBUG    | __main__:trials:29 - Trial = 3756/30000 | Total reward = 51.60
2022-01-26 14:16:42.205 | DEBUG    | __main__:trials:26 - Trial = 3757/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.206 | DEBUG    | __main__:trials:29 - Trial = 3757/30000 | Total reward = 16.75
2022-01-26 14:16:42.210 | DEBUG    | __main__:trials:24 - Trial = 3758/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.211 | DEBUG    | __main__:trials:29 - Trial = 3758/30000 | Total reward = 45.58
2022-01-26 14:16:42.215 | DEBUG    | __main__:trials:24 - Trial = 3759/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.217 | DEBUG    | __main__:trials:29 - Trial = 3759/30000 | Total reward = 42.39
2022-01-26 14:16:42.220 | DEBUG    | __main__:trials:24 - Trial = 3760/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.221 | DEBUG    | __main__:trials:29 - Trial = 3760/30000 | Total reward = 41.07
2022-01-26 14:16:42.225 | DEBUG    | __main__:trials:24 - Trial = 3761/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.227 | DEBUG    | __main__:trials:29 - Trial = 3761/30000 | Total reward = 34.62
2022-01-26 14:16:42.230 | DEBUG    | __main__:trials:24 - Trial = 3762/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.232 | DEBUG    | __main__:trials:29 - Trial = 3762/30000 | Total reward = 41.14
2022-01-26 14:16:42.236 | DEBUG    | __main__:trials:24 - Trial = 3763/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.237 | DEBUG    | __main__:trials:29 - Trial = 3763/30000 | Total reward = 36.95
2022-01-26 14:16:42.241 | DEBUG    | __main__:trials:24 - Trial = 3764/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.242 | DEBUG    | __main__:trials:29 - Trial = 3764/30000 | Total reward = 58.73
2022-01-26 14:16:42.246 | DEBUG    | __main__:trials:24 - Trial = 3765/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.247 | DEBUG    | __main__:trials:29 - Trial = 3765/30000 | Total reward = 47.33
2022-01-26 14:16:42.251 | DEBUG    | __main__:trials:24 - Trial = 3766/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.253 | DEBUG    | __main__:trials:29 - Trial = 3766/30000 | Total reward = 36.52
2022-01-26 14:16:42.256 | DEBUG    | __main__:trials:24 - Trial = 3767/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.257 | DEBUG    | __main__:trials:29 - Trial = 3767/30000 | Total reward = 35.41
2022-01-26 14:16:42.260 | DEBUG    | __main__:trials:24 - Trial = 3768/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.262 | DEBUG    | __main__:trials:29 - Trial = 3768/30000 | Total reward = 48.76
2022-01-26 14:16:42.266 | DEBUG    | __main__:trials:24 - Trial = 3769/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.267 | DEBUG    | __main__:trials:29 - Trial = 3769/30000 | Total reward = 23.51
2022-01-26 14:16:42.271 | DEBUG    | __main__:trials:24 - Trial = 3770/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.273 | DEBUG    | __main__:trials:29 - Trial = 3770/30000 | Total reward = 47.15
2022-01-26 14:16:42.276 | DEBUG    | __main__:trials:24 - Trial = 3771/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.278 | DEBUG    | __main__:trials:29 - Trial = 3771/30000 | Total reward = 45.28
2022-01-26 14:16:42.282 | DEBUG    | __main__:trials:24 - Trial = 3772/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.283 | DEBUG    | __main__:trials:29 - Trial = 3772/30000 | Total reward = 48.66
2022-01-26 14:16:42.287 | DEBUG    | __main__:trials:24 - Trial = 3773/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.288 | DEBUG    | __main__:trials:29 - Trial = 3773/30000 | Total reward = 40.86
2022-01-26 14:16:42.292 | DEBUG    | __main__:trials:24 - Trial = 3774/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.294 | DEBUG    | __main__:trials:29 - Trial = 3774/30000 | Total reward = 57.81
2022-01-26 14:16:42.296 | DEBUG    | __main__:trials:24 - Trial = 3775/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.298 | DEBUG    | __main__:trials:29 - Trial = 3775/30000 | Total reward = 49.99
2022-01-26 14:16:42.301 | DEBUG    | __main__:trials:24 - Trial = 3776/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.303 | DEBUG    | __main__:trials:29 - Trial = 3776/30000 | Total reward = 28.78
2022-01-26 14:16:42.305 | DEBUG    | __main__:trials:24 - Trial = 3777/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.307 | DEBUG    | __main__:trials:29 - Trial = 3777/30000 | Total reward = 43.64
2022-01-26 14:16:42.311 | DEBUG    | __main__:trials:24 - Trial = 3778/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.312 | DEBUG    | __main__:trials:29 - Trial = 3778/30000 | Total reward = 42.94
2022-01-26 14:16:42.316 | DEBUG    | __main__:trials:24 - Trial = 3779/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.318 | DEBUG    | __main__:trials:29 - Trial = 3779/30000 | Total reward = 24.44
2022-01-26 14:16:42.322 | DEBUG    | __main__:trials:24 - Trial = 3780/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.323 | DEBUG    | __main__:trials:29 - Trial = 3780/30000 | Total reward = 40.75
2022-01-26 14:16:42.327 | DEBUG    | __main__:trials:24 - Trial = 3781/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.328 | DEBUG    | __main__:trials:29 - Trial = 3781/30000 | Total reward = 37.61
2022-01-26 14:16:42.332 | DEBUG    | __main__:trials:24 - Trial = 3782/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.334 | DEBUG    | __main__:trials:29 - Trial = 3782/30000 | Total reward = 58.50
2022-01-26 14:16:42.338 | DEBUG    | __main__:trials:24 - Trial = 3783/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.339 | DEBUG    | __main__:trials:29 - Trial = 3783/30000 | Total reward = 44.38
2022-01-26 14:16:42.343 | DEBUG    | __main__:trials:24 - Trial = 3784/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.344 | DEBUG    | __main__:trials:29 - Trial = 3784/30000 | Total reward = 43.30
2022-01-26 14:16:42.348 | DEBUG    | __main__:trials:24 - Trial = 3785/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.350 | DEBUG    | __main__:trials:29 - Trial = 3785/30000 | Total reward = 44.38
2022-01-26 14:16:42.353 | DEBUG    | __main__:trials:24 - Trial = 3786/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.355 | DEBUG    | __main__:trials:29 - Trial = 3786/30000 | Total reward = 46.40
2022-01-26 14:16:42.359 | DEBUG    | __main__:trials:24 - Trial = 3787/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.359 | DEBUG    | __main__:trials:29 - Trial = 3787/30000 | Total reward = 35.18
2022-01-26 14:16:42.363 | DEBUG    | __main__:trials:24 - Trial = 3788/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.365 | DEBUG    | __main__:trials:29 - Trial = 3788/30000 | Total reward = 39.49
2022-01-26 14:16:42.368 | DEBUG    | __main__:trials:26 - Trial = 3789/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.369 | DEBUG    | __main__:trials:29 - Trial = 3789/30000 | Total reward = 12.78
2022-01-26 14:16:42.373 | DEBUG    | __main__:trials:24 - Trial = 3790/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.374 | DEBUG    | __main__:trials:29 - Trial = 3790/30000 | Total reward = 43.71
2022-01-26 14:16:42.377 | DEBUG    | __main__:trials:24 - Trial = 3791/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.379 | DEBUG    | __main__:trials:29 - Trial = 3791/30000 | Total reward = 41.59
2022-01-26 14:16:42.383 | DEBUG    | __main__:trials:24 - Trial = 3792/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.384 | DEBUG    | __main__:trials:29 - Trial = 3792/30000 | Total reward = 56.16
2022-01-26 14:16:42.388 | DEBUG    | __main__:trials:24 - Trial = 3793/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.390 | DEBUG    | __main__:trials:29 - Trial = 3793/30000 | Total reward = 43.00
2022-01-26 14:16:42.393 | DEBUG    | __main__:trials:24 - Trial = 3794/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.394 | DEBUG    | __main__:trials:29 - Trial = 3794/30000 | Total reward = 43.71
2022-01-26 14:16:42.398 | DEBUG    | __main__:trials:24 - Trial = 3795/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.400 | DEBUG    | __main__:trials:29 - Trial = 3795/30000 | Total reward = 44.18
2022-01-26 14:16:42.404 | DEBUG    | __main__:trials:24 - Trial = 3796/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.405 | DEBUG    | __main__:trials:29 - Trial = 3796/30000 | Total reward = 33.18
2022-01-26 14:16:42.409 | DEBUG    | __main__:trials:24 - Trial = 3797/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.410 | DEBUG    | __main__:trials:29 - Trial = 3797/30000 | Total reward = 36.97
2022-01-26 14:16:42.414 | DEBUG    | __main__:trials:24 - Trial = 3798/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.415 | DEBUG    | __main__:trials:29 - Trial = 3798/30000 | Total reward = 43.12
2022-01-26 14:16:42.419 | DEBUG    | __main__:trials:24 - Trial = 3799/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.421 | DEBUG    | __main__:trials:29 - Trial = 3799/30000 | Total reward = 46.26
2022-01-26 14:16:42.424 | DEBUG    | __main__:trials:24 - Trial = 3800/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.426 | DEBUG    | __main__:trials:29 - Trial = 3800/30000 | Total reward = 49.69
2022-01-26 14:16:42.430 | DEBUG    | __main__:trials:24 - Trial = 3801/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.431 | DEBUG    | __main__:trials:29 - Trial = 3801/30000 | Total reward = 18.59
2022-01-26 14:16:42.436 | DEBUG    | __main__:trials:24 - Trial = 3802/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.438 | DEBUG    | __main__:trials:29 - Trial = 3802/30000 | Total reward = 58.94
2022-01-26 14:16:42.441 | DEBUG    | __main__:trials:24 - Trial = 3803/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.443 | DEBUG    | __main__:trials:29 - Trial = 3803/30000 | Total reward = 57.03
2022-01-26 14:16:42.446 | DEBUG    | __main__:trials:24 - Trial = 3804/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.448 | DEBUG    | __main__:trials:29 - Trial = 3804/30000 | Total reward = 40.75
2022-01-26 14:16:42.452 | DEBUG    | __main__:trials:24 - Trial = 3805/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.454 | DEBUG    | __main__:trials:29 - Trial = 3805/30000 | Total reward = 31.89
2022-01-26 14:16:42.457 | DEBUG    | __main__:trials:24 - Trial = 3806/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.459 | DEBUG    | __main__:trials:29 - Trial = 3806/30000 | Total reward = 40.64
2022-01-26 14:16:42.463 | DEBUG    | __main__:trials:24 - Trial = 3807/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.465 | DEBUG    | __main__:trials:29 - Trial = 3807/30000 | Total reward = 40.49
2022-01-26 14:16:42.469 | DEBUG    | __main__:trials:24 - Trial = 3808/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.469 | DEBUG    | __main__:trials:29 - Trial = 3808/30000 | Total reward = 41.67
2022-01-26 14:16:42.474 | DEBUG    | __main__:trials:24 - Trial = 3809/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.476 | DEBUG    | __main__:trials:29 - Trial = 3809/30000 | Total reward = 39.58
2022-01-26 14:16:42.479 | DEBUG    | __main__:trials:24 - Trial = 3810/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.481 | DEBUG    | __main__:trials:29 - Trial = 3810/30000 | Total reward = 49.91
2022-01-26 14:16:42.484 | DEBUG    | __main__:trials:24 - Trial = 3811/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.485 | DEBUG    | __main__:trials:29 - Trial = 3811/30000 | Total reward = 49.29
2022-01-26 14:16:42.489 | DEBUG    | __main__:trials:24 - Trial = 3812/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.491 | DEBUG    | __main__:trials:29 - Trial = 3812/30000 | Total reward = 43.96
2022-01-26 14:16:42.494 | DEBUG    | __main__:trials:24 - Trial = 3813/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.496 | DEBUG    | __main__:trials:29 - Trial = 3813/30000 | Total reward = 48.68
2022-01-26 14:16:42.499 | DEBUG    | __main__:trials:26 - Trial = 3814/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.500 | DEBUG    | __main__:trials:29 - Trial = 3814/30000 | Total reward = 20.75
2022-01-26 14:16:42.504 | DEBUG    | __main__:trials:24 - Trial = 3815/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.506 | DEBUG    | __main__:trials:29 - Trial = 3815/30000 | Total reward = 32.33
2022-01-26 14:16:42.510 | DEBUG    | __main__:trials:24 - Trial = 3816/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.511 | DEBUG    | __main__:trials:29 - Trial = 3816/30000 | Total reward = 38.68
2022-01-26 14:16:42.515 | DEBUG    | __main__:trials:24 - Trial = 3817/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.516 | DEBUG    | __main__:trials:29 - Trial = 3817/30000 | Total reward = 30.94
2022-01-26 14:16:42.520 | DEBUG    | __main__:trials:24 - Trial = 3818/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.522 | DEBUG    | __main__:trials:29 - Trial = 3818/30000 | Total reward = 47.26
2022-01-26 14:16:42.525 | DEBUG    | __main__:trials:24 - Trial = 3819/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.527 | DEBUG    | __main__:trials:29 - Trial = 3819/30000 | Total reward = 46.79
2022-01-26 14:16:42.530 | DEBUG    | __main__:trials:26 - Trial = 3820/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.532 | DEBUG    | __main__:trials:29 - Trial = 3820/30000 | Total reward = 20.31
2022-01-26 14:16:42.535 | DEBUG    | __main__:trials:24 - Trial = 3821/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.537 | DEBUG    | __main__:trials:29 - Trial = 3821/30000 | Total reward = 29.48
2022-01-26 14:16:42.540 | DEBUG    | __main__:trials:24 - Trial = 3822/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.542 | DEBUG    | __main__:trials:29 - Trial = 3822/30000 | Total reward = 47.32
2022-01-26 14:16:42.546 | DEBUG    | __main__:trials:24 - Trial = 3823/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.547 | DEBUG    | __main__:trials:29 - Trial = 3823/30000 | Total reward = 25.05
2022-01-26 14:16:42.551 | DEBUG    | __main__:trials:24 - Trial = 3824/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.553 | DEBUG    | __main__:trials:29 - Trial = 3824/30000 | Total reward = 43.71
2022-01-26 14:16:42.556 | DEBUG    | __main__:trials:24 - Trial = 3825/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.558 | DEBUG    | __main__:trials:29 - Trial = 3825/30000 | Total reward = 25.43
2022-01-26 14:16:42.562 | DEBUG    | __main__:trials:24 - Trial = 3826/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.563 | DEBUG    | __main__:trials:29 - Trial = 3826/30000 | Total reward = 41.20
2022-01-26 14:16:42.567 | DEBUG    | __main__:trials:24 - Trial = 3827/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.569 | DEBUG    | __main__:trials:29 - Trial = 3827/30000 | Total reward = 43.71
2022-01-26 14:16:42.572 | DEBUG    | __main__:trials:24 - Trial = 3828/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.574 | DEBUG    | __main__:trials:29 - Trial = 3828/30000 | Total reward = 53.63
2022-01-26 14:16:42.577 | DEBUG    | __main__:trials:24 - Trial = 3829/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.578 | DEBUG    | __main__:trials:29 - Trial = 3829/30000 | Total reward = 42.54
2022-01-26 14:16:42.582 | DEBUG    | __main__:trials:24 - Trial = 3830/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.584 | DEBUG    | __main__:trials:29 - Trial = 3830/30000 | Total reward = 32.17
2022-01-26 14:16:42.588 | DEBUG    | __main__:trials:24 - Trial = 3831/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.588 | DEBUG    | __main__:trials:29 - Trial = 3831/30000 | Total reward = 41.13
2022-01-26 14:16:42.592 | DEBUG    | __main__:trials:24 - Trial = 3832/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.594 | DEBUG    | __main__:trials:29 - Trial = 3832/30000 | Total reward = 48.98
2022-01-26 14:16:42.598 | DEBUG    | __main__:trials:24 - Trial = 3833/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.599 | DEBUG    | __main__:trials:29 - Trial = 3833/30000 | Total reward = 48.25
2022-01-26 14:16:42.603 | DEBUG    | __main__:trials:24 - Trial = 3834/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.605 | DEBUG    | __main__:trials:29 - Trial = 3834/30000 | Total reward = 53.09
2022-01-26 14:16:42.608 | DEBUG    | __main__:trials:24 - Trial = 3835/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.609 | DEBUG    | __main__:trials:29 - Trial = 3835/30000 | Total reward = 43.71
2022-01-26 14:16:42.613 | DEBUG    | __main__:trials:24 - Trial = 3836/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.614 | DEBUG    | __main__:trials:29 - Trial = 3836/30000 | Total reward = 45.29
2022-01-26 14:16:42.618 | DEBUG    | __main__:trials:24 - Trial = 3837/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.619 | DEBUG    | __main__:trials:29 - Trial = 3837/30000 | Total reward = 43.71
2022-01-26 14:16:42.623 | DEBUG    | __main__:trials:24 - Trial = 3838/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.625 | DEBUG    | __main__:trials:29 - Trial = 3838/30000 | Total reward = 42.74
2022-01-26 14:16:42.629 | DEBUG    | __main__:trials:24 - Trial = 3839/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.630 | DEBUG    | __main__:trials:29 - Trial = 3839/30000 | Total reward = 61.26
2022-01-26 14:16:42.634 | DEBUG    | __main__:trials:24 - Trial = 3840/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.636 | DEBUG    | __main__:trials:29 - Trial = 3840/30000 | Total reward = 36.42
2022-01-26 14:16:42.639 | DEBUG    | __main__:trials:24 - Trial = 3841/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.640 | DEBUG    | __main__:trials:29 - Trial = 3841/30000 | Total reward = 56.31
2022-01-26 14:16:42.644 | DEBUG    | __main__:trials:24 - Trial = 3842/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.646 | DEBUG    | __main__:trials:29 - Trial = 3842/30000 | Total reward = 44.12
2022-01-26 14:16:42.649 | DEBUG    | __main__:trials:24 - Trial = 3843/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.651 | DEBUG    | __main__:trials:29 - Trial = 3843/30000 | Total reward = 60.74
2022-01-26 14:16:42.654 | DEBUG    | __main__:trials:24 - Trial = 3844/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.656 | DEBUG    | __main__:trials:29 - Trial = 3844/30000 | Total reward = 38.46
2022-01-26 14:16:42.660 | DEBUG    | __main__:trials:24 - Trial = 3845/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.660 | DEBUG    | __main__:trials:29 - Trial = 3845/30000 | Total reward = 43.71
2022-01-26 14:16:42.664 | DEBUG    | __main__:trials:24 - Trial = 3846/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.666 | DEBUG    | __main__:trials:29 - Trial = 3846/30000 | Total reward = 48.69
2022-01-26 14:16:42.669 | DEBUG    | __main__:trials:24 - Trial = 3847/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.670 | DEBUG    | __main__:trials:29 - Trial = 3847/30000 | Total reward = 43.71
2022-01-26 14:16:42.673 | DEBUG    | __main__:trials:24 - Trial = 3848/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.674 | DEBUG    | __main__:trials:29 - Trial = 3848/30000 | Total reward = 51.94
2022-01-26 14:16:42.677 | DEBUG    | __main__:trials:26 - Trial = 3849/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.678 | DEBUG    | __main__:trials:29 - Trial = 3849/30000 | Total reward = 32.82
2022-01-26 14:16:42.681 | DEBUG    | __main__:trials:24 - Trial = 3850/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.684 | DEBUG    | __main__:trials:29 - Trial = 3850/30000 | Total reward = 17.69
2022-01-26 14:16:42.687 | DEBUG    | __main__:trials:24 - Trial = 3851/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.689 | DEBUG    | __main__:trials:29 - Trial = 3851/30000 | Total reward = 49.47
2022-01-26 14:16:42.692 | DEBUG    | __main__:trials:24 - Trial = 3852/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.694 | DEBUG    | __main__:trials:29 - Trial = 3852/30000 | Total reward = 48.66
2022-01-26 14:16:42.697 | DEBUG    | __main__:trials:24 - Trial = 3853/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.699 | DEBUG    | __main__:trials:29 - Trial = 3853/30000 | Total reward = 43.43
2022-01-26 14:16:42.702 | DEBUG    | __main__:trials:24 - Trial = 3854/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.704 | DEBUG    | __main__:trials:29 - Trial = 3854/30000 | Total reward = 44.17
2022-01-26 14:16:42.707 | DEBUG    | __main__:trials:24 - Trial = 3855/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.709 | DEBUG    | __main__:trials:29 - Trial = 3855/30000 | Total reward = 42.36
2022-01-26 14:16:42.712 | DEBUG    | __main__:trials:24 - Trial = 3856/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.714 | DEBUG    | __main__:trials:29 - Trial = 3856/30000 | Total reward = 45.15
2022-01-26 14:16:42.718 | DEBUG    | __main__:trials:24 - Trial = 3857/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.719 | DEBUG    | __main__:trials:29 - Trial = 3857/30000 | Total reward = 40.58
2022-01-26 14:16:42.722 | DEBUG    | __main__:trials:24 - Trial = 3858/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.724 | DEBUG    | __main__:trials:29 - Trial = 3858/30000 | Total reward = 29.46
2022-01-26 14:16:42.728 | DEBUG    | __main__:trials:24 - Trial = 3859/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.728 | DEBUG    | __main__:trials:29 - Trial = 3859/30000 | Total reward = 59.68
2022-01-26 14:16:42.732 | DEBUG    | __main__:trials:26 - Trial = 3860/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.733 | DEBUG    | __main__:trials:29 - Trial = 3860/30000 | Total reward = 11.78
2022-01-26 14:16:42.736 | DEBUG    | __main__:trials:24 - Trial = 3861/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.737 | DEBUG    | __main__:trials:29 - Trial = 3861/30000 | Total reward = 35.50
2022-01-26 14:16:42.740 | DEBUG    | __main__:trials:24 - Trial = 3862/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.742 | DEBUG    | __main__:trials:29 - Trial = 3862/30000 | Total reward = 44.78
2022-01-26 14:16:42.746 | DEBUG    | __main__:trials:24 - Trial = 3863/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.748 | DEBUG    | __main__:trials:29 - Trial = 3863/30000 | Total reward = 44.40
2022-01-26 14:16:42.751 | DEBUG    | __main__:trials:24 - Trial = 3864/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.753 | DEBUG    | __main__:trials:29 - Trial = 3864/30000 | Total reward = 38.05
2022-01-26 14:16:42.756 | DEBUG    | __main__:trials:24 - Trial = 3865/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.757 | DEBUG    | __main__:trials:29 - Trial = 3865/30000 | Total reward = 47.68
2022-01-26 14:16:42.761 | DEBUG    | __main__:trials:24 - Trial = 3866/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.762 | DEBUG    | __main__:trials:29 - Trial = 3866/30000 | Total reward = 29.14
2022-01-26 14:16:42.766 | DEBUG    | __main__:trials:24 - Trial = 3867/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.768 | DEBUG    | __main__:trials:29 - Trial = 3867/30000 | Total reward = 38.03
2022-01-26 14:16:42.771 | DEBUG    | __main__:trials:24 - Trial = 3868/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.773 | DEBUG    | __main__:trials:29 - Trial = 3868/30000 | Total reward = 50.53
2022-01-26 14:16:42.777 | DEBUG    | __main__:trials:24 - Trial = 3869/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.777 | DEBUG    | __main__:trials:29 - Trial = 3869/30000 | Total reward = 36.63
2022-01-26 14:16:42.781 | DEBUG    | __main__:trials:24 - Trial = 3870/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.782 | DEBUG    | __main__:trials:29 - Trial = 3870/30000 | Total reward = 36.79
2022-01-26 14:16:42.785 | DEBUG    | __main__:trials:24 - Trial = 3871/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.787 | DEBUG    | __main__:trials:29 - Trial = 3871/30000 | Total reward = 40.10
2022-01-26 14:16:42.791 | DEBUG    | __main__:trials:24 - Trial = 3872/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.793 | DEBUG    | __main__:trials:29 - Trial = 3872/30000 | Total reward = 47.67
2022-01-26 14:16:42.796 | DEBUG    | __main__:trials:24 - Trial = 3873/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.798 | DEBUG    | __main__:trials:29 - Trial = 3873/30000 | Total reward = 32.39
2022-01-26 14:16:42.802 | DEBUG    | __main__:trials:24 - Trial = 3874/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.804 | DEBUG    | __main__:trials:29 - Trial = 3874/30000 | Total reward = 26.10
2022-01-26 14:16:42.807 | DEBUG    | __main__:trials:24 - Trial = 3875/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.808 | DEBUG    | __main__:trials:29 - Trial = 3875/30000 | Total reward = 43.26
2022-01-26 14:16:42.812 | DEBUG    | __main__:trials:24 - Trial = 3876/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.814 | DEBUG    | __main__:trials:29 - Trial = 3876/30000 | Total reward = 38.92
2022-01-26 14:16:42.817 | DEBUG    | __main__:trials:24 - Trial = 3877/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.819 | DEBUG    | __main__:trials:29 - Trial = 3877/30000 | Total reward = 29.91
2022-01-26 14:16:42.823 | DEBUG    | __main__:trials:24 - Trial = 3878/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.824 | DEBUG    | __main__:trials:29 - Trial = 3878/30000 | Total reward = 43.44
2022-01-26 14:16:42.827 | DEBUG    | __main__:trials:24 - Trial = 3879/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.829 | DEBUG    | __main__:trials:29 - Trial = 3879/30000 | Total reward = 43.47
2022-01-26 14:16:42.833 | DEBUG    | __main__:trials:24 - Trial = 3880/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.834 | DEBUG    | __main__:trials:29 - Trial = 3880/30000 | Total reward = 44.81
2022-01-26 14:16:42.838 | DEBUG    | __main__:trials:24 - Trial = 3881/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.839 | DEBUG    | __main__:trials:29 - Trial = 3881/30000 | Total reward = 56.68
2022-01-26 14:16:42.843 | DEBUG    | __main__:trials:26 - Trial = 3882/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.844 | DEBUG    | __main__:trials:29 - Trial = 3882/30000 | Total reward = 16.39
2022-01-26 14:16:42.848 | DEBUG    | __main__:trials:26 - Trial = 3883/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.850 | DEBUG    | __main__:trials:29 - Trial = 3883/30000 | Total reward = 31.13
2022-01-26 14:16:42.853 | DEBUG    | __main__:trials:24 - Trial = 3884/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.855 | DEBUG    | __main__:trials:29 - Trial = 3884/30000 | Total reward = 48.32
2022-01-26 14:16:42.860 | DEBUG    | __main__:trials:24 - Trial = 3885/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.861 | DEBUG    | __main__:trials:29 - Trial = 3885/30000 | Total reward = 43.47
2022-01-26 14:16:42.865 | DEBUG    | __main__:trials:24 - Trial = 3886/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.867 | DEBUG    | __main__:trials:29 - Trial = 3886/30000 | Total reward = 31.05
2022-01-26 14:16:42.870 | DEBUG    | __main__:trials:24 - Trial = 3887/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.872 | DEBUG    | __main__:trials:29 - Trial = 3887/30000 | Total reward = 37.03
2022-01-26 14:16:42.875 | DEBUG    | __main__:trials:24 - Trial = 3888/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.877 | DEBUG    | __main__:trials:29 - Trial = 3888/30000 | Total reward = 61.57
2022-01-26 14:16:42.880 | DEBUG    | __main__:trials:24 - Trial = 3889/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.882 | DEBUG    | __main__:trials:29 - Trial = 3889/30000 | Total reward = 33.58
2022-01-26 14:16:42.886 | DEBUG    | __main__:trials:24 - Trial = 3890/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.887 | DEBUG    | __main__:trials:29 - Trial = 3890/30000 | Total reward = 32.39
2022-01-26 14:16:42.891 | DEBUG    | __main__:trials:24 - Trial = 3891/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.893 | DEBUG    | __main__:trials:29 - Trial = 3891/30000 | Total reward = 46.45
2022-01-26 14:16:42.896 | DEBUG    | __main__:trials:26 - Trial = 3892/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.897 | DEBUG    | __main__:trials:29 - Trial = 3892/30000 | Total reward = 28.45
2022-01-26 14:16:42.901 | DEBUG    | __main__:trials:24 - Trial = 3893/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.901 | DEBUG    | __main__:trials:29 - Trial = 3893/30000 | Total reward = 41.35
2022-01-26 14:16:42.905 | DEBUG    | __main__:trials:24 - Trial = 3894/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.905 | DEBUG    | __main__:trials:29 - Trial = 3894/30000 | Total reward = 40.87
2022-01-26 14:16:42.909 | DEBUG    | __main__:trials:26 - Trial = 3895/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:42.910 | DEBUG    | __main__:trials:29 - Trial = 3895/30000 | Total reward = 31.43
2022-01-26 14:16:42.914 | DEBUG    | __main__:trials:24 - Trial = 3896/30000 | Max number of steps (20) reached
2022-01-26 14:16:42.915 | DEBUG    | __main__:trials:29 - Trial = 3896/30000 | Total reward = 50.42
2022-01-26 14:16:43.041 | DEBUG    | __main__:trials:24 - Trial = 3897/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.042 | DEBUG    | __main__:trials:29 - Trial = 3897/30000 | Total reward = 47.11
2022-01-26 14:16:43.048 | DEBUG    | __main__:trials:24 - Trial = 3898/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.050 | DEBUG    | __main__:trials:29 - Trial = 3898/30000 | Total reward = 43.28
2022-01-26 14:16:43.053 | DEBUG    | __main__:trials:24 - Trial = 3899/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.055 | DEBUG    | __main__:trials:29 - Trial = 3899/30000 | Total reward = 48.50
2022-01-26 14:16:43.059 | DEBUG    | __main__:trials:24 - Trial = 3900/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.061 | DEBUG    | __main__:trials:29 - Trial = 3900/30000 | Total reward = 54.06
2022-01-26 14:16:43.064 | DEBUG    | __main__:trials:24 - Trial = 3901/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.065 | DEBUG    | __main__:trials:29 - Trial = 3901/30000 | Total reward = 31.42
2022-01-26 14:16:43.068 | DEBUG    | __main__:trials:24 - Trial = 3902/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.070 | DEBUG    | __main__:trials:29 - Trial = 3902/30000 | Total reward = 31.90
2022-01-26 14:16:43.074 | DEBUG    | __main__:trials:24 - Trial = 3903/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.076 | DEBUG    | __main__:trials:29 - Trial = 3903/30000 | Total reward = 19.70
2022-01-26 14:16:43.079 | DEBUG    | __main__:trials:24 - Trial = 3904/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.081 | DEBUG    | __main__:trials:29 - Trial = 3904/30000 | Total reward = 52.32
2022-01-26 14:16:43.085 | DEBUG    | __main__:trials:24 - Trial = 3905/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.087 | DEBUG    | __main__:trials:29 - Trial = 3905/30000 | Total reward = 56.29
2022-01-26 14:16:43.090 | DEBUG    | __main__:trials:24 - Trial = 3906/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.092 | DEBUG    | __main__:trials:29 - Trial = 3906/30000 | Total reward = 39.73
2022-01-26 14:16:43.096 | DEBUG    | __main__:trials:24 - Trial = 3907/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.097 | DEBUG    | __main__:trials:29 - Trial = 3907/30000 | Total reward = 42.10
2022-01-26 14:16:43.101 | DEBUG    | __main__:trials:24 - Trial = 3908/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.102 | DEBUG    | __main__:trials:29 - Trial = 3908/30000 | Total reward = 49.38
2022-01-26 14:16:43.105 | DEBUG    | __main__:trials:24 - Trial = 3909/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.107 | DEBUG    | __main__:trials:29 - Trial = 3909/30000 | Total reward = 37.99
2022-01-26 14:16:43.110 | DEBUG    | __main__:trials:24 - Trial = 3910/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.111 | DEBUG    | __main__:trials:29 - Trial = 3910/30000 | Total reward = 52.21
2022-01-26 14:16:43.116 | DEBUG    | __main__:trials:24 - Trial = 3911/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.117 | DEBUG    | __main__:trials:29 - Trial = 3911/30000 | Total reward = 31.25
2022-01-26 14:16:43.121 | DEBUG    | __main__:trials:24 - Trial = 3912/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.122 | DEBUG    | __main__:trials:29 - Trial = 3912/30000 | Total reward = 36.10
2022-01-26 14:16:43.126 | DEBUG    | __main__:trials:24 - Trial = 3913/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.128 | DEBUG    | __main__:trials:29 - Trial = 3913/30000 | Total reward = 47.72
2022-01-26 14:16:43.131 | DEBUG    | __main__:trials:24 - Trial = 3914/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.132 | DEBUG    | __main__:trials:29 - Trial = 3914/30000 | Total reward = 51.81
2022-01-26 14:16:43.136 | DEBUG    | __main__:trials:24 - Trial = 3915/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.138 | DEBUG    | __main__:trials:29 - Trial = 3915/30000 | Total reward = 41.51
2022-01-26 14:16:43.141 | DEBUG    | __main__:trials:24 - Trial = 3916/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.143 | DEBUG    | __main__:trials:29 - Trial = 3916/30000 | Total reward = 22.40
2022-01-26 14:16:43.147 | DEBUG    | __main__:trials:24 - Trial = 3917/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.148 | DEBUG    | __main__:trials:29 - Trial = 3917/30000 | Total reward = 46.36
2022-01-26 14:16:43.152 | DEBUG    | __main__:trials:24 - Trial = 3918/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.153 | DEBUG    | __main__:trials:29 - Trial = 3918/30000 | Total reward = 43.30
2022-01-26 14:16:43.157 | DEBUG    | __main__:trials:24 - Trial = 3919/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.158 | DEBUG    | __main__:trials:29 - Trial = 3919/30000 | Total reward = 48.37
2022-01-26 14:16:43.161 | DEBUG    | __main__:trials:24 - Trial = 3920/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.162 | DEBUG    | __main__:trials:29 - Trial = 3920/30000 | Total reward = 42.63
2022-01-26 14:16:43.166 | DEBUG    | __main__:trials:24 - Trial = 3921/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.166 | DEBUG    | __main__:trials:29 - Trial = 3921/30000 | Total reward = 39.85
2022-01-26 14:16:43.170 | DEBUG    | __main__:trials:24 - Trial = 3922/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.170 | DEBUG    | __main__:trials:29 - Trial = 3922/30000 | Total reward = 43.58
2022-01-26 14:16:43.174 | DEBUG    | __main__:trials:24 - Trial = 3923/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.176 | DEBUG    | __main__:trials:29 - Trial = 3923/30000 | Total reward = 31.81
2022-01-26 14:16:43.179 | DEBUG    | __main__:trials:24 - Trial = 3924/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.181 | DEBUG    | __main__:trials:29 - Trial = 3924/30000 | Total reward = 33.23
2022-01-26 14:16:43.183 | DEBUG    | __main__:trials:24 - Trial = 3925/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.185 | DEBUG    | __main__:trials:29 - Trial = 3925/30000 | Total reward = 21.93
2022-01-26 14:16:43.189 | DEBUG    | __main__:trials:24 - Trial = 3926/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.191 | DEBUG    | __main__:trials:29 - Trial = 3926/30000 | Total reward = 31.61
2022-01-26 14:16:43.194 | DEBUG    | __main__:trials:24 - Trial = 3927/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.196 | DEBUG    | __main__:trials:29 - Trial = 3927/30000 | Total reward = 33.84
2022-01-26 14:16:43.200 | DEBUG    | __main__:trials:24 - Trial = 3928/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.200 | DEBUG    | __main__:trials:29 - Trial = 3928/30000 | Total reward = 46.17
2022-01-26 14:16:43.204 | DEBUG    | __main__:trials:24 - Trial = 3929/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.205 | DEBUG    | __main__:trials:29 - Trial = 3929/30000 | Total reward = 32.49
2022-01-26 14:16:43.209 | DEBUG    | __main__:trials:24 - Trial = 3930/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.209 | DEBUG    | __main__:trials:29 - Trial = 3930/30000 | Total reward = 43.65
2022-01-26 14:16:43.213 | DEBUG    | __main__:trials:24 - Trial = 3931/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.214 | DEBUG    | __main__:trials:29 - Trial = 3931/30000 | Total reward = 43.94
2022-01-26 14:16:43.217 | DEBUG    | __main__:trials:24 - Trial = 3932/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.218 | DEBUG    | __main__:trials:29 - Trial = 3932/30000 | Total reward = 43.59
2022-01-26 14:16:43.221 | DEBUG    | __main__:trials:24 - Trial = 3933/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.223 | DEBUG    | __main__:trials:29 - Trial = 3933/30000 | Total reward = 46.61
2022-01-26 14:16:43.227 | DEBUG    | __main__:trials:24 - Trial = 3934/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.229 | DEBUG    | __main__:trials:29 - Trial = 3934/30000 | Total reward = 39.11
2022-01-26 14:16:43.232 | DEBUG    | __main__:trials:24 - Trial = 3935/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.234 | DEBUG    | __main__:trials:29 - Trial = 3935/30000 | Total reward = 37.68
2022-01-26 14:16:43.237 | DEBUG    | __main__:trials:24 - Trial = 3936/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.239 | DEBUG    | __main__:trials:29 - Trial = 3936/30000 | Total reward = 34.77
2022-01-26 14:16:43.243 | DEBUG    | __main__:trials:24 - Trial = 3937/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.245 | DEBUG    | __main__:trials:29 - Trial = 3937/30000 | Total reward = 35.14
2022-01-26 14:16:43.248 | DEBUG    | __main__:trials:24 - Trial = 3938/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.250 | DEBUG    | __main__:trials:29 - Trial = 3938/30000 | Total reward = 33.38
2022-01-26 14:16:43.253 | DEBUG    | __main__:trials:26 - Trial = 3939/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.253 | DEBUG    | __main__:trials:29 - Trial = 3939/30000 | Total reward = 17.85
2022-01-26 14:16:43.258 | DEBUG    | __main__:trials:24 - Trial = 3940/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.258 | DEBUG    | __main__:trials:29 - Trial = 3940/30000 | Total reward = 49.32
2022-01-26 14:16:43.262 | DEBUG    | __main__:trials:24 - Trial = 3941/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.263 | DEBUG    | __main__:trials:29 - Trial = 3941/30000 | Total reward = 31.19
2022-01-26 14:16:43.270 | DEBUG    | __main__:trials:26 - Trial = 3942/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.270 | DEBUG    | __main__:trials:29 - Trial = 3942/30000 | Total reward = 20.75
2022-01-26 14:16:43.274 | DEBUG    | __main__:trials:24 - Trial = 3943/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.276 | DEBUG    | __main__:trials:29 - Trial = 3943/30000 | Total reward = 47.41
2022-01-26 14:16:43.279 | DEBUG    | __main__:trials:24 - Trial = 3944/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.281 | DEBUG    | __main__:trials:29 - Trial = 3944/30000 | Total reward = 56.64
2022-01-26 14:16:43.285 | DEBUG    | __main__:trials:24 - Trial = 3945/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.286 | DEBUG    | __main__:trials:29 - Trial = 3945/30000 | Total reward = 40.49
2022-01-26 14:16:43.289 | DEBUG    | __main__:trials:24 - Trial = 3946/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.291 | DEBUG    | __main__:trials:29 - Trial = 3946/30000 | Total reward = 53.55
2022-01-26 14:16:43.295 | DEBUG    | __main__:trials:24 - Trial = 3947/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.296 | DEBUG    | __main__:trials:29 - Trial = 3947/30000 | Total reward = 31.35
2022-01-26 14:16:43.300 | DEBUG    | __main__:trials:24 - Trial = 3948/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.300 | DEBUG    | __main__:trials:29 - Trial = 3948/30000 | Total reward = 48.39
2022-01-26 14:16:43.304 | DEBUG    | __main__:trials:24 - Trial = 3949/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.306 | DEBUG    | __main__:trials:29 - Trial = 3949/30000 | Total reward = 51.77
2022-01-26 14:16:43.310 | DEBUG    | __main__:trials:24 - Trial = 3950/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.311 | DEBUG    | __main__:trials:29 - Trial = 3950/30000 | Total reward = 35.48
2022-01-26 14:16:43.314 | DEBUG    | __main__:trials:24 - Trial = 3951/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.316 | DEBUG    | __main__:trials:29 - Trial = 3951/30000 | Total reward = 38.22
2022-01-26 14:16:43.320 | DEBUG    | __main__:trials:24 - Trial = 3952/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.321 | DEBUG    | __main__:trials:29 - Trial = 3952/30000 | Total reward = 48.75
2022-01-26 14:16:43.325 | DEBUG    | __main__:trials:24 - Trial = 3953/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.327 | DEBUG    | __main__:trials:29 - Trial = 3953/30000 | Total reward = 46.10
2022-01-26 14:16:43.331 | DEBUG    | __main__:trials:24 - Trial = 3954/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.332 | DEBUG    | __main__:trials:29 - Trial = 3954/30000 | Total reward = 11.63
2022-01-26 14:16:43.336 | DEBUG    | __main__:trials:24 - Trial = 3955/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.338 | DEBUG    | __main__:trials:29 - Trial = 3955/30000 | Total reward = 37.16
2022-01-26 14:16:43.341 | DEBUG    | __main__:trials:24 - Trial = 3956/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.343 | DEBUG    | __main__:trials:29 - Trial = 3956/30000 | Total reward = 41.57
2022-01-26 14:16:43.347 | DEBUG    | __main__:trials:24 - Trial = 3957/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.348 | DEBUG    | __main__:trials:29 - Trial = 3957/30000 | Total reward = 37.70
2022-01-26 14:16:43.352 | DEBUG    | __main__:trials:24 - Trial = 3958/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.353 | DEBUG    | __main__:trials:29 - Trial = 3958/30000 | Total reward = 55.63
2022-01-26 14:16:43.357 | DEBUG    | __main__:trials:24 - Trial = 3959/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.359 | DEBUG    | __main__:trials:29 - Trial = 3959/30000 | Total reward = 21.61
2022-01-26 14:16:43.362 | DEBUG    | __main__:trials:24 - Trial = 3960/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.364 | DEBUG    | __main__:trials:29 - Trial = 3960/30000 | Total reward = 48.01
2022-01-26 14:16:43.367 | DEBUG    | __main__:trials:24 - Trial = 3961/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.369 | DEBUG    | __main__:trials:29 - Trial = 3961/30000 | Total reward = 32.97
2022-01-26 14:16:43.372 | DEBUG    | __main__:trials:24 - Trial = 3962/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.373 | DEBUG    | __main__:trials:29 - Trial = 3962/30000 | Total reward = 43.16
2022-01-26 14:16:43.377 | DEBUG    | __main__:trials:24 - Trial = 3963/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.377 | DEBUG    | __main__:trials:29 - Trial = 3963/30000 | Total reward = 48.55
2022-01-26 14:16:43.382 | DEBUG    | __main__:trials:24 - Trial = 3964/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.384 | DEBUG    | __main__:trials:29 - Trial = 3964/30000 | Total reward = 32.53
2022-01-26 14:16:43.387 | DEBUG    | __main__:trials:24 - Trial = 3965/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.389 | DEBUG    | __main__:trials:29 - Trial = 3965/30000 | Total reward = 49.38
2022-01-26 14:16:43.393 | DEBUG    | __main__:trials:24 - Trial = 3966/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.394 | DEBUG    | __main__:trials:29 - Trial = 3966/30000 | Total reward = 50.22
2022-01-26 14:16:43.397 | DEBUG    | __main__:trials:24 - Trial = 3967/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.399 | DEBUG    | __main__:trials:29 - Trial = 3967/30000 | Total reward = 42.63
2022-01-26 14:16:43.403 | DEBUG    | __main__:trials:24 - Trial = 3968/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.404 | DEBUG    | __main__:trials:29 - Trial = 3968/30000 | Total reward = 43.71
2022-01-26 14:16:43.408 | DEBUG    | __main__:trials:24 - Trial = 3969/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.410 | DEBUG    | __main__:trials:29 - Trial = 3969/30000 | Total reward = 46.60
2022-01-26 14:16:43.413 | DEBUG    | __main__:trials:24 - Trial = 3970/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.415 | DEBUG    | __main__:trials:29 - Trial = 3970/30000 | Total reward = 27.78
2022-01-26 14:16:43.419 | DEBUG    | __main__:trials:24 - Trial = 3971/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.421 | DEBUG    | __main__:trials:29 - Trial = 3971/30000 | Total reward = 43.24
2022-01-26 14:16:43.424 | DEBUG    | __main__:trials:24 - Trial = 3972/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.425 | DEBUG    | __main__:trials:29 - Trial = 3972/30000 | Total reward = 43.51
2022-01-26 14:16:43.429 | DEBUG    | __main__:trials:24 - Trial = 3973/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.429 | DEBUG    | __main__:trials:29 - Trial = 3973/30000 | Total reward = 35.32
2022-01-26 14:16:43.433 | DEBUG    | __main__:trials:24 - Trial = 3974/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.435 | DEBUG    | __main__:trials:29 - Trial = 3974/30000 | Total reward = 39.00
2022-01-26 14:16:43.438 | DEBUG    | __main__:trials:24 - Trial = 3975/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.440 | DEBUG    | __main__:trials:29 - Trial = 3975/30000 | Total reward = 49.00
2022-01-26 14:16:43.444 | DEBUG    | __main__:trials:24 - Trial = 3976/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.445 | DEBUG    | __main__:trials:29 - Trial = 3976/30000 | Total reward = 53.61
2022-01-26 14:16:43.449 | DEBUG    | __main__:trials:24 - Trial = 3977/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.450 | DEBUG    | __main__:trials:29 - Trial = 3977/30000 | Total reward = 43.12
2022-01-26 14:16:43.454 | DEBUG    | __main__:trials:24 - Trial = 3978/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.456 | DEBUG    | __main__:trials:29 - Trial = 3978/30000 | Total reward = 28.23
2022-01-26 14:16:43.460 | DEBUG    | __main__:trials:24 - Trial = 3979/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.460 | DEBUG    | __main__:trials:29 - Trial = 3979/30000 | Total reward = 35.92
2022-01-26 14:16:43.464 | DEBUG    | __main__:trials:24 - Trial = 3980/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.466 | DEBUG    | __main__:trials:29 - Trial = 3980/30000 | Total reward = 45.93
2022-01-26 14:16:43.470 | DEBUG    | __main__:trials:24 - Trial = 3981/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.472 | DEBUG    | __main__:trials:29 - Trial = 3981/30000 | Total reward = 30.12
2022-01-26 14:16:43.475 | DEBUG    | __main__:trials:24 - Trial = 3982/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.476 | DEBUG    | __main__:trials:29 - Trial = 3982/30000 | Total reward = 43.03
2022-01-26 14:16:43.480 | DEBUG    | __main__:trials:24 - Trial = 3983/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.482 | DEBUG    | __main__:trials:29 - Trial = 3983/30000 | Total reward = 48.45
2022-01-26 14:16:43.485 | DEBUG    | __main__:trials:24 - Trial = 3984/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.487 | DEBUG    | __main__:trials:29 - Trial = 3984/30000 | Total reward = 47.59
2022-01-26 14:16:43.490 | DEBUG    | __main__:trials:26 - Trial = 3985/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.491 | DEBUG    | __main__:trials:29 - Trial = 3985/30000 | Total reward = 18.45
2022-01-26 14:16:43.495 | DEBUG    | __main__:trials:24 - Trial = 3986/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.496 | DEBUG    | __main__:trials:29 - Trial = 3986/30000 | Total reward = 35.91
2022-01-26 14:16:43.500 | DEBUG    | __main__:trials:24 - Trial = 3987/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.501 | DEBUG    | __main__:trials:29 - Trial = 3987/30000 | Total reward = 45.43
2022-01-26 14:16:43.505 | DEBUG    | __main__:trials:24 - Trial = 3988/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.507 | DEBUG    | __main__:trials:29 - Trial = 3988/30000 | Total reward = 40.28
2022-01-26 14:16:43.510 | DEBUG    | __main__:trials:24 - Trial = 3989/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.512 | DEBUG    | __main__:trials:29 - Trial = 3989/30000 | Total reward = 30.89
2022-01-26 14:16:43.516 | DEBUG    | __main__:trials:24 - Trial = 3990/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.517 | DEBUG    | __main__:trials:29 - Trial = 3990/30000 | Total reward = 41.29
2022-01-26 14:16:43.521 | DEBUG    | __main__:trials:24 - Trial = 3991/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.523 | DEBUG    | __main__:trials:29 - Trial = 3991/30000 | Total reward = 30.66
2022-01-26 14:16:43.526 | DEBUG    | __main__:trials:24 - Trial = 3992/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.528 | DEBUG    | __main__:trials:29 - Trial = 3992/30000 | Total reward = 36.84
2022-01-26 14:16:43.531 | DEBUG    | __main__:trials:24 - Trial = 3993/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.533 | DEBUG    | __main__:trials:29 - Trial = 3993/30000 | Total reward = 32.28
2022-01-26 14:16:43.536 | DEBUG    | __main__:trials:24 - Trial = 3994/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.538 | DEBUG    | __main__:trials:29 - Trial = 3994/30000 | Total reward = 58.77
2022-01-26 14:16:43.542 | DEBUG    | __main__:trials:24 - Trial = 3995/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.542 | DEBUG    | __main__:trials:29 - Trial = 3995/30000 | Total reward = 43.47
2022-01-26 14:16:43.547 | DEBUG    | __main__:trials:24 - Trial = 3996/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.548 | DEBUG    | __main__:trials:29 - Trial = 3996/30000 | Total reward = 50.79
2022-01-26 14:16:43.552 | DEBUG    | __main__:trials:24 - Trial = 3997/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.553 | DEBUG    | __main__:trials:29 - Trial = 3997/30000 | Total reward = 35.03
2022-01-26 14:16:43.557 | DEBUG    | __main__:trials:24 - Trial = 3998/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.558 | DEBUG    | __main__:trials:29 - Trial = 3998/30000 | Total reward = 43.71
2022-01-26 14:16:43.562 | DEBUG    | __main__:trials:24 - Trial = 3999/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.563 | DEBUG    | __main__:trials:29 - Trial = 3999/30000 | Total reward = 32.97
2022-01-26 14:16:43.566 | DEBUG    | __main__:trials:24 - Trial = 4000/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.568 | DEBUG    | __main__:trials:29 - Trial = 4000/30000 | Total reward = 45.19
2022-01-26 14:16:43.572 | DEBUG    | __main__:trials:24 - Trial = 4001/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.573 | DEBUG    | __main__:trials:29 - Trial = 4001/30000 | Total reward = 34.42
2022-01-26 14:16:43.577 | DEBUG    | __main__:trials:24 - Trial = 4002/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.579 | DEBUG    | __main__:trials:29 - Trial = 4002/30000 | Total reward = 39.00
2022-01-26 14:16:43.582 | DEBUG    | __main__:trials:24 - Trial = 4003/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.584 | DEBUG    | __main__:trials:29 - Trial = 4003/30000 | Total reward = 35.24
2022-01-26 14:16:43.588 | DEBUG    | __main__:trials:24 - Trial = 4004/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.589 | DEBUG    | __main__:trials:29 - Trial = 4004/30000 | Total reward = 55.99
2022-01-26 14:16:43.592 | DEBUG    | __main__:trials:24 - Trial = 4005/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.594 | DEBUG    | __main__:trials:29 - Trial = 4005/30000 | Total reward = 31.30
2022-01-26 14:16:43.597 | DEBUG    | __main__:trials:26 - Trial = 4006/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.599 | DEBUG    | __main__:trials:29 - Trial = 4006/30000 | Total reward = 20.86
2022-01-26 14:16:43.602 | DEBUG    | __main__:trials:24 - Trial = 4007/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.604 | DEBUG    | __main__:trials:29 - Trial = 4007/30000 | Total reward = 38.15
2022-01-26 14:16:43.608 | DEBUG    | __main__:trials:24 - Trial = 4008/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.609 | DEBUG    | __main__:trials:29 - Trial = 4008/30000 | Total reward = 46.36
2022-01-26 14:16:43.613 | DEBUG    | __main__:trials:24 - Trial = 4009/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.615 | DEBUG    | __main__:trials:29 - Trial = 4009/30000 | Total reward = 33.21
2022-01-26 14:16:43.618 | DEBUG    | __main__:trials:24 - Trial = 4010/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.620 | DEBUG    | __main__:trials:29 - Trial = 4010/30000 | Total reward = 33.55
2022-01-26 14:16:43.623 | DEBUG    | __main__:trials:26 - Trial = 4011/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.624 | DEBUG    | __main__:trials:29 - Trial = 4011/30000 | Total reward = 18.28
2022-01-26 14:16:43.628 | DEBUG    | __main__:trials:24 - Trial = 4012/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.630 | DEBUG    | __main__:trials:29 - Trial = 4012/30000 | Total reward = 50.35
2022-01-26 14:16:43.633 | DEBUG    | __main__:trials:24 - Trial = 4013/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.634 | DEBUG    | __main__:trials:29 - Trial = 4013/30000 | Total reward = 39.00
2022-01-26 14:16:43.638 | DEBUG    | __main__:trials:24 - Trial = 4014/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.639 | DEBUG    | __main__:trials:29 - Trial = 4014/30000 | Total reward = 43.95
2022-01-26 14:16:43.643 | DEBUG    | __main__:trials:24 - Trial = 4015/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.644 | DEBUG    | __main__:trials:29 - Trial = 4015/30000 | Total reward = 36.38
2022-01-26 14:16:43.648 | DEBUG    | __main__:trials:24 - Trial = 4016/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.650 | DEBUG    | __main__:trials:29 - Trial = 4016/30000 | Total reward = 41.41
2022-01-26 14:16:43.653 | DEBUG    | __main__:trials:24 - Trial = 4017/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.655 | DEBUG    | __main__:trials:29 - Trial = 4017/30000 | Total reward = 48.46
2022-01-26 14:16:43.658 | DEBUG    | __main__:trials:24 - Trial = 4018/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.660 | DEBUG    | __main__:trials:29 - Trial = 4018/30000 | Total reward = 42.42
2022-01-26 14:16:43.663 | DEBUG    | __main__:trials:24 - Trial = 4019/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.665 | DEBUG    | __main__:trials:29 - Trial = 4019/30000 | Total reward = 45.48
2022-01-26 14:16:43.668 | DEBUG    | __main__:trials:24 - Trial = 4020/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.670 | DEBUG    | __main__:trials:29 - Trial = 4020/30000 | Total reward = 37.74
2022-01-26 14:16:43.674 | DEBUG    | __main__:trials:24 - Trial = 4021/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.675 | DEBUG    | __main__:trials:29 - Trial = 4021/30000 | Total reward = 37.65
2022-01-26 14:16:43.679 | DEBUG    | __main__:trials:24 - Trial = 4022/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.680 | DEBUG    | __main__:trials:29 - Trial = 4022/30000 | Total reward = 50.22
2022-01-26 14:16:43.684 | DEBUG    | __main__:trials:24 - Trial = 4023/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.685 | DEBUG    | __main__:trials:29 - Trial = 4023/30000 | Total reward = 29.93
2022-01-26 14:16:43.689 | DEBUG    | __main__:trials:24 - Trial = 4024/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.691 | DEBUG    | __main__:trials:29 - Trial = 4024/30000 | Total reward = 43.71
2022-01-26 14:16:43.694 | DEBUG    | __main__:trials:24 - Trial = 4025/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.696 | DEBUG    | __main__:trials:29 - Trial = 4025/30000 | Total reward = 35.47
2022-01-26 14:16:43.700 | DEBUG    | __main__:trials:26 - Trial = 4026/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.701 | DEBUG    | __main__:trials:29 - Trial = 4026/30000 | Total reward = 33.80
2022-01-26 14:16:43.705 | DEBUG    | __main__:trials:24 - Trial = 4027/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.706 | DEBUG    | __main__:trials:29 - Trial = 4027/30000 | Total reward = 43.60
2022-01-26 14:16:43.709 | DEBUG    | __main__:trials:24 - Trial = 4028/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.711 | DEBUG    | __main__:trials:29 - Trial = 4028/30000 | Total reward = 59.38
2022-01-26 14:16:43.714 | DEBUG    | __main__:trials:26 - Trial = 4029/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.715 | DEBUG    | __main__:trials:29 - Trial = 4029/30000 | Total reward = 18.81
2022-01-26 14:16:43.719 | DEBUG    | __main__:trials:24 - Trial = 4030/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.721 | DEBUG    | __main__:trials:29 - Trial = 4030/30000 | Total reward = 43.64
2022-01-26 14:16:43.725 | DEBUG    | __main__:trials:24 - Trial = 4031/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.727 | DEBUG    | __main__:trials:29 - Trial = 4031/30000 | Total reward = 43.24
2022-01-26 14:16:43.731 | DEBUG    | __main__:trials:24 - Trial = 4032/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.732 | DEBUG    | __main__:trials:29 - Trial = 4032/30000 | Total reward = 48.36
2022-01-26 14:16:43.736 | DEBUG    | __main__:trials:24 - Trial = 4033/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.737 | DEBUG    | __main__:trials:29 - Trial = 4033/30000 | Total reward = 40.73
2022-01-26 14:16:43.741 | DEBUG    | __main__:trials:24 - Trial = 4034/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.743 | DEBUG    | __main__:trials:29 - Trial = 4034/30000 | Total reward = 55.07
2022-01-26 14:16:43.747 | DEBUG    | __main__:trials:24 - Trial = 4035/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.748 | DEBUG    | __main__:trials:29 - Trial = 4035/30000 | Total reward = 46.83
2022-01-26 14:16:43.752 | DEBUG    | __main__:trials:24 - Trial = 4036/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.754 | DEBUG    | __main__:trials:29 - Trial = 4036/30000 | Total reward = 44.16
2022-01-26 14:16:43.757 | DEBUG    | __main__:trials:24 - Trial = 4037/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.759 | DEBUG    | __main__:trials:29 - Trial = 4037/30000 | Total reward = 34.97
2022-01-26 14:16:43.763 | DEBUG    | __main__:trials:24 - Trial = 4038/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.763 | DEBUG    | __main__:trials:29 - Trial = 4038/30000 | Total reward = 41.13
2022-01-26 14:16:43.767 | DEBUG    | __main__:trials:26 - Trial = 4039/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:43.769 | DEBUG    | __main__:trials:29 - Trial = 4039/30000 | Total reward = 35.33
2022-01-26 14:16:43.772 | DEBUG    | __main__:trials:24 - Trial = 4040/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.773 | DEBUG    | __main__:trials:29 - Trial = 4040/30000 | Total reward = 39.00
2022-01-26 14:16:43.776 | DEBUG    | __main__:trials:24 - Trial = 4041/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.778 | DEBUG    | __main__:trials:29 - Trial = 4041/30000 | Total reward = 18.13
2022-01-26 14:16:43.782 | DEBUG    | __main__:trials:24 - Trial = 4042/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.783 | DEBUG    | __main__:trials:29 - Trial = 4042/30000 | Total reward = 38.99
2022-01-26 14:16:43.787 | DEBUG    | __main__:trials:24 - Trial = 4043/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.789 | DEBUG    | __main__:trials:29 - Trial = 4043/30000 | Total reward = 42.79
2022-01-26 14:16:43.792 | DEBUG    | __main__:trials:24 - Trial = 4044/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.794 | DEBUG    | __main__:trials:29 - Trial = 4044/30000 | Total reward = 43.71
2022-01-26 14:16:43.798 | DEBUG    | __main__:trials:24 - Trial = 4045/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.799 | DEBUG    | __main__:trials:29 - Trial = 4045/30000 | Total reward = 43.79
2022-01-26 14:16:43.803 | DEBUG    | __main__:trials:24 - Trial = 4046/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.804 | DEBUG    | __main__:trials:29 - Trial = 4046/30000 | Total reward = 42.55
2022-01-26 14:16:43.808 | DEBUG    | __main__:trials:24 - Trial = 4047/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.810 | DEBUG    | __main__:trials:29 - Trial = 4047/30000 | Total reward = 39.68
2022-01-26 14:16:43.813 | DEBUG    | __main__:trials:24 - Trial = 4048/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.815 | DEBUG    | __main__:trials:29 - Trial = 4048/30000 | Total reward = 43.47
2022-01-26 14:16:43.819 | DEBUG    | __main__:trials:24 - Trial = 4049/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.820 | DEBUG    | __main__:trials:29 - Trial = 4049/30000 | Total reward = 43.67
2022-01-26 14:16:43.824 | DEBUG    | __main__:trials:24 - Trial = 4050/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.825 | DEBUG    | __main__:trials:29 - Trial = 4050/30000 | Total reward = 45.01
2022-01-26 14:16:43.829 | DEBUG    | __main__:trials:24 - Trial = 4051/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.831 | DEBUG    | __main__:trials:29 - Trial = 4051/30000 | Total reward = 42.40
2022-01-26 14:16:43.835 | DEBUG    | __main__:trials:24 - Trial = 4052/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.836 | DEBUG    | __main__:trials:29 - Trial = 4052/30000 | Total reward = 44.98
2022-01-26 14:16:43.840 | DEBUG    | __main__:trials:24 - Trial = 4053/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.842 | DEBUG    | __main__:trials:29 - Trial = 4053/30000 | Total reward = 28.05
2022-01-26 14:16:43.846 | DEBUG    | __main__:trials:24 - Trial = 4054/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.847 | DEBUG    | __main__:trials:29 - Trial = 4054/30000 | Total reward = 42.58
2022-01-26 14:16:43.851 | DEBUG    | __main__:trials:24 - Trial = 4055/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.852 | DEBUG    | __main__:trials:29 - Trial = 4055/30000 | Total reward = 48.44
2022-01-26 14:16:43.856 | DEBUG    | __main__:trials:24 - Trial = 4056/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.858 | DEBUG    | __main__:trials:29 - Trial = 4056/30000 | Total reward = 43.71
2022-01-26 14:16:43.862 | DEBUG    | __main__:trials:24 - Trial = 4057/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.863 | DEBUG    | __main__:trials:29 - Trial = 4057/30000 | Total reward = 35.63
2022-01-26 14:16:43.867 | DEBUG    | __main__:trials:24 - Trial = 4058/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.869 | DEBUG    | __main__:trials:29 - Trial = 4058/30000 | Total reward = 32.97
2022-01-26 14:16:43.873 | DEBUG    | __main__:trials:24 - Trial = 4059/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.874 | DEBUG    | __main__:trials:29 - Trial = 4059/30000 | Total reward = 42.63
2022-01-26 14:16:43.878 | DEBUG    | __main__:trials:24 - Trial = 4060/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.879 | DEBUG    | __main__:trials:29 - Trial = 4060/30000 | Total reward = 45.48
2022-01-26 14:16:43.882 | DEBUG    | __main__:trials:24 - Trial = 4061/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.884 | DEBUG    | __main__:trials:29 - Trial = 4061/30000 | Total reward = 49.04
2022-01-26 14:16:43.887 | DEBUG    | __main__:trials:24 - Trial = 4062/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.889 | DEBUG    | __main__:trials:29 - Trial = 4062/30000 | Total reward = 41.99
2022-01-26 14:16:43.893 | DEBUG    | __main__:trials:24 - Trial = 4063/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.895 | DEBUG    | __main__:trials:29 - Trial = 4063/30000 | Total reward = 50.08
2022-01-26 14:16:43.898 | DEBUG    | __main__:trials:24 - Trial = 4064/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.900 | DEBUG    | __main__:trials:29 - Trial = 4064/30000 | Total reward = 30.67
2022-01-26 14:16:43.904 | DEBUG    | __main__:trials:24 - Trial = 4065/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.906 | DEBUG    | __main__:trials:29 - Trial = 4065/30000 | Total reward = 51.13
2022-01-26 14:16:43.910 | DEBUG    | __main__:trials:24 - Trial = 4066/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.911 | DEBUG    | __main__:trials:29 - Trial = 4066/30000 | Total reward = 43.71
2022-01-26 14:16:43.915 | DEBUG    | __main__:trials:24 - Trial = 4067/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.917 | DEBUG    | __main__:trials:29 - Trial = 4067/30000 | Total reward = 43.56
2022-01-26 14:16:43.920 | DEBUG    | __main__:trials:24 - Trial = 4068/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.922 | DEBUG    | __main__:trials:29 - Trial = 4068/30000 | Total reward = 40.82
2022-01-26 14:16:43.925 | DEBUG    | __main__:trials:24 - Trial = 4069/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.927 | DEBUG    | __main__:trials:29 - Trial = 4069/30000 | Total reward = 42.73
2022-01-26 14:16:43.931 | DEBUG    | __main__:trials:24 - Trial = 4070/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.932 | DEBUG    | __main__:trials:29 - Trial = 4070/30000 | Total reward = 50.58
2022-01-26 14:16:43.936 | DEBUG    | __main__:trials:24 - Trial = 4071/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.938 | DEBUG    | __main__:trials:29 - Trial = 4071/30000 | Total reward = 56.20
2022-01-26 14:16:43.941 | DEBUG    | __main__:trials:24 - Trial = 4072/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.942 | DEBUG    | __main__:trials:29 - Trial = 4072/30000 | Total reward = 43.26
2022-01-26 14:16:43.946 | DEBUG    | __main__:trials:24 - Trial = 4073/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.948 | DEBUG    | __main__:trials:29 - Trial = 4073/30000 | Total reward = 49.13
2022-01-26 14:16:43.952 | DEBUG    | __main__:trials:24 - Trial = 4074/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.953 | DEBUG    | __main__:trials:29 - Trial = 4074/30000 | Total reward = 42.24
2022-01-26 14:16:43.957 | DEBUG    | __main__:trials:24 - Trial = 4075/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.958 | DEBUG    | __main__:trials:29 - Trial = 4075/30000 | Total reward = 41.58
2022-01-26 14:16:43.962 | DEBUG    | __main__:trials:24 - Trial = 4076/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.963 | DEBUG    | __main__:trials:29 - Trial = 4076/30000 | Total reward = 42.68
2022-01-26 14:16:43.967 | DEBUG    | __main__:trials:24 - Trial = 4077/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.969 | DEBUG    | __main__:trials:29 - Trial = 4077/30000 | Total reward = 44.40
2022-01-26 14:16:43.972 | DEBUG    | __main__:trials:24 - Trial = 4078/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.974 | DEBUG    | __main__:trials:29 - Trial = 4078/30000 | Total reward = 39.84
2022-01-26 14:16:43.978 | DEBUG    | __main__:trials:24 - Trial = 4079/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.979 | DEBUG    | __main__:trials:29 - Trial = 4079/30000 | Total reward = 50.67
2022-01-26 14:16:43.983 | DEBUG    | __main__:trials:24 - Trial = 4080/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.984 | DEBUG    | __main__:trials:29 - Trial = 4080/30000 | Total reward = 44.48
2022-01-26 14:16:43.988 | DEBUG    | __main__:trials:24 - Trial = 4081/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.990 | DEBUG    | __main__:trials:29 - Trial = 4081/30000 | Total reward = 40.25
2022-01-26 14:16:43.993 | DEBUG    | __main__:trials:24 - Trial = 4082/30000 | Max number of steps (20) reached
2022-01-26 14:16:43.995 | DEBUG    | __main__:trials:29 - Trial = 4082/30000 | Total reward = 48.87
2022-01-26 14:16:43.999 | DEBUG    | __main__:trials:24 - Trial = 4083/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.000 | DEBUG    | __main__:trials:29 - Trial = 4083/30000 | Total reward = 41.26
2022-01-26 14:16:44.004 | DEBUG    | __main__:trials:24 - Trial = 4084/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.006 | DEBUG    | __main__:trials:29 - Trial = 4084/30000 | Total reward = 50.91
2022-01-26 14:16:44.010 | DEBUG    | __main__:trials:24 - Trial = 4085/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.011 | DEBUG    | __main__:trials:29 - Trial = 4085/30000 | Total reward = 51.32
2022-01-26 14:16:44.015 | DEBUG    | __main__:trials:24 - Trial = 4086/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.017 | DEBUG    | __main__:trials:29 - Trial = 4086/30000 | Total reward = 37.99
2022-01-26 14:16:44.020 | DEBUG    | __main__:trials:24 - Trial = 4087/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.022 | DEBUG    | __main__:trials:29 - Trial = 4087/30000 | Total reward = 51.60
2022-01-26 14:16:44.026 | DEBUG    | __main__:trials:24 - Trial = 4088/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.027 | DEBUG    | __main__:trials:29 - Trial = 4088/30000 | Total reward = 56.36
2022-01-26 14:16:44.030 | DEBUG    | __main__:trials:24 - Trial = 4089/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.032 | DEBUG    | __main__:trials:29 - Trial = 4089/30000 | Total reward = 42.40
2022-01-26 14:16:44.036 | DEBUG    | __main__:trials:24 - Trial = 4090/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.038 | DEBUG    | __main__:trials:29 - Trial = 4090/30000 | Total reward = 35.27
2022-01-26 14:16:44.042 | DEBUG    | __main__:trials:24 - Trial = 4091/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.043 | DEBUG    | __main__:trials:29 - Trial = 4091/30000 | Total reward = 42.58
2022-01-26 14:16:44.047 | DEBUG    | __main__:trials:24 - Trial = 4092/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.049 | DEBUG    | __main__:trials:29 - Trial = 4092/30000 | Total reward = 48.58
2022-01-26 14:16:44.052 | DEBUG    | __main__:trials:24 - Trial = 4093/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.054 | DEBUG    | __main__:trials:29 - Trial = 4093/30000 | Total reward = 31.69
2022-01-26 14:16:44.057 | DEBUG    | __main__:trials:24 - Trial = 4094/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.059 | DEBUG    | __main__:trials:29 - Trial = 4094/30000 | Total reward = 30.61
2022-01-26 14:16:44.063 | DEBUG    | __main__:trials:24 - Trial = 4095/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.064 | DEBUG    | __main__:trials:29 - Trial = 4095/30000 | Total reward = 38.28
2022-01-26 14:16:44.067 | DEBUG    | __main__:trials:24 - Trial = 4096/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.070 | DEBUG    | __main__:trials:29 - Trial = 4096/30000 | Total reward = 32.39
2022-01-26 14:16:44.073 | DEBUG    | __main__:trials:26 - Trial = 4097/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.074 | DEBUG    | __main__:trials:29 - Trial = 4097/30000 | Total reward = 28.61
2022-01-26 14:16:44.078 | DEBUG    | __main__:trials:24 - Trial = 4098/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.079 | DEBUG    | __main__:trials:29 - Trial = 4098/30000 | Total reward = 43.32
2022-01-26 14:16:44.083 | DEBUG    | __main__:trials:24 - Trial = 4099/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.085 | DEBUG    | __main__:trials:29 - Trial = 4099/30000 | Total reward = 56.20
2022-01-26 14:16:44.089 | DEBUG    | __main__:trials:24 - Trial = 4100/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.090 | DEBUG    | __main__:trials:29 - Trial = 4100/30000 | Total reward = 42.03
2022-01-26 14:16:44.094 | DEBUG    | __main__:trials:24 - Trial = 4101/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.094 | DEBUG    | __main__:trials:29 - Trial = 4101/30000 | Total reward = 45.66
2022-01-26 14:16:44.099 | DEBUG    | __main__:trials:26 - Trial = 4102/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.100 | DEBUG    | __main__:trials:29 - Trial = 4102/30000 | Total reward = 27.34
2022-01-26 14:16:44.104 | DEBUG    | __main__:trials:24 - Trial = 4103/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.105 | DEBUG    | __main__:trials:29 - Trial = 4103/30000 | Total reward = 45.94
2022-01-26 14:16:44.109 | DEBUG    | __main__:trials:24 - Trial = 4104/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.110 | DEBUG    | __main__:trials:29 - Trial = 4104/30000 | Total reward = 43.79
2022-01-26 14:16:44.113 | DEBUG    | __main__:trials:24 - Trial = 4105/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.114 | DEBUG    | __main__:trials:29 - Trial = 4105/30000 | Total reward = 43.27
2022-01-26 14:16:44.117 | DEBUG    | __main__:trials:24 - Trial = 4106/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.119 | DEBUG    | __main__:trials:29 - Trial = 4106/30000 | Total reward = 43.14
2022-01-26 14:16:44.122 | DEBUG    | __main__:trials:24 - Trial = 4107/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.124 | DEBUG    | __main__:trials:29 - Trial = 4107/30000 | Total reward = 42.07
2022-01-26 14:16:44.128 | DEBUG    | __main__:trials:24 - Trial = 4108/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.129 | DEBUG    | __main__:trials:29 - Trial = 4108/30000 | Total reward = 43.32
2022-01-26 14:16:44.133 | DEBUG    | __main__:trials:24 - Trial = 4109/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.135 | DEBUG    | __main__:trials:29 - Trial = 4109/30000 | Total reward = 23.91
2022-01-26 14:16:44.138 | DEBUG    | __main__:trials:26 - Trial = 4110/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.139 | DEBUG    | __main__:trials:29 - Trial = 4110/30000 | Total reward = 18.49
2022-01-26 14:16:44.143 | DEBUG    | __main__:trials:24 - Trial = 4111/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.145 | DEBUG    | __main__:trials:29 - Trial = 4111/30000 | Total reward = 54.18
2022-01-26 14:16:44.148 | DEBUG    | __main__:trials:24 - Trial = 4112/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.150 | DEBUG    | __main__:trials:29 - Trial = 4112/30000 | Total reward = 43.13
2022-01-26 14:16:44.153 | DEBUG    | __main__:trials:24 - Trial = 4113/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.155 | DEBUG    | __main__:trials:29 - Trial = 4113/30000 | Total reward = 48.58
2022-01-26 14:16:44.159 | DEBUG    | __main__:trials:24 - Trial = 4114/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.159 | DEBUG    | __main__:trials:29 - Trial = 4114/30000 | Total reward = 46.16
2022-01-26 14:16:44.163 | DEBUG    | __main__:trials:24 - Trial = 4115/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.164 | DEBUG    | __main__:trials:29 - Trial = 4115/30000 | Total reward = 45.69
2022-01-26 14:16:44.168 | DEBUG    | __main__:trials:24 - Trial = 4116/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.169 | DEBUG    | __main__:trials:29 - Trial = 4116/30000 | Total reward = 49.77
2022-01-26 14:16:44.172 | DEBUG    | __main__:trials:24 - Trial = 4117/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.173 | DEBUG    | __main__:trials:29 - Trial = 4117/30000 | Total reward = 51.04
2022-01-26 14:16:44.177 | DEBUG    | __main__:trials:24 - Trial = 4118/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.178 | DEBUG    | __main__:trials:29 - Trial = 4118/30000 | Total reward = 44.05
2022-01-26 14:16:44.181 | DEBUG    | __main__:trials:24 - Trial = 4119/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.182 | DEBUG    | __main__:trials:29 - Trial = 4119/30000 | Total reward = 44.42
2022-01-26 14:16:44.186 | DEBUG    | __main__:trials:24 - Trial = 4120/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.188 | DEBUG    | __main__:trials:29 - Trial = 4120/30000 | Total reward = 41.19
2022-01-26 14:16:44.191 | DEBUG    | __main__:trials:24 - Trial = 4121/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.192 | DEBUG    | __main__:trials:29 - Trial = 4121/30000 | Total reward = 43.23
2022-01-26 14:16:44.196 | DEBUG    | __main__:trials:24 - Trial = 4122/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.197 | DEBUG    | __main__:trials:29 - Trial = 4122/30000 | Total reward = 29.46
2022-01-26 14:16:44.200 | DEBUG    | __main__:trials:24 - Trial = 4123/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.202 | DEBUG    | __main__:trials:29 - Trial = 4123/30000 | Total reward = 34.09
2022-01-26 14:16:44.205 | DEBUG    | __main__:trials:24 - Trial = 4124/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.206 | DEBUG    | __main__:trials:29 - Trial = 4124/30000 | Total reward = 48.22
2022-01-26 14:16:44.210 | DEBUG    | __main__:trials:24 - Trial = 4125/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.210 | DEBUG    | __main__:trials:29 - Trial = 4125/30000 | Total reward = 51.03
2022-01-26 14:16:44.214 | DEBUG    | __main__:trials:24 - Trial = 4126/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.215 | DEBUG    | __main__:trials:29 - Trial = 4126/30000 | Total reward = 53.49
2022-01-26 14:16:44.218 | DEBUG    | __main__:trials:24 - Trial = 4127/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.219 | DEBUG    | __main__:trials:29 - Trial = 4127/30000 | Total reward = 41.28
2022-01-26 14:16:44.222 | DEBUG    | __main__:trials:24 - Trial = 4128/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.223 | DEBUG    | __main__:trials:29 - Trial = 4128/30000 | Total reward = 40.83
2022-01-26 14:16:44.227 | DEBUG    | __main__:trials:24 - Trial = 4129/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.228 | DEBUG    | __main__:trials:29 - Trial = 4129/30000 | Total reward = 49.38
2022-01-26 14:16:44.232 | DEBUG    | __main__:trials:24 - Trial = 4130/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.234 | DEBUG    | __main__:trials:29 - Trial = 4130/30000 | Total reward = 51.47
2022-01-26 14:16:44.237 | DEBUG    | __main__:trials:24 - Trial = 4131/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.237 | DEBUG    | __main__:trials:29 - Trial = 4131/30000 | Total reward = 35.97
2022-01-26 14:16:44.241 | DEBUG    | __main__:trials:24 - Trial = 4132/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.242 | DEBUG    | __main__:trials:29 - Trial = 4132/30000 | Total reward = 35.25
2022-01-26 14:16:44.246 | DEBUG    | __main__:trials:24 - Trial = 4133/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.248 | DEBUG    | __main__:trials:29 - Trial = 4133/30000 | Total reward = 48.54
2022-01-26 14:16:44.251 | DEBUG    | __main__:trials:24 - Trial = 4134/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.252 | DEBUG    | __main__:trials:29 - Trial = 4134/30000 | Total reward = 50.10
2022-01-26 14:16:44.255 | DEBUG    | __main__:trials:24 - Trial = 4135/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.257 | DEBUG    | __main__:trials:29 - Trial = 4135/30000 | Total reward = 47.36
2022-01-26 14:16:44.260 | DEBUG    | __main__:trials:24 - Trial = 4136/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.262 | DEBUG    | __main__:trials:29 - Trial = 4136/30000 | Total reward = 25.27
2022-01-26 14:16:44.265 | DEBUG    | __main__:trials:24 - Trial = 4137/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.267 | DEBUG    | __main__:trials:29 - Trial = 4137/30000 | Total reward = 38.31
2022-01-26 14:16:44.270 | DEBUG    | __main__:trials:24 - Trial = 4138/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.271 | DEBUG    | __main__:trials:29 - Trial = 4138/30000 | Total reward = 43.11
2022-01-26 14:16:44.274 | DEBUG    | __main__:trials:24 - Trial = 4139/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.275 | DEBUG    | __main__:trials:29 - Trial = 4139/30000 | Total reward = 29.24
2022-01-26 14:16:44.278 | DEBUG    | __main__:trials:26 - Trial = 4140/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.279 | DEBUG    | __main__:trials:29 - Trial = 4140/30000 | Total reward = 25.37
2022-01-26 14:16:44.283 | DEBUG    | __main__:trials:24 - Trial = 4141/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.284 | DEBUG    | __main__:trials:29 - Trial = 4141/30000 | Total reward = 49.21
2022-01-26 14:16:44.287 | DEBUG    | __main__:trials:24 - Trial = 4142/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.289 | DEBUG    | __main__:trials:29 - Trial = 4142/30000 | Total reward = 52.08
2022-01-26 14:16:44.292 | DEBUG    | __main__:trials:24 - Trial = 4143/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.294 | DEBUG    | __main__:trials:29 - Trial = 4143/30000 | Total reward = 46.02
2022-01-26 14:16:44.296 | DEBUG    | __main__:trials:26 - Trial = 4144/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.297 | DEBUG    | __main__:trials:29 - Trial = 4144/30000 | Total reward = 10.21
2022-01-26 14:16:44.300 | DEBUG    | __main__:trials:24 - Trial = 4145/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.301 | DEBUG    | __main__:trials:29 - Trial = 4145/30000 | Total reward = 41.20
2022-01-26 14:16:44.305 | DEBUG    | __main__:trials:24 - Trial = 4146/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.305 | DEBUG    | __main__:trials:29 - Trial = 4146/30000 | Total reward = 47.33
2022-01-26 14:16:44.309 | DEBUG    | __main__:trials:26 - Trial = 4147/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.309 | DEBUG    | __main__:trials:29 - Trial = 4147/30000 | Total reward = 32.82
2022-01-26 14:16:44.313 | DEBUG    | __main__:trials:24 - Trial = 4148/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.314 | DEBUG    | __main__:trials:29 - Trial = 4148/30000 | Total reward = 43.19
2022-01-26 14:16:44.317 | DEBUG    | __main__:trials:24 - Trial = 4149/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.318 | DEBUG    | __main__:trials:29 - Trial = 4149/30000 | Total reward = 42.87
2022-01-26 14:16:44.321 | DEBUG    | __main__:trials:24 - Trial = 4150/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.322 | DEBUG    | __main__:trials:29 - Trial = 4150/30000 | Total reward = 46.86
2022-01-26 14:16:44.325 | DEBUG    | __main__:trials:24 - Trial = 4151/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.326 | DEBUG    | __main__:trials:29 - Trial = 4151/30000 | Total reward = 43.45
2022-01-26 14:16:44.330 | DEBUG    | __main__:trials:24 - Trial = 4152/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.332 | DEBUG    | __main__:trials:29 - Trial = 4152/30000 | Total reward = 49.57
2022-01-26 14:16:44.335 | DEBUG    | __main__:trials:24 - Trial = 4153/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.336 | DEBUG    | __main__:trials:29 - Trial = 4153/30000 | Total reward = 54.62
2022-01-26 14:16:44.339 | DEBUG    | __main__:trials:24 - Trial = 4154/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.341 | DEBUG    | __main__:trials:29 - Trial = 4154/30000 | Total reward = 54.20
2022-01-26 14:16:44.344 | DEBUG    | __main__:trials:24 - Trial = 4155/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.345 | DEBUG    | __main__:trials:29 - Trial = 4155/30000 | Total reward = 45.02
2022-01-26 14:16:44.349 | DEBUG    | __main__:trials:24 - Trial = 4156/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.350 | DEBUG    | __main__:trials:29 - Trial = 4156/30000 | Total reward = 47.02
2022-01-26 14:16:44.353 | DEBUG    | __main__:trials:24 - Trial = 4157/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.354 | DEBUG    | __main__:trials:29 - Trial = 4157/30000 | Total reward = 32.62
2022-01-26 14:16:44.358 | DEBUG    | __main__:trials:24 - Trial = 4158/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.359 | DEBUG    | __main__:trials:29 - Trial = 4158/30000 | Total reward = 40.63
2022-01-26 14:16:44.362 | DEBUG    | __main__:trials:24 - Trial = 4159/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.363 | DEBUG    | __main__:trials:29 - Trial = 4159/30000 | Total reward = 33.11
2022-01-26 14:16:44.366 | DEBUG    | __main__:trials:24 - Trial = 4160/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.368 | DEBUG    | __main__:trials:29 - Trial = 4160/30000 | Total reward = 46.55
2022-01-26 14:16:44.372 | DEBUG    | __main__:trials:24 - Trial = 4161/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.373 | DEBUG    | __main__:trials:29 - Trial = 4161/30000 | Total reward = 41.25
2022-01-26 14:16:44.377 | DEBUG    | __main__:trials:24 - Trial = 4162/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.377 | DEBUG    | __main__:trials:29 - Trial = 4162/30000 | Total reward = 43.90
2022-01-26 14:16:44.381 | DEBUG    | __main__:trials:24 - Trial = 4163/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.381 | DEBUG    | __main__:trials:29 - Trial = 4163/30000 | Total reward = 49.33
2022-01-26 14:16:44.384 | DEBUG    | __main__:trials:24 - Trial = 4164/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.385 | DEBUG    | __main__:trials:29 - Trial = 4164/30000 | Total reward = 36.71
2022-01-26 14:16:44.389 | DEBUG    | __main__:trials:24 - Trial = 4165/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.390 | DEBUG    | __main__:trials:29 - Trial = 4165/30000 | Total reward = 49.45
2022-01-26 14:16:44.395 | DEBUG    | __main__:trials:24 - Trial = 4166/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.396 | DEBUG    | __main__:trials:29 - Trial = 4166/30000 | Total reward = 48.20
2022-01-26 14:16:44.399 | DEBUG    | __main__:trials:24 - Trial = 4167/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.401 | DEBUG    | __main__:trials:29 - Trial = 4167/30000 | Total reward = 49.97
2022-01-26 14:16:44.405 | DEBUG    | __main__:trials:24 - Trial = 4168/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.405 | DEBUG    | __main__:trials:29 - Trial = 4168/30000 | Total reward = 51.91
2022-01-26 14:16:44.409 | DEBUG    | __main__:trials:24 - Trial = 4169/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.410 | DEBUG    | __main__:trials:29 - Trial = 4169/30000 | Total reward = 47.69
2022-01-26 14:16:44.414 | DEBUG    | __main__:trials:24 - Trial = 4170/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.415 | DEBUG    | __main__:trials:29 - Trial = 4170/30000 | Total reward = 51.38
2022-01-26 14:16:44.419 | DEBUG    | __main__:trials:24 - Trial = 4171/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.421 | DEBUG    | __main__:trials:29 - Trial = 4171/30000 | Total reward = 50.03
2022-01-26 14:16:44.424 | DEBUG    | __main__:trials:24 - Trial = 4172/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.426 | DEBUG    | __main__:trials:29 - Trial = 4172/30000 | Total reward = 51.51
2022-01-26 14:16:44.430 | DEBUG    | __main__:trials:24 - Trial = 4173/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.430 | DEBUG    | __main__:trials:29 - Trial = 4173/30000 | Total reward = 50.69
2022-01-26 14:16:44.435 | DEBUG    | __main__:trials:24 - Trial = 4174/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.436 | DEBUG    | __main__:trials:29 - Trial = 4174/30000 | Total reward = 48.48
2022-01-26 14:16:44.440 | DEBUG    | __main__:trials:24 - Trial = 4175/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.441 | DEBUG    | __main__:trials:29 - Trial = 4175/30000 | Total reward = 49.89
2022-01-26 14:16:44.445 | DEBUG    | __main__:trials:24 - Trial = 4176/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.447 | DEBUG    | __main__:trials:29 - Trial = 4176/30000 | Total reward = 27.37
2022-01-26 14:16:44.450 | DEBUG    | __main__:trials:24 - Trial = 4177/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.452 | DEBUG    | __main__:trials:29 - Trial = 4177/30000 | Total reward = 41.53
2022-01-26 14:16:44.456 | DEBUG    | __main__:trials:24 - Trial = 4178/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.457 | DEBUG    | __main__:trials:29 - Trial = 4178/30000 | Total reward = 47.89
2022-01-26 14:16:44.460 | DEBUG    | __main__:trials:24 - Trial = 4179/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.461 | DEBUG    | __main__:trials:29 - Trial = 4179/30000 | Total reward = 42.38
2022-01-26 14:16:44.465 | DEBUG    | __main__:trials:24 - Trial = 4180/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.465 | DEBUG    | __main__:trials:29 - Trial = 4180/30000 | Total reward = 51.19
2022-01-26 14:16:44.469 | DEBUG    | __main__:trials:24 - Trial = 4181/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.471 | DEBUG    | __main__:trials:29 - Trial = 4181/30000 | Total reward = 47.42
2022-01-26 14:16:44.474 | DEBUG    | __main__:trials:24 - Trial = 4182/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.475 | DEBUG    | __main__:trials:29 - Trial = 4182/30000 | Total reward = 49.02
2022-01-26 14:16:44.478 | DEBUG    | __main__:trials:24 - Trial = 4183/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.480 | DEBUG    | __main__:trials:29 - Trial = 4183/30000 | Total reward = 49.67
2022-01-26 14:16:44.484 | DEBUG    | __main__:trials:24 - Trial = 4184/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.485 | DEBUG    | __main__:trials:29 - Trial = 4184/30000 | Total reward = 50.88
2022-01-26 14:16:44.489 | DEBUG    | __main__:trials:24 - Trial = 4185/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.490 | DEBUG    | __main__:trials:29 - Trial = 4185/30000 | Total reward = 49.07
2022-01-26 14:16:44.494 | DEBUG    | __main__:trials:24 - Trial = 4186/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.496 | DEBUG    | __main__:trials:29 - Trial = 4186/30000 | Total reward = 49.73
2022-01-26 14:16:44.499 | DEBUG    | __main__:trials:24 - Trial = 4187/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.501 | DEBUG    | __main__:trials:29 - Trial = 4187/30000 | Total reward = 47.81
2022-01-26 14:16:44.505 | DEBUG    | __main__:trials:24 - Trial = 4188/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.506 | DEBUG    | __main__:trials:29 - Trial = 4188/30000 | Total reward = 56.65
2022-01-26 14:16:44.510 | DEBUG    | __main__:trials:24 - Trial = 4189/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.512 | DEBUG    | __main__:trials:29 - Trial = 4189/30000 | Total reward = 52.35
2022-01-26 14:16:44.516 | DEBUG    | __main__:trials:24 - Trial = 4190/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.517 | DEBUG    | __main__:trials:29 - Trial = 4190/30000 | Total reward = 50.31
2022-01-26 14:16:44.520 | DEBUG    | __main__:trials:24 - Trial = 4191/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.522 | DEBUG    | __main__:trials:29 - Trial = 4191/30000 | Total reward = 35.47
2022-01-26 14:16:44.525 | DEBUG    | __main__:trials:24 - Trial = 4192/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.526 | DEBUG    | __main__:trials:29 - Trial = 4192/30000 | Total reward = 28.99
2022-01-26 14:16:44.529 | DEBUG    | __main__:trials:24 - Trial = 4193/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.531 | DEBUG    | __main__:trials:29 - Trial = 4193/30000 | Total reward = 47.87
2022-01-26 14:16:44.533 | DEBUG    | __main__:trials:26 - Trial = 4194/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.534 | DEBUG    | __main__:trials:29 - Trial = 4194/30000 | Total reward = 27.64
2022-01-26 14:16:44.537 | DEBUG    | __main__:trials:24 - Trial = 4195/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.539 | DEBUG    | __main__:trials:29 - Trial = 4195/30000 | Total reward = 34.49
2022-01-26 14:16:44.543 | DEBUG    | __main__:trials:24 - Trial = 4196/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.544 | DEBUG    | __main__:trials:29 - Trial = 4196/30000 | Total reward = 44.64
2022-01-26 14:16:44.547 | DEBUG    | __main__:trials:24 - Trial = 4197/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.549 | DEBUG    | __main__:trials:29 - Trial = 4197/30000 | Total reward = 43.96
2022-01-26 14:16:44.553 | DEBUG    | __main__:trials:24 - Trial = 4198/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.555 | DEBUG    | __main__:trials:29 - Trial = 4198/30000 | Total reward = 43.99
2022-01-26 14:16:44.558 | DEBUG    | __main__:trials:24 - Trial = 4199/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.559 | DEBUG    | __main__:trials:29 - Trial = 4199/30000 | Total reward = 46.70
2022-01-26 14:16:44.563 | DEBUG    | __main__:trials:24 - Trial = 4200/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.565 | DEBUG    | __main__:trials:29 - Trial = 4200/30000 | Total reward = 51.15
2022-01-26 14:16:44.568 | DEBUG    | __main__:trials:24 - Trial = 4201/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.570 | DEBUG    | __main__:trials:29 - Trial = 4201/30000 | Total reward = 56.91
2022-01-26 14:16:44.574 | DEBUG    | __main__:trials:24 - Trial = 4202/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.576 | DEBUG    | __main__:trials:29 - Trial = 4202/30000 | Total reward = 51.38
2022-01-26 14:16:44.579 | DEBUG    | __main__:trials:24 - Trial = 4203/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.580 | DEBUG    | __main__:trials:29 - Trial = 4203/30000 | Total reward = 42.56
2022-01-26 14:16:44.583 | DEBUG    | __main__:trials:24 - Trial = 4204/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.585 | DEBUG    | __main__:trials:29 - Trial = 4204/30000 | Total reward = 54.61
2022-01-26 14:16:44.588 | DEBUG    | __main__:trials:26 - Trial = 4205/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.590 | DEBUG    | __main__:trials:29 - Trial = 4205/30000 | Total reward = 38.41
2022-01-26 14:16:44.594 | DEBUG    | __main__:trials:24 - Trial = 4206/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.595 | DEBUG    | __main__:trials:29 - Trial = 4206/30000 | Total reward = 49.67
2022-01-26 14:16:44.599 | DEBUG    | __main__:trials:24 - Trial = 4207/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.600 | DEBUG    | __main__:trials:29 - Trial = 4207/30000 | Total reward = 31.06
2022-01-26 14:16:44.605 | DEBUG    | __main__:trials:24 - Trial = 4208/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.606 | DEBUG    | __main__:trials:29 - Trial = 4208/30000 | Total reward = 37.34
2022-01-26 14:16:44.610 | DEBUG    | __main__:trials:24 - Trial = 4209/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.610 | DEBUG    | __main__:trials:29 - Trial = 4209/30000 | Total reward = 62.44
2022-01-26 14:16:44.614 | DEBUG    | __main__:trials:24 - Trial = 4210/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.615 | DEBUG    | __main__:trials:29 - Trial = 4210/30000 | Total reward = 48.02
2022-01-26 14:16:44.619 | DEBUG    | __main__:trials:24 - Trial = 4211/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.621 | DEBUG    | __main__:trials:29 - Trial = 4211/30000 | Total reward = 34.44
2022-01-26 14:16:44.624 | DEBUG    | __main__:trials:24 - Trial = 4212/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.626 | DEBUG    | __main__:trials:29 - Trial = 4212/30000 | Total reward = 22.54
2022-01-26 14:16:44.630 | DEBUG    | __main__:trials:24 - Trial = 4213/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.631 | DEBUG    | __main__:trials:29 - Trial = 4213/30000 | Total reward = 47.99
2022-01-26 14:16:44.635 | DEBUG    | __main__:trials:24 - Trial = 4214/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.636 | DEBUG    | __main__:trials:29 - Trial = 4214/30000 | Total reward = 46.62
2022-01-26 14:16:44.640 | DEBUG    | __main__:trials:24 - Trial = 4215/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.641 | DEBUG    | __main__:trials:29 - Trial = 4215/30000 | Total reward = 57.95
2022-01-26 14:16:44.645 | DEBUG    | __main__:trials:24 - Trial = 4216/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.646 | DEBUG    | __main__:trials:29 - Trial = 4216/30000 | Total reward = 49.04
2022-01-26 14:16:44.650 | DEBUG    | __main__:trials:24 - Trial = 4217/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.651 | DEBUG    | __main__:trials:29 - Trial = 4217/30000 | Total reward = 47.43
2022-01-26 14:16:44.655 | DEBUG    | __main__:trials:24 - Trial = 4218/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.657 | DEBUG    | __main__:trials:29 - Trial = 4218/30000 | Total reward = 46.39
2022-01-26 14:16:44.659 | DEBUG    | __main__:trials:26 - Trial = 4219/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.661 | DEBUG    | __main__:trials:29 - Trial = 4219/30000 | Total reward = 12.39
2022-01-26 14:16:44.664 | DEBUG    | __main__:trials:24 - Trial = 4220/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.666 | DEBUG    | __main__:trials:29 - Trial = 4220/30000 | Total reward = 35.63
2022-01-26 14:16:44.670 | DEBUG    | __main__:trials:24 - Trial = 4221/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.671 | DEBUG    | __main__:trials:29 - Trial = 4221/30000 | Total reward = 22.38
2022-01-26 14:16:44.675 | DEBUG    | __main__:trials:24 - Trial = 4222/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.676 | DEBUG    | __main__:trials:29 - Trial = 4222/30000 | Total reward = 46.66
2022-01-26 14:16:44.680 | DEBUG    | __main__:trials:24 - Trial = 4223/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.681 | DEBUG    | __main__:trials:29 - Trial = 4223/30000 | Total reward = 48.29
2022-01-26 14:16:44.685 | DEBUG    | __main__:trials:24 - Trial = 4224/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.687 | DEBUG    | __main__:trials:29 - Trial = 4224/30000 | Total reward = 51.21
2022-01-26 14:16:44.691 | DEBUG    | __main__:trials:24 - Trial = 4225/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.692 | DEBUG    | __main__:trials:29 - Trial = 4225/30000 | Total reward = 49.63
2022-01-26 14:16:44.696 | DEBUG    | __main__:trials:24 - Trial = 4226/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.698 | DEBUG    | __main__:trials:29 - Trial = 4226/30000 | Total reward = 49.92
2022-01-26 14:16:44.701 | DEBUG    | __main__:trials:24 - Trial = 4227/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.703 | DEBUG    | __main__:trials:29 - Trial = 4227/30000 | Total reward = 42.88
2022-01-26 14:16:44.707 | DEBUG    | __main__:trials:24 - Trial = 4228/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.708 | DEBUG    | __main__:trials:29 - Trial = 4228/30000 | Total reward = 58.14
2022-01-26 14:16:44.712 | DEBUG    | __main__:trials:24 - Trial = 4229/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.713 | DEBUG    | __main__:trials:29 - Trial = 4229/30000 | Total reward = 51.07
2022-01-26 14:16:44.716 | DEBUG    | __main__:trials:24 - Trial = 4230/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.718 | DEBUG    | __main__:trials:29 - Trial = 4230/30000 | Total reward = 49.73
2022-01-26 14:16:44.722 | DEBUG    | __main__:trials:24 - Trial = 4231/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.723 | DEBUG    | __main__:trials:29 - Trial = 4231/30000 | Total reward = 43.22
2022-01-26 14:16:44.727 | DEBUG    | __main__:trials:24 - Trial = 4232/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.728 | DEBUG    | __main__:trials:29 - Trial = 4232/30000 | Total reward = 51.64
2022-01-26 14:16:44.732 | DEBUG    | __main__:trials:24 - Trial = 4233/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.734 | DEBUG    | __main__:trials:29 - Trial = 4233/30000 | Total reward = 26.80
2022-01-26 14:16:44.737 | DEBUG    | __main__:trials:24 - Trial = 4234/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.739 | DEBUG    | __main__:trials:29 - Trial = 4234/30000 | Total reward = 47.03
2022-01-26 14:16:44.742 | DEBUG    | __main__:trials:24 - Trial = 4235/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.744 | DEBUG    | __main__:trials:29 - Trial = 4235/30000 | Total reward = 50.03
2022-01-26 14:16:44.748 | DEBUG    | __main__:trials:24 - Trial = 4236/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.750 | DEBUG    | __main__:trials:29 - Trial = 4236/30000 | Total reward = 46.93
2022-01-26 14:16:44.753 | DEBUG    | __main__:trials:24 - Trial = 4237/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.754 | DEBUG    | __main__:trials:29 - Trial = 4237/30000 | Total reward = 43.13
2022-01-26 14:16:44.758 | DEBUG    | __main__:trials:26 - Trial = 4238/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.760 | DEBUG    | __main__:trials:29 - Trial = 4238/30000 | Total reward = 40.49
2022-01-26 14:16:44.764 | DEBUG    | __main__:trials:24 - Trial = 4239/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.765 | DEBUG    | __main__:trials:29 - Trial = 4239/30000 | Total reward = 49.52
2022-01-26 14:16:44.768 | DEBUG    | __main__:trials:24 - Trial = 4240/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.769 | DEBUG    | __main__:trials:29 - Trial = 4240/30000 | Total reward = 41.13
2022-01-26 14:16:44.773 | DEBUG    | __main__:trials:24 - Trial = 4241/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.773 | DEBUG    | __main__:trials:29 - Trial = 4241/30000 | Total reward = 51.61
2022-01-26 14:16:44.776 | DEBUG    | __main__:trials:26 - Trial = 4242/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.777 | DEBUG    | __main__:trials:29 - Trial = 4242/30000 | Total reward = 19.83
2022-01-26 14:16:44.780 | DEBUG    | __main__:trials:24 - Trial = 4243/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.782 | DEBUG    | __main__:trials:29 - Trial = 4243/30000 | Total reward = 45.21
2022-01-26 14:16:44.786 | DEBUG    | __main__:trials:24 - Trial = 4244/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.787 | DEBUG    | __main__:trials:29 - Trial = 4244/30000 | Total reward = 46.06
2022-01-26 14:16:44.791 | DEBUG    | __main__:trials:24 - Trial = 4245/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.792 | DEBUG    | __main__:trials:29 - Trial = 4245/30000 | Total reward = 52.62
2022-01-26 14:16:44.796 | DEBUG    | __main__:trials:24 - Trial = 4246/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.798 | DEBUG    | __main__:trials:29 - Trial = 4246/30000 | Total reward = 48.13
2022-01-26 14:16:44.802 | DEBUG    | __main__:trials:24 - Trial = 4247/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.803 | DEBUG    | __main__:trials:29 - Trial = 4247/30000 | Total reward = 47.59
2022-01-26 14:16:44.807 | DEBUG    | __main__:trials:24 - Trial = 4248/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.807 | DEBUG    | __main__:trials:29 - Trial = 4248/30000 | Total reward = 49.67
2022-01-26 14:16:44.812 | DEBUG    | __main__:trials:24 - Trial = 4249/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.813 | DEBUG    | __main__:trials:29 - Trial = 4249/30000 | Total reward = 26.43
2022-01-26 14:16:44.816 | DEBUG    | __main__:trials:24 - Trial = 4250/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.818 | DEBUG    | __main__:trials:29 - Trial = 4250/30000 | Total reward = 51.97
2022-01-26 14:16:44.822 | DEBUG    | __main__:trials:24 - Trial = 4251/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.823 | DEBUG    | __main__:trials:29 - Trial = 4251/30000 | Total reward = 31.70
2022-01-26 14:16:44.827 | DEBUG    | __main__:trials:24 - Trial = 4252/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.829 | DEBUG    | __main__:trials:29 - Trial = 4252/30000 | Total reward = 47.68
2022-01-26 14:16:44.832 | DEBUG    | __main__:trials:24 - Trial = 4253/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.834 | DEBUG    | __main__:trials:29 - Trial = 4253/30000 | Total reward = 51.38
2022-01-26 14:16:44.838 | DEBUG    | __main__:trials:24 - Trial = 4254/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.838 | DEBUG    | __main__:trials:29 - Trial = 4254/30000 | Total reward = 42.18
2022-01-26 14:16:44.843 | DEBUG    | __main__:trials:24 - Trial = 4255/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.844 | DEBUG    | __main__:trials:29 - Trial = 4255/30000 | Total reward = 47.96
2022-01-26 14:16:44.848 | DEBUG    | __main__:trials:24 - Trial = 4256/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.849 | DEBUG    | __main__:trials:29 - Trial = 4256/30000 | Total reward = 36.69
2022-01-26 14:16:44.853 | DEBUG    | __main__:trials:24 - Trial = 4257/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.854 | DEBUG    | __main__:trials:29 - Trial = 4257/30000 | Total reward = 47.70
2022-01-26 14:16:44.857 | DEBUG    | __main__:trials:24 - Trial = 4258/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.858 | DEBUG    | __main__:trials:29 - Trial = 4258/30000 | Total reward = 50.16
2022-01-26 14:16:44.861 | DEBUG    | __main__:trials:24 - Trial = 4259/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.863 | DEBUG    | __main__:trials:29 - Trial = 4259/30000 | Total reward = 45.32
2022-01-26 14:16:44.865 | DEBUG    | __main__:trials:26 - Trial = 4260/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.867 | DEBUG    | __main__:trials:29 - Trial = 4260/30000 | Total reward = 19.67
2022-01-26 14:16:44.870 | DEBUG    | __main__:trials:24 - Trial = 4261/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.871 | DEBUG    | __main__:trials:29 - Trial = 4261/30000 | Total reward = 51.14
2022-01-26 14:16:44.874 | DEBUG    | __main__:trials:24 - Trial = 4262/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.875 | DEBUG    | __main__:trials:29 - Trial = 4262/30000 | Total reward = 47.23
2022-01-26 14:16:44.878 | DEBUG    | __main__:trials:24 - Trial = 4263/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.880 | DEBUG    | __main__:trials:29 - Trial = 4263/30000 | Total reward = 64.70
2022-01-26 14:16:44.883 | DEBUG    | __main__:trials:24 - Trial = 4264/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.885 | DEBUG    | __main__:trials:29 - Trial = 4264/30000 | Total reward = 52.22
2022-01-26 14:16:44.888 | DEBUG    | __main__:trials:24 - Trial = 4265/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.890 | DEBUG    | __main__:trials:29 - Trial = 4265/30000 | Total reward = 43.14
2022-01-26 14:16:44.893 | DEBUG    | __main__:trials:26 - Trial = 4266/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.894 | DEBUG    | __main__:trials:29 - Trial = 4266/30000 | Total reward = 26.19
2022-01-26 14:16:44.897 | DEBUG    | __main__:trials:26 - Trial = 4267/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:44.899 | DEBUG    | __main__:trials:29 - Trial = 4267/30000 | Total reward = 18.85
2022-01-26 14:16:44.903 | DEBUG    | __main__:trials:24 - Trial = 4268/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.903 | DEBUG    | __main__:trials:29 - Trial = 4268/30000 | Total reward = 50.92
2022-01-26 14:16:44.908 | DEBUG    | __main__:trials:24 - Trial = 4269/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.909 | DEBUG    | __main__:trials:29 - Trial = 4269/30000 | Total reward = 45.46
2022-01-26 14:16:44.912 | DEBUG    | __main__:trials:24 - Trial = 4270/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.915 | DEBUG    | __main__:trials:29 - Trial = 4270/30000 | Total reward = 46.70
2022-01-26 14:16:44.918 | DEBUG    | __main__:trials:24 - Trial = 4271/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.920 | DEBUG    | __main__:trials:29 - Trial = 4271/30000 | Total reward = 62.94
2022-01-26 14:16:44.923 | DEBUG    | __main__:trials:24 - Trial = 4272/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.925 | DEBUG    | __main__:trials:29 - Trial = 4272/30000 | Total reward = 27.21
2022-01-26 14:16:44.928 | DEBUG    | __main__:trials:24 - Trial = 4273/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.930 | DEBUG    | __main__:trials:29 - Trial = 4273/30000 | Total reward = 44.36
2022-01-26 14:16:44.934 | DEBUG    | __main__:trials:24 - Trial = 4274/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.935 | DEBUG    | __main__:trials:29 - Trial = 4274/30000 | Total reward = 49.71
2022-01-26 14:16:44.939 | DEBUG    | __main__:trials:24 - Trial = 4275/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.941 | DEBUG    | __main__:trials:29 - Trial = 4275/30000 | Total reward = 28.51
2022-01-26 14:16:44.944 | DEBUG    | __main__:trials:24 - Trial = 4276/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.946 | DEBUG    | __main__:trials:29 - Trial = 4276/30000 | Total reward = 52.78
2022-01-26 14:16:44.950 | DEBUG    | __main__:trials:24 - Trial = 4277/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.951 | DEBUG    | __main__:trials:29 - Trial = 4277/30000 | Total reward = 51.89
2022-01-26 14:16:44.955 | DEBUG    | __main__:trials:24 - Trial = 4278/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.957 | DEBUG    | __main__:trials:29 - Trial = 4278/30000 | Total reward = 48.22
2022-01-26 14:16:44.960 | DEBUG    | __main__:trials:24 - Trial = 4279/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.961 | DEBUG    | __main__:trials:29 - Trial = 4279/30000 | Total reward = 53.65
2022-01-26 14:16:44.966 | DEBUG    | __main__:trials:24 - Trial = 4280/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.967 | DEBUG    | __main__:trials:29 - Trial = 4280/30000 | Total reward = 51.37
2022-01-26 14:16:44.970 | DEBUG    | __main__:trials:24 - Trial = 4281/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.972 | DEBUG    | __main__:trials:29 - Trial = 4281/30000 | Total reward = 51.98
2022-01-26 14:16:44.976 | DEBUG    | __main__:trials:24 - Trial = 4282/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.977 | DEBUG    | __main__:trials:29 - Trial = 4282/30000 | Total reward = 53.68
2022-01-26 14:16:44.981 | DEBUG    | __main__:trials:24 - Trial = 4283/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.983 | DEBUG    | __main__:trials:29 - Trial = 4283/30000 | Total reward = 47.06
2022-01-26 14:16:44.986 | DEBUG    | __main__:trials:24 - Trial = 4284/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.988 | DEBUG    | __main__:trials:29 - Trial = 4284/30000 | Total reward = 34.56
2022-01-26 14:16:44.992 | DEBUG    | __main__:trials:24 - Trial = 4285/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.993 | DEBUG    | __main__:trials:29 - Trial = 4285/30000 | Total reward = 57.01
2022-01-26 14:16:44.997 | DEBUG    | __main__:trials:24 - Trial = 4286/30000 | Max number of steps (20) reached
2022-01-26 14:16:44.998 | DEBUG    | __main__:trials:29 - Trial = 4286/30000 | Total reward = 51.94
2022-01-26 14:16:45.002 | DEBUG    | __main__:trials:24 - Trial = 4287/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.003 | DEBUG    | __main__:trials:29 - Trial = 4287/30000 | Total reward = 36.53
2022-01-26 14:16:45.007 | DEBUG    | __main__:trials:24 - Trial = 4288/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.009 | DEBUG    | __main__:trials:29 - Trial = 4288/30000 | Total reward = 53.08
2022-01-26 14:16:45.012 | DEBUG    | __main__:trials:24 - Trial = 4289/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.014 | DEBUG    | __main__:trials:29 - Trial = 4289/30000 | Total reward = 44.94
2022-01-26 14:16:45.017 | DEBUG    | __main__:trials:24 - Trial = 4290/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.019 | DEBUG    | __main__:trials:29 - Trial = 4290/30000 | Total reward = 54.38
2022-01-26 14:16:45.022 | DEBUG    | __main__:trials:24 - Trial = 4291/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.024 | DEBUG    | __main__:trials:29 - Trial = 4291/30000 | Total reward = 43.29
2022-01-26 14:16:45.027 | DEBUG    | __main__:trials:24 - Trial = 4292/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.029 | DEBUG    | __main__:trials:29 - Trial = 4292/30000 | Total reward = 43.26
2022-01-26 14:16:45.032 | DEBUG    | __main__:trials:24 - Trial = 4293/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.034 | DEBUG    | __main__:trials:29 - Trial = 4293/30000 | Total reward = 49.12
2022-01-26 14:16:45.037 | DEBUG    | __main__:trials:24 - Trial = 4294/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.039 | DEBUG    | __main__:trials:29 - Trial = 4294/30000 | Total reward = 52.35
2022-01-26 14:16:45.042 | DEBUG    | __main__:trials:24 - Trial = 4295/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.044 | DEBUG    | __main__:trials:29 - Trial = 4295/30000 | Total reward = 32.71
2022-01-26 14:16:45.047 | DEBUG    | __main__:trials:24 - Trial = 4296/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.049 | DEBUG    | __main__:trials:29 - Trial = 4296/30000 | Total reward = 48.24
2022-01-26 14:16:45.052 | DEBUG    | __main__:trials:24 - Trial = 4297/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.053 | DEBUG    | __main__:trials:29 - Trial = 4297/30000 | Total reward = 51.09
2022-01-26 14:16:45.057 | DEBUG    | __main__:trials:24 - Trial = 4298/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.058 | DEBUG    | __main__:trials:29 - Trial = 4298/30000 | Total reward = 45.52
2022-01-26 14:16:45.062 | DEBUG    | __main__:trials:24 - Trial = 4299/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.063 | DEBUG    | __main__:trials:29 - Trial = 4299/30000 | Total reward = 49.09
2022-01-26 14:16:45.067 | DEBUG    | __main__:trials:24 - Trial = 4300/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.069 | DEBUG    | __main__:trials:29 - Trial = 4300/30000 | Total reward = 50.15
2022-01-26 14:16:45.072 | DEBUG    | __main__:trials:24 - Trial = 4301/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.074 | DEBUG    | __main__:trials:29 - Trial = 4301/30000 | Total reward = 46.99
2022-01-26 14:16:45.078 | DEBUG    | __main__:trials:24 - Trial = 4302/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.079 | DEBUG    | __main__:trials:29 - Trial = 4302/30000 | Total reward = 53.81
2022-01-26 14:16:45.082 | DEBUG    | __main__:trials:24 - Trial = 4303/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.083 | DEBUG    | __main__:trials:29 - Trial = 4303/30000 | Total reward = 38.79
2022-01-26 14:16:45.087 | DEBUG    | __main__:trials:24 - Trial = 4304/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.089 | DEBUG    | __main__:trials:29 - Trial = 4304/30000 | Total reward = 47.92
2022-01-26 14:16:45.092 | DEBUG    | __main__:trials:24 - Trial = 4305/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.094 | DEBUG    | __main__:trials:29 - Trial = 4305/30000 | Total reward = 49.70
2022-01-26 14:16:45.098 | DEBUG    | __main__:trials:24 - Trial = 4306/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.099 | DEBUG    | __main__:trials:29 - Trial = 4306/30000 | Total reward = 52.61
2022-01-26 14:16:45.103 | DEBUG    | __main__:trials:24 - Trial = 4307/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.104 | DEBUG    | __main__:trials:29 - Trial = 4307/30000 | Total reward = 28.78
2022-01-26 14:16:45.108 | DEBUG    | __main__:trials:24 - Trial = 4308/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.110 | DEBUG    | __main__:trials:29 - Trial = 4308/30000 | Total reward = 51.00
2022-01-26 14:16:45.113 | DEBUG    | __main__:trials:24 - Trial = 4309/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.115 | DEBUG    | __main__:trials:29 - Trial = 4309/30000 | Total reward = 49.76
2022-01-26 14:16:45.118 | DEBUG    | __main__:trials:24 - Trial = 4310/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.120 | DEBUG    | __main__:trials:29 - Trial = 4310/30000 | Total reward = 51.89
2022-01-26 14:16:45.124 | DEBUG    | __main__:trials:24 - Trial = 4311/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.125 | DEBUG    | __main__:trials:29 - Trial = 4311/30000 | Total reward = 56.19
2022-01-26 14:16:45.129 | DEBUG    | __main__:trials:24 - Trial = 4312/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.130 | DEBUG    | __main__:trials:29 - Trial = 4312/30000 | Total reward = 47.48
2022-01-26 14:16:45.133 | DEBUG    | __main__:trials:26 - Trial = 4313/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.134 | DEBUG    | __main__:trials:29 - Trial = 4313/30000 | Total reward = 24.03
2022-01-26 14:16:45.138 | DEBUG    | __main__:trials:24 - Trial = 4314/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.139 | DEBUG    | __main__:trials:29 - Trial = 4314/30000 | Total reward = 54.62
2022-01-26 14:16:45.143 | DEBUG    | __main__:trials:26 - Trial = 4315/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.144 | DEBUG    | __main__:trials:29 - Trial = 4315/30000 | Total reward = 33.89
2022-01-26 14:16:45.148 | DEBUG    | __main__:trials:24 - Trial = 4316/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.150 | DEBUG    | __main__:trials:29 - Trial = 4316/30000 | Total reward = 41.61
2022-01-26 14:16:45.153 | DEBUG    | __main__:trials:24 - Trial = 4317/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.155 | DEBUG    | __main__:trials:29 - Trial = 4317/30000 | Total reward = 50.24
2022-01-26 14:16:45.159 | DEBUG    | __main__:trials:24 - Trial = 4318/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.160 | DEBUG    | __main__:trials:29 - Trial = 4318/30000 | Total reward = 50.45
2022-01-26 14:16:45.164 | DEBUG    | __main__:trials:24 - Trial = 4319/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.166 | DEBUG    | __main__:trials:29 - Trial = 4319/30000 | Total reward = 50.02
2022-01-26 14:16:45.169 | DEBUG    | __main__:trials:24 - Trial = 4320/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.171 | DEBUG    | __main__:trials:29 - Trial = 4320/30000 | Total reward = 45.41
2022-01-26 14:16:45.174 | DEBUG    | __main__:trials:24 - Trial = 4321/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.176 | DEBUG    | __main__:trials:29 - Trial = 4321/30000 | Total reward = 48.82
2022-01-26 14:16:45.179 | DEBUG    | __main__:trials:24 - Trial = 4322/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.181 | DEBUG    | __main__:trials:29 - Trial = 4322/30000 | Total reward = 48.93
2022-01-26 14:16:45.184 | DEBUG    | __main__:trials:24 - Trial = 4323/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.186 | DEBUG    | __main__:trials:29 - Trial = 4323/30000 | Total reward = 49.23
2022-01-26 14:16:45.189 | DEBUG    | __main__:trials:26 - Trial = 4324/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.190 | DEBUG    | __main__:trials:29 - Trial = 4324/30000 | Total reward = 27.49
2022-01-26 14:16:45.194 | DEBUG    | __main__:trials:24 - Trial = 4325/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.195 | DEBUG    | __main__:trials:29 - Trial = 4325/30000 | Total reward = 27.08
2022-01-26 14:16:45.198 | DEBUG    | __main__:trials:24 - Trial = 4326/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.200 | DEBUG    | __main__:trials:29 - Trial = 4326/30000 | Total reward = 32.93
2022-01-26 14:16:45.204 | DEBUG    | __main__:trials:24 - Trial = 4327/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.206 | DEBUG    | __main__:trials:29 - Trial = 4327/30000 | Total reward = 43.89
2022-01-26 14:16:45.209 | DEBUG    | __main__:trials:24 - Trial = 4328/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.211 | DEBUG    | __main__:trials:29 - Trial = 4328/30000 | Total reward = 47.12
2022-01-26 14:16:45.214 | DEBUG    | __main__:trials:24 - Trial = 4329/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.216 | DEBUG    | __main__:trials:29 - Trial = 4329/30000 | Total reward = 60.87
2022-01-26 14:16:45.219 | DEBUG    | __main__:trials:24 - Trial = 4330/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.221 | DEBUG    | __main__:trials:29 - Trial = 4330/30000 | Total reward = 38.17
2022-01-26 14:16:45.224 | DEBUG    | __main__:trials:24 - Trial = 4331/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.226 | DEBUG    | __main__:trials:29 - Trial = 4331/30000 | Total reward = 51.21
2022-01-26 14:16:45.229 | DEBUG    | __main__:trials:24 - Trial = 4332/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.231 | DEBUG    | __main__:trials:29 - Trial = 4332/30000 | Total reward = 53.41
2022-01-26 14:16:45.234 | DEBUG    | __main__:trials:24 - Trial = 4333/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.236 | DEBUG    | __main__:trials:29 - Trial = 4333/30000 | Total reward = 38.13
2022-01-26 14:16:45.240 | DEBUG    | __main__:trials:24 - Trial = 4334/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.241 | DEBUG    | __main__:trials:29 - Trial = 4334/30000 | Total reward = 50.25
2022-01-26 14:16:45.244 | DEBUG    | __main__:trials:24 - Trial = 4335/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.246 | DEBUG    | __main__:trials:29 - Trial = 4335/30000 | Total reward = 47.96
2022-01-26 14:16:45.250 | DEBUG    | __main__:trials:24 - Trial = 4336/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.251 | DEBUG    | __main__:trials:29 - Trial = 4336/30000 | Total reward = 52.35
2022-01-26 14:16:45.255 | DEBUG    | __main__:trials:24 - Trial = 4337/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.256 | DEBUG    | __main__:trials:29 - Trial = 4337/30000 | Total reward = 54.92
2022-01-26 14:16:45.260 | DEBUG    | __main__:trials:24 - Trial = 4338/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.261 | DEBUG    | __main__:trials:29 - Trial = 4338/30000 | Total reward = 44.69
2022-01-26 14:16:45.265 | DEBUG    | __main__:trials:24 - Trial = 4339/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.267 | DEBUG    | __main__:trials:29 - Trial = 4339/30000 | Total reward = 48.18
2022-01-26 14:16:45.270 | DEBUG    | __main__:trials:24 - Trial = 4340/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.272 | DEBUG    | __main__:trials:29 - Trial = 4340/30000 | Total reward = 34.33
2022-01-26 14:16:45.275 | DEBUG    | __main__:trials:24 - Trial = 4341/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.277 | DEBUG    | __main__:trials:29 - Trial = 4341/30000 | Total reward = 52.58
2022-01-26 14:16:45.280 | DEBUG    | __main__:trials:24 - Trial = 4342/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.281 | DEBUG    | __main__:trials:29 - Trial = 4342/30000 | Total reward = 41.14
2022-01-26 14:16:45.285 | DEBUG    | __main__:trials:24 - Trial = 4343/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.286 | DEBUG    | __main__:trials:29 - Trial = 4343/30000 | Total reward = 55.84
2022-01-26 14:16:45.290 | DEBUG    | __main__:trials:24 - Trial = 4344/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.292 | DEBUG    | __main__:trials:29 - Trial = 4344/30000 | Total reward = 48.58
2022-01-26 14:16:45.296 | DEBUG    | __main__:trials:24 - Trial = 4345/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.297 | DEBUG    | __main__:trials:29 - Trial = 4345/30000 | Total reward = 49.43
2022-01-26 14:16:45.300 | DEBUG    | __main__:trials:24 - Trial = 4346/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.302 | DEBUG    | __main__:trials:29 - Trial = 4346/30000 | Total reward = 49.91
2022-01-26 14:16:45.305 | DEBUG    | __main__:trials:24 - Trial = 4347/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.306 | DEBUG    | __main__:trials:29 - Trial = 4347/30000 | Total reward = 38.77
2022-01-26 14:16:45.310 | DEBUG    | __main__:trials:24 - Trial = 4348/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.312 | DEBUG    | __main__:trials:29 - Trial = 4348/30000 | Total reward = 60.13
2022-01-26 14:16:45.315 | DEBUG    | __main__:trials:24 - Trial = 4349/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.317 | DEBUG    | __main__:trials:29 - Trial = 4349/30000 | Total reward = 28.12
2022-01-26 14:16:45.320 | DEBUG    | __main__:trials:24 - Trial = 4350/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.322 | DEBUG    | __main__:trials:29 - Trial = 4350/30000 | Total reward = 57.33
2022-01-26 14:16:45.325 | DEBUG    | __main__:trials:24 - Trial = 4351/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.327 | DEBUG    | __main__:trials:29 - Trial = 4351/30000 | Total reward = 47.40
2022-01-26 14:16:45.330 | DEBUG    | __main__:trials:24 - Trial = 4352/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.332 | DEBUG    | __main__:trials:29 - Trial = 4352/30000 | Total reward = 54.27
2022-01-26 14:16:45.336 | DEBUG    | __main__:trials:24 - Trial = 4353/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.337 | DEBUG    | __main__:trials:29 - Trial = 4353/30000 | Total reward = 46.89
2022-01-26 14:16:45.341 | DEBUG    | __main__:trials:24 - Trial = 4354/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.343 | DEBUG    | __main__:trials:29 - Trial = 4354/30000 | Total reward = 51.66
2022-01-26 14:16:45.346 | DEBUG    | __main__:trials:24 - Trial = 4355/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.348 | DEBUG    | __main__:trials:29 - Trial = 4355/30000 | Total reward = 43.72
2022-01-26 14:16:45.351 | DEBUG    | __main__:trials:24 - Trial = 4356/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.353 | DEBUG    | __main__:trials:29 - Trial = 4356/30000 | Total reward = 49.63
2022-01-26 14:16:45.357 | DEBUG    | __main__:trials:24 - Trial = 4357/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.358 | DEBUG    | __main__:trials:29 - Trial = 4357/30000 | Total reward = 49.07
2022-01-26 14:16:45.361 | DEBUG    | __main__:trials:24 - Trial = 4358/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.362 | DEBUG    | __main__:trials:29 - Trial = 4358/30000 | Total reward = 49.43
2022-01-26 14:16:45.366 | DEBUG    | __main__:trials:24 - Trial = 4359/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.368 | DEBUG    | __main__:trials:29 - Trial = 4359/30000 | Total reward = 28.62
2022-01-26 14:16:45.371 | DEBUG    | __main__:trials:24 - Trial = 4360/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.373 | DEBUG    | __main__:trials:29 - Trial = 4360/30000 | Total reward = 46.78
2022-01-26 14:16:45.376 | DEBUG    | __main__:trials:24 - Trial = 4361/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.377 | DEBUG    | __main__:trials:29 - Trial = 4361/30000 | Total reward = 28.40
2022-01-26 14:16:45.381 | DEBUG    | __main__:trials:24 - Trial = 4362/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.381 | DEBUG    | __main__:trials:29 - Trial = 4362/30000 | Total reward = 44.50
2022-01-26 14:16:45.385 | DEBUG    | __main__:trials:24 - Trial = 4363/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.385 | DEBUG    | __main__:trials:29 - Trial = 4363/30000 | Total reward = 47.18
2022-01-26 14:16:45.389 | DEBUG    | __main__:trials:24 - Trial = 4364/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.391 | DEBUG    | __main__:trials:29 - Trial = 4364/30000 | Total reward = 52.00
2022-01-26 14:16:45.394 | DEBUG    | __main__:trials:24 - Trial = 4365/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.396 | DEBUG    | __main__:trials:29 - Trial = 4365/30000 | Total reward = 49.09
2022-01-26 14:16:45.399 | DEBUG    | __main__:trials:26 - Trial = 4366/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.401 | DEBUG    | __main__:trials:29 - Trial = 4366/30000 | Total reward = 31.69
2022-01-26 14:16:45.404 | DEBUG    | __main__:trials:24 - Trial = 4367/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.405 | DEBUG    | __main__:trials:29 - Trial = 4367/30000 | Total reward = 53.89
2022-01-26 14:16:45.409 | DEBUG    | __main__:trials:24 - Trial = 4368/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.410 | DEBUG    | __main__:trials:29 - Trial = 4368/30000 | Total reward = 39.89
2022-01-26 14:16:45.414 | DEBUG    | __main__:trials:24 - Trial = 4369/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.415 | DEBUG    | __main__:trials:29 - Trial = 4369/30000 | Total reward = 25.05
2022-01-26 14:16:45.418 | DEBUG    | __main__:trials:24 - Trial = 4370/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.420 | DEBUG    | __main__:trials:29 - Trial = 4370/30000 | Total reward = 55.08
2022-01-26 14:16:45.424 | DEBUG    | __main__:trials:24 - Trial = 4371/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.425 | DEBUG    | __main__:trials:29 - Trial = 4371/30000 | Total reward = 23.28
2022-01-26 14:16:45.429 | DEBUG    | __main__:trials:24 - Trial = 4372/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.430 | DEBUG    | __main__:trials:29 - Trial = 4372/30000 | Total reward = 44.81
2022-01-26 14:16:45.434 | DEBUG    | __main__:trials:24 - Trial = 4373/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.435 | DEBUG    | __main__:trials:29 - Trial = 4373/30000 | Total reward = 45.17
2022-01-26 14:16:45.439 | DEBUG    | __main__:trials:24 - Trial = 4374/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.440 | DEBUG    | __main__:trials:29 - Trial = 4374/30000 | Total reward = 22.28
2022-01-26 14:16:45.443 | DEBUG    | __main__:trials:24 - Trial = 4375/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.445 | DEBUG    | __main__:trials:29 - Trial = 4375/30000 | Total reward = 49.43
2022-01-26 14:16:45.448 | DEBUG    | __main__:trials:24 - Trial = 4376/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.450 | DEBUG    | __main__:trials:29 - Trial = 4376/30000 | Total reward = 25.98
2022-01-26 14:16:45.453 | DEBUG    | __main__:trials:24 - Trial = 4377/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.453 | DEBUG    | __main__:trials:29 - Trial = 4377/30000 | Total reward = 51.02
2022-01-26 14:16:45.458 | DEBUG    | __main__:trials:24 - Trial = 4378/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.458 | DEBUG    | __main__:trials:29 - Trial = 4378/30000 | Total reward = 36.12
2022-01-26 14:16:45.462 | DEBUG    | __main__:trials:24 - Trial = 4379/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.464 | DEBUG    | __main__:trials:29 - Trial = 4379/30000 | Total reward = 53.08
2022-01-26 14:16:45.467 | DEBUG    | __main__:trials:24 - Trial = 4380/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.469 | DEBUG    | __main__:trials:29 - Trial = 4380/30000 | Total reward = 52.09
2022-01-26 14:16:45.472 | DEBUG    | __main__:trials:26 - Trial = 4381/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.474 | DEBUG    | __main__:trials:29 - Trial = 4381/30000 | Total reward = 26.62
2022-01-26 14:16:45.477 | DEBUG    | __main__:trials:24 - Trial = 4382/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.479 | DEBUG    | __main__:trials:29 - Trial = 4382/30000 | Total reward = 31.91
2022-01-26 14:16:45.482 | DEBUG    | __main__:trials:24 - Trial = 4383/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.483 | DEBUG    | __main__:trials:29 - Trial = 4383/30000 | Total reward = 47.46
2022-01-26 14:16:45.487 | DEBUG    | __main__:trials:24 - Trial = 4384/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.489 | DEBUG    | __main__:trials:29 - Trial = 4384/30000 | Total reward = 49.43
2022-01-26 14:16:45.492 | DEBUG    | __main__:trials:24 - Trial = 4385/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.493 | DEBUG    | __main__:trials:29 - Trial = 4385/30000 | Total reward = 62.27
2022-01-26 14:16:45.497 | DEBUG    | __main__:trials:24 - Trial = 4386/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.499 | DEBUG    | __main__:trials:29 - Trial = 4386/30000 | Total reward = 57.87
2022-01-26 14:16:45.502 | DEBUG    | __main__:trials:24 - Trial = 4387/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.503 | DEBUG    | __main__:trials:29 - Trial = 4387/30000 | Total reward = 57.67
2022-01-26 14:16:45.507 | DEBUG    | __main__:trials:24 - Trial = 4388/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.509 | DEBUG    | __main__:trials:29 - Trial = 4388/30000 | Total reward = 62.72
2022-01-26 14:16:45.511 | DEBUG    | __main__:trials:24 - Trial = 4389/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.513 | DEBUG    | __main__:trials:29 - Trial = 4389/30000 | Total reward = 29.19
2022-01-26 14:16:45.516 | DEBUG    | __main__:trials:24 - Trial = 4390/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.518 | DEBUG    | __main__:trials:29 - Trial = 4390/30000 | Total reward = 24.09
2022-01-26 14:16:45.521 | DEBUG    | __main__:trials:24 - Trial = 4391/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.522 | DEBUG    | __main__:trials:29 - Trial = 4391/30000 | Total reward = 56.79
2022-01-26 14:16:45.527 | DEBUG    | __main__:trials:24 - Trial = 4392/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.528 | DEBUG    | __main__:trials:29 - Trial = 4392/30000 | Total reward = 50.02
2022-01-26 14:16:45.532 | DEBUG    | __main__:trials:24 - Trial = 4393/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.533 | DEBUG    | __main__:trials:29 - Trial = 4393/30000 | Total reward = 28.70
2022-01-26 14:16:45.537 | DEBUG    | __main__:trials:24 - Trial = 4394/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.538 | DEBUG    | __main__:trials:29 - Trial = 4394/30000 | Total reward = 50.27
2022-01-26 14:16:45.542 | DEBUG    | __main__:trials:24 - Trial = 4395/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.543 | DEBUG    | __main__:trials:29 - Trial = 4395/30000 | Total reward = 43.57
2022-01-26 14:16:45.546 | DEBUG    | __main__:trials:24 - Trial = 4396/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.546 | DEBUG    | __main__:trials:29 - Trial = 4396/30000 | Total reward = 51.26
2022-01-26 14:16:45.550 | DEBUG    | __main__:trials:24 - Trial = 4397/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.551 | DEBUG    | __main__:trials:29 - Trial = 4397/30000 | Total reward = 49.43
2022-01-26 14:16:45.554 | DEBUG    | __main__:trials:24 - Trial = 4398/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.556 | DEBUG    | __main__:trials:29 - Trial = 4398/30000 | Total reward = 26.19
2022-01-26 14:16:45.559 | DEBUG    | __main__:trials:24 - Trial = 4399/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.561 | DEBUG    | __main__:trials:29 - Trial = 4399/30000 | Total reward = 41.92
2022-01-26 14:16:45.564 | DEBUG    | __main__:trials:24 - Trial = 4400/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.566 | DEBUG    | __main__:trials:29 - Trial = 4400/30000 | Total reward = 36.36
2022-01-26 14:16:45.569 | DEBUG    | __main__:trials:24 - Trial = 4401/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.570 | DEBUG    | __main__:trials:29 - Trial = 4401/30000 | Total reward = 9.28
2022-01-26 14:16:45.574 | DEBUG    | __main__:trials:24 - Trial = 4402/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.576 | DEBUG    | __main__:trials:29 - Trial = 4402/30000 | Total reward = 45.69
2022-01-26 14:16:45.580 | DEBUG    | __main__:trials:24 - Trial = 4403/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.580 | DEBUG    | __main__:trials:29 - Trial = 4403/30000 | Total reward = 45.51
2022-01-26 14:16:45.584 | DEBUG    | __main__:trials:24 - Trial = 4404/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.586 | DEBUG    | __main__:trials:29 - Trial = 4404/30000 | Total reward = 24.54
2022-01-26 14:16:45.589 | DEBUG    | __main__:trials:24 - Trial = 4405/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.591 | DEBUG    | __main__:trials:29 - Trial = 4405/30000 | Total reward = 57.46
2022-01-26 14:16:45.594 | DEBUG    | __main__:trials:24 - Trial = 4406/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.596 | DEBUG    | __main__:trials:29 - Trial = 4406/30000 | Total reward = 48.62
2022-01-26 14:16:45.599 | DEBUG    | __main__:trials:24 - Trial = 4407/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.601 | DEBUG    | __main__:trials:29 - Trial = 4407/30000 | Total reward = 61.52
2022-01-26 14:16:45.604 | DEBUG    | __main__:trials:26 - Trial = 4408/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.605 | DEBUG    | __main__:trials:29 - Trial = 4408/30000 | Total reward = 24.63
2022-01-26 14:16:45.608 | DEBUG    | __main__:trials:24 - Trial = 4409/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.610 | DEBUG    | __main__:trials:29 - Trial = 4409/30000 | Total reward = 41.10
2022-01-26 14:16:45.613 | DEBUG    | __main__:trials:24 - Trial = 4410/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.615 | DEBUG    | __main__:trials:29 - Trial = 4410/30000 | Total reward = 49.76
2022-01-26 14:16:45.619 | DEBUG    | __main__:trials:24 - Trial = 4411/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.620 | DEBUG    | __main__:trials:29 - Trial = 4411/30000 | Total reward = 40.79
2022-01-26 14:16:45.624 | DEBUG    | __main__:trials:24 - Trial = 4412/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.625 | DEBUG    | __main__:trials:29 - Trial = 4412/30000 | Total reward = 49.43
2022-01-26 14:16:45.629 | DEBUG    | __main__:trials:24 - Trial = 4413/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.630 | DEBUG    | __main__:trials:29 - Trial = 4413/30000 | Total reward = 45.47
2022-01-26 14:16:45.634 | DEBUG    | __main__:trials:24 - Trial = 4414/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.635 | DEBUG    | __main__:trials:29 - Trial = 4414/30000 | Total reward = 48.28
2022-01-26 14:16:45.639 | DEBUG    | __main__:trials:24 - Trial = 4415/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.639 | DEBUG    | __main__:trials:29 - Trial = 4415/30000 | Total reward = 53.07
2022-01-26 14:16:45.644 | DEBUG    | __main__:trials:24 - Trial = 4416/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.645 | DEBUG    | __main__:trials:29 - Trial = 4416/30000 | Total reward = 59.86
2022-01-26 14:16:45.648 | DEBUG    | __main__:trials:24 - Trial = 4417/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.649 | DEBUG    | __main__:trials:29 - Trial = 4417/30000 | Total reward = 33.36
2022-01-26 14:16:45.653 | DEBUG    | __main__:trials:24 - Trial = 4418/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.653 | DEBUG    | __main__:trials:29 - Trial = 4418/30000 | Total reward = 54.19
2022-01-26 14:16:45.657 | DEBUG    | __main__:trials:24 - Trial = 4419/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.658 | DEBUG    | __main__:trials:29 - Trial = 4419/30000 | Total reward = 50.35
2022-01-26 14:16:45.661 | DEBUG    | __main__:trials:24 - Trial = 4420/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.662 | DEBUG    | __main__:trials:29 - Trial = 4420/30000 | Total reward = 45.52
2022-01-26 14:16:45.666 | DEBUG    | __main__:trials:24 - Trial = 4421/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.668 | DEBUG    | __main__:trials:29 - Trial = 4421/30000 | Total reward = 49.28
2022-01-26 14:16:45.671 | DEBUG    | __main__:trials:24 - Trial = 4422/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.672 | DEBUG    | __main__:trials:29 - Trial = 4422/30000 | Total reward = 50.78
2022-01-26 14:16:45.676 | DEBUG    | __main__:trials:24 - Trial = 4423/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.677 | DEBUG    | __main__:trials:29 - Trial = 4423/30000 | Total reward = 38.23
2022-01-26 14:16:45.681 | DEBUG    | __main__:trials:24 - Trial = 4424/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.683 | DEBUG    | __main__:trials:29 - Trial = 4424/30000 | Total reward = 51.37
2022-01-26 14:16:45.686 | DEBUG    | __main__:trials:24 - Trial = 4425/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.688 | DEBUG    | __main__:trials:29 - Trial = 4425/30000 | Total reward = 25.45
2022-01-26 14:16:45.691 | DEBUG    | __main__:trials:24 - Trial = 4426/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.693 | DEBUG    | __main__:trials:29 - Trial = 4426/30000 | Total reward = 58.51
2022-01-26 14:16:45.696 | DEBUG    | __main__:trials:24 - Trial = 4427/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.697 | DEBUG    | __main__:trials:29 - Trial = 4427/30000 | Total reward = 45.23
2022-01-26 14:16:45.700 | DEBUG    | __main__:trials:24 - Trial = 4428/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.702 | DEBUG    | __main__:trials:29 - Trial = 4428/30000 | Total reward = 47.61
2022-01-26 14:16:45.706 | DEBUG    | __main__:trials:24 - Trial = 4429/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.706 | DEBUG    | __main__:trials:29 - Trial = 4429/30000 | Total reward = 49.67
2022-01-26 14:16:45.711 | DEBUG    | __main__:trials:24 - Trial = 4430/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.713 | DEBUG    | __main__:trials:29 - Trial = 4430/30000 | Total reward = 39.32
2022-01-26 14:16:45.715 | DEBUG    | __main__:trials:24 - Trial = 4431/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.717 | DEBUG    | __main__:trials:29 - Trial = 4431/30000 | Total reward = 29.42
2022-01-26 14:16:45.721 | DEBUG    | __main__:trials:24 - Trial = 4432/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.722 | DEBUG    | __main__:trials:29 - Trial = 4432/30000 | Total reward = 47.95
2022-01-26 14:16:45.725 | DEBUG    | __main__:trials:24 - Trial = 4433/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.727 | DEBUG    | __main__:trials:29 - Trial = 4433/30000 | Total reward = 47.87
2022-01-26 14:16:45.731 | DEBUG    | __main__:trials:24 - Trial = 4434/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.733 | DEBUG    | __main__:trials:29 - Trial = 4434/30000 | Total reward = 53.18
2022-01-26 14:16:45.735 | DEBUG    | __main__:trials:24 - Trial = 4435/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.737 | DEBUG    | __main__:trials:29 - Trial = 4435/30000 | Total reward = 52.21
2022-01-26 14:16:45.741 | DEBUG    | __main__:trials:24 - Trial = 4436/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.741 | DEBUG    | __main__:trials:29 - Trial = 4436/30000 | Total reward = 49.72
2022-01-26 14:16:45.746 | DEBUG    | __main__:trials:24 - Trial = 4437/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.747 | DEBUG    | __main__:trials:29 - Trial = 4437/30000 | Total reward = 39.54
2022-01-26 14:16:45.751 | DEBUG    | __main__:trials:24 - Trial = 4438/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.752 | DEBUG    | __main__:trials:29 - Trial = 4438/30000 | Total reward = 63.87
2022-01-26 14:16:45.756 | DEBUG    | __main__:trials:24 - Trial = 4439/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.757 | DEBUG    | __main__:trials:29 - Trial = 4439/30000 | Total reward = 47.36
2022-01-26 14:16:45.761 | DEBUG    | __main__:trials:24 - Trial = 4440/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.762 | DEBUG    | __main__:trials:29 - Trial = 4440/30000 | Total reward = 47.57
2022-01-26 14:16:45.766 | DEBUG    | __main__:trials:24 - Trial = 4441/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.768 | DEBUG    | __main__:trials:29 - Trial = 4441/30000 | Total reward = 50.46
2022-01-26 14:16:45.771 | DEBUG    | __main__:trials:24 - Trial = 4442/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.772 | DEBUG    | __main__:trials:29 - Trial = 4442/30000 | Total reward = 47.49
2022-01-26 14:16:45.775 | DEBUG    | __main__:trials:24 - Trial = 4443/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.776 | DEBUG    | __main__:trials:29 - Trial = 4443/30000 | Total reward = 60.85
2022-01-26 14:16:45.779 | DEBUG    | __main__:trials:24 - Trial = 4444/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.780 | DEBUG    | __main__:trials:29 - Trial = 4444/30000 | Total reward = 41.20
2022-01-26 14:16:45.783 | DEBUG    | __main__:trials:24 - Trial = 4445/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.784 | DEBUG    | __main__:trials:29 - Trial = 4445/30000 | Total reward = 48.49
2022-01-26 14:16:45.791 | DEBUG    | __main__:trials:24 - Trial = 4446/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.792 | DEBUG    | __main__:trials:29 - Trial = 4446/30000 | Total reward = 46.82
2022-01-26 14:16:45.795 | DEBUG    | __main__:trials:24 - Trial = 4447/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.795 | DEBUG    | __main__:trials:29 - Trial = 4447/30000 | Total reward = 56.07
2022-01-26 14:16:45.799 | DEBUG    | __main__:trials:24 - Trial = 4448/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.799 | DEBUG    | __main__:trials:29 - Trial = 4448/30000 | Total reward = 52.35
2022-01-26 14:16:45.803 | DEBUG    | __main__:trials:24 - Trial = 4449/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.804 | DEBUG    | __main__:trials:29 - Trial = 4449/30000 | Total reward = 55.43
2022-01-26 14:16:45.807 | DEBUG    | __main__:trials:24 - Trial = 4450/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.808 | DEBUG    | __main__:trials:29 - Trial = 4450/30000 | Total reward = 47.82
2022-01-26 14:16:45.811 | DEBUG    | __main__:trials:24 - Trial = 4451/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.812 | DEBUG    | __main__:trials:29 - Trial = 4451/30000 | Total reward = 46.70
2022-01-26 14:16:45.815 | DEBUG    | __main__:trials:24 - Trial = 4452/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.816 | DEBUG    | __main__:trials:29 - Trial = 4452/30000 | Total reward = 38.09
2022-01-26 14:16:45.819 | DEBUG    | __main__:trials:24 - Trial = 4453/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.820 | DEBUG    | __main__:trials:29 - Trial = 4453/30000 | Total reward = 54.32
2022-01-26 14:16:45.823 | DEBUG    | __main__:trials:24 - Trial = 4454/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.823 | DEBUG    | __main__:trials:29 - Trial = 4454/30000 | Total reward = 50.30
2022-01-26 14:16:45.826 | DEBUG    | __main__:trials:24 - Trial = 4455/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.827 | DEBUG    | __main__:trials:29 - Trial = 4455/30000 | Total reward = 50.71
2022-01-26 14:16:45.830 | DEBUG    | __main__:trials:24 - Trial = 4456/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.831 | DEBUG    | __main__:trials:29 - Trial = 4456/30000 | Total reward = 46.91
2022-01-26 14:16:45.834 | DEBUG    | __main__:trials:24 - Trial = 4457/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.835 | DEBUG    | __main__:trials:29 - Trial = 4457/30000 | Total reward = 54.40
2022-01-26 14:16:45.838 | DEBUG    | __main__:trials:24 - Trial = 4458/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.839 | DEBUG    | __main__:trials:29 - Trial = 4458/30000 | Total reward = 51.10
2022-01-26 14:16:45.842 | DEBUG    | __main__:trials:24 - Trial = 4459/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.843 | DEBUG    | __main__:trials:29 - Trial = 4459/30000 | Total reward = 34.53
2022-01-26 14:16:45.846 | DEBUG    | __main__:trials:24 - Trial = 4460/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.846 | DEBUG    | __main__:trials:29 - Trial = 4460/30000 | Total reward = 38.61
2022-01-26 14:16:45.849 | DEBUG    | __main__:trials:24 - Trial = 4461/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.850 | DEBUG    | __main__:trials:29 - Trial = 4461/30000 | Total reward = 49.33
2022-01-26 14:16:45.853 | DEBUG    | __main__:trials:24 - Trial = 4462/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.854 | DEBUG    | __main__:trials:29 - Trial = 4462/30000 | Total reward = 49.77
2022-01-26 14:16:45.857 | DEBUG    | __main__:trials:24 - Trial = 4463/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.858 | DEBUG    | __main__:trials:29 - Trial = 4463/30000 | Total reward = 28.74
2022-01-26 14:16:45.861 | DEBUG    | __main__:trials:24 - Trial = 4464/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.862 | DEBUG    | __main__:trials:29 - Trial = 4464/30000 | Total reward = 29.21
2022-01-26 14:16:45.865 | DEBUG    | __main__:trials:24 - Trial = 4465/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.866 | DEBUG    | __main__:trials:29 - Trial = 4465/30000 | Total reward = 56.85
2022-01-26 14:16:45.869 | DEBUG    | __main__:trials:24 - Trial = 4466/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.869 | DEBUG    | __main__:trials:29 - Trial = 4466/30000 | Total reward = 51.01
2022-01-26 14:16:45.872 | DEBUG    | __main__:trials:24 - Trial = 4467/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.873 | DEBUG    | __main__:trials:29 - Trial = 4467/30000 | Total reward = 38.11
2022-01-26 14:16:45.876 | DEBUG    | __main__:trials:24 - Trial = 4468/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.877 | DEBUG    | __main__:trials:29 - Trial = 4468/30000 | Total reward = 48.68
2022-01-26 14:16:45.880 | DEBUG    | __main__:trials:24 - Trial = 4469/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.880 | DEBUG    | __main__:trials:29 - Trial = 4469/30000 | Total reward = 43.29
2022-01-26 14:16:45.883 | DEBUG    | __main__:trials:24 - Trial = 4470/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.884 | DEBUG    | __main__:trials:29 - Trial = 4470/30000 | Total reward = 58.40
2022-01-26 14:16:45.887 | DEBUG    | __main__:trials:24 - Trial = 4471/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.888 | DEBUG    | __main__:trials:29 - Trial = 4471/30000 | Total reward = 59.94
2022-01-26 14:16:45.891 | DEBUG    | __main__:trials:24 - Trial = 4472/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.892 | DEBUG    | __main__:trials:29 - Trial = 4472/30000 | Total reward = 48.10
2022-01-26 14:16:45.895 | DEBUG    | __main__:trials:24 - Trial = 4473/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.895 | DEBUG    | __main__:trials:29 - Trial = 4473/30000 | Total reward = 47.05
2022-01-26 14:16:45.898 | DEBUG    | __main__:trials:24 - Trial = 4474/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.899 | DEBUG    | __main__:trials:29 - Trial = 4474/30000 | Total reward = 49.57
2022-01-26 14:16:45.902 | DEBUG    | __main__:trials:24 - Trial = 4475/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.903 | DEBUG    | __main__:trials:29 - Trial = 4475/30000 | Total reward = 44.91
2022-01-26 14:16:45.906 | DEBUG    | __main__:trials:24 - Trial = 4476/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.907 | DEBUG    | __main__:trials:29 - Trial = 4476/30000 | Total reward = 43.93
2022-01-26 14:16:45.910 | DEBUG    | __main__:trials:24 - Trial = 4477/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.910 | DEBUG    | __main__:trials:29 - Trial = 4477/30000 | Total reward = 48.06
2022-01-26 14:16:45.913 | DEBUG    | __main__:trials:24 - Trial = 4478/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.914 | DEBUG    | __main__:trials:29 - Trial = 4478/30000 | Total reward = 59.43
2022-01-26 14:16:45.917 | DEBUG    | __main__:trials:26 - Trial = 4479/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.918 | DEBUG    | __main__:trials:29 - Trial = 4479/30000 | Total reward = 31.84
2022-01-26 14:16:45.921 | DEBUG    | __main__:trials:24 - Trial = 4480/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.921 | DEBUG    | __main__:trials:29 - Trial = 4480/30000 | Total reward = 30.13
2022-01-26 14:16:45.924 | DEBUG    | __main__:trials:24 - Trial = 4481/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.925 | DEBUG    | __main__:trials:29 - Trial = 4481/30000 | Total reward = 54.04
2022-01-26 14:16:45.928 | DEBUG    | __main__:trials:24 - Trial = 4482/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.929 | DEBUG    | __main__:trials:29 - Trial = 4482/30000 | Total reward = 52.49
2022-01-26 14:16:45.932 | DEBUG    | __main__:trials:24 - Trial = 4483/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.932 | DEBUG    | __main__:trials:29 - Trial = 4483/30000 | Total reward = 51.60
2022-01-26 14:16:45.935 | DEBUG    | __main__:trials:24 - Trial = 4484/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.936 | DEBUG    | __main__:trials:29 - Trial = 4484/30000 | Total reward = 50.77
2022-01-26 14:16:45.939 | DEBUG    | __main__:trials:24 - Trial = 4485/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.940 | DEBUG    | __main__:trials:29 - Trial = 4485/30000 | Total reward = 48.93
2022-01-26 14:16:45.943 | DEBUG    | __main__:trials:24 - Trial = 4486/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.944 | DEBUG    | __main__:trials:29 - Trial = 4486/30000 | Total reward = 49.67
2022-01-26 14:16:45.947 | DEBUG    | __main__:trials:24 - Trial = 4487/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.947 | DEBUG    | __main__:trials:29 - Trial = 4487/30000 | Total reward = 40.22
2022-01-26 14:16:45.950 | DEBUG    | __main__:trials:24 - Trial = 4488/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.951 | DEBUG    | __main__:trials:29 - Trial = 4488/30000 | Total reward = 38.11
2022-01-26 14:16:45.954 | DEBUG    | __main__:trials:26 - Trial = 4489/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:45.955 | DEBUG    | __main__:trials:29 - Trial = 4489/30000 | Total reward = 34.37
2022-01-26 14:16:45.959 | DEBUG    | __main__:trials:24 - Trial = 4490/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.960 | DEBUG    | __main__:trials:29 - Trial = 4490/30000 | Total reward = 45.34
2022-01-26 14:16:45.963 | DEBUG    | __main__:trials:24 - Trial = 4491/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.964 | DEBUG    | __main__:trials:29 - Trial = 4491/30000 | Total reward = 61.95
2022-01-26 14:16:45.967 | DEBUG    | __main__:trials:24 - Trial = 4492/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.968 | DEBUG    | __main__:trials:29 - Trial = 4492/30000 | Total reward = 50.72
2022-01-26 14:16:45.971 | DEBUG    | __main__:trials:24 - Trial = 4493/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.972 | DEBUG    | __main__:trials:29 - Trial = 4493/30000 | Total reward = 52.60
2022-01-26 14:16:45.975 | DEBUG    | __main__:trials:24 - Trial = 4494/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.975 | DEBUG    | __main__:trials:29 - Trial = 4494/30000 | Total reward = 52.21
2022-01-26 14:16:45.978 | DEBUG    | __main__:trials:24 - Trial = 4495/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.980 | DEBUG    | __main__:trials:29 - Trial = 4495/30000 | Total reward = 53.30
2022-01-26 14:16:45.983 | DEBUG    | __main__:trials:24 - Trial = 4496/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.984 | DEBUG    | __main__:trials:29 - Trial = 4496/30000 | Total reward = 32.49
2022-01-26 14:16:45.987 | DEBUG    | __main__:trials:24 - Trial = 4497/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.989 | DEBUG    | __main__:trials:29 - Trial = 4497/30000 | Total reward = 41.56
2022-01-26 14:16:45.992 | DEBUG    | __main__:trials:24 - Trial = 4498/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.994 | DEBUG    | __main__:trials:29 - Trial = 4498/30000 | Total reward = 43.84
2022-01-26 14:16:45.998 | DEBUG    | __main__:trials:24 - Trial = 4499/30000 | Max number of steps (20) reached
2022-01-26 14:16:45.999 | DEBUG    | __main__:trials:29 - Trial = 4499/30000 | Total reward = 51.41
2022-01-26 14:16:46.003 | DEBUG    | __main__:trials:24 - Trial = 4500/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.004 | DEBUG    | __main__:trials:29 - Trial = 4500/30000 | Total reward = 53.29
2022-01-26 14:16:46.007 | DEBUG    | __main__:trials:24 - Trial = 4501/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.008 | DEBUG    | __main__:trials:29 - Trial = 4501/30000 | Total reward = 47.88
2022-01-26 14:16:46.012 | DEBUG    | __main__:trials:24 - Trial = 4502/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.014 | DEBUG    | __main__:trials:29 - Trial = 4502/30000 | Total reward = 49.80
2022-01-26 14:16:46.018 | DEBUG    | __main__:trials:26 - Trial = 4503/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.019 | DEBUG    | __main__:trials:29 - Trial = 4503/30000 | Total reward = 40.08
2022-01-26 14:16:46.023 | DEBUG    | __main__:trials:24 - Trial = 4504/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.024 | DEBUG    | __main__:trials:29 - Trial = 4504/30000 | Total reward = 52.41
2022-01-26 14:16:46.027 | DEBUG    | __main__:trials:24 - Trial = 4505/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.029 | DEBUG    | __main__:trials:29 - Trial = 4505/30000 | Total reward = 42.20
2022-01-26 14:16:46.032 | DEBUG    | __main__:trials:26 - Trial = 4506/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.033 | DEBUG    | __main__:trials:29 - Trial = 4506/30000 | Total reward = 37.56
2022-01-26 14:16:46.037 | DEBUG    | __main__:trials:24 - Trial = 4507/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.039 | DEBUG    | __main__:trials:29 - Trial = 4507/30000 | Total reward = 60.01
2022-01-26 14:16:46.042 | DEBUG    | __main__:trials:24 - Trial = 4508/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.044 | DEBUG    | __main__:trials:29 - Trial = 4508/30000 | Total reward = 48.80
2022-01-26 14:16:46.047 | DEBUG    | __main__:trials:24 - Trial = 4509/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.048 | DEBUG    | __main__:trials:29 - Trial = 4509/30000 | Total reward = 43.32
2022-01-26 14:16:46.051 | DEBUG    | __main__:trials:24 - Trial = 4510/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.053 | DEBUG    | __main__:trials:29 - Trial = 4510/30000 | Total reward = 57.60
2022-01-26 14:16:46.056 | DEBUG    | __main__:trials:24 - Trial = 4511/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.058 | DEBUG    | __main__:trials:29 - Trial = 4511/30000 | Total reward = 43.20
2022-01-26 14:16:46.061 | DEBUG    | __main__:trials:24 - Trial = 4512/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.063 | DEBUG    | __main__:trials:29 - Trial = 4512/30000 | Total reward = 54.79
2022-01-26 14:16:46.066 | DEBUG    | __main__:trials:24 - Trial = 4513/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.068 | DEBUG    | __main__:trials:29 - Trial = 4513/30000 | Total reward = 49.43
2022-01-26 14:16:46.072 | DEBUG    | __main__:trials:24 - Trial = 4514/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.073 | DEBUG    | __main__:trials:29 - Trial = 4514/30000 | Total reward = 44.98
2022-01-26 14:16:46.077 | DEBUG    | __main__:trials:24 - Trial = 4515/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.078 | DEBUG    | __main__:trials:29 - Trial = 4515/30000 | Total reward = 62.15
2022-01-26 14:16:46.082 | DEBUG    | __main__:trials:24 - Trial = 4516/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.084 | DEBUG    | __main__:trials:29 - Trial = 4516/30000 | Total reward = 27.86
2022-01-26 14:16:46.088 | DEBUG    | __main__:trials:24 - Trial = 4517/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.089 | DEBUG    | __main__:trials:29 - Trial = 4517/30000 | Total reward = 49.23
2022-01-26 14:16:46.093 | DEBUG    | __main__:trials:24 - Trial = 4518/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.095 | DEBUG    | __main__:trials:29 - Trial = 4518/30000 | Total reward = 63.95
2022-01-26 14:16:46.098 | DEBUG    | __main__:trials:24 - Trial = 4519/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.099 | DEBUG    | __main__:trials:29 - Trial = 4519/30000 | Total reward = 51.41
2022-01-26 14:16:46.103 | DEBUG    | __main__:trials:24 - Trial = 4520/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.104 | DEBUG    | __main__:trials:29 - Trial = 4520/30000 | Total reward = 48.71
2022-01-26 14:16:46.108 | DEBUG    | __main__:trials:24 - Trial = 4521/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.109 | DEBUG    | __main__:trials:29 - Trial = 4521/30000 | Total reward = 45.67
2022-01-26 14:16:46.113 | DEBUG    | __main__:trials:24 - Trial = 4522/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.114 | DEBUG    | __main__:trials:29 - Trial = 4522/30000 | Total reward = 41.03
2022-01-26 14:16:46.118 | DEBUG    | __main__:trials:26 - Trial = 4523/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.119 | DEBUG    | __main__:trials:29 - Trial = 4523/30000 | Total reward = 8.58
2022-01-26 14:16:46.123 | DEBUG    | __main__:trials:24 - Trial = 4524/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.124 | DEBUG    | __main__:trials:29 - Trial = 4524/30000 | Total reward = 49.87
2022-01-26 14:16:46.128 | DEBUG    | __main__:trials:24 - Trial = 4525/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.129 | DEBUG    | __main__:trials:29 - Trial = 4525/30000 | Total reward = 43.54
2022-01-26 14:16:46.132 | DEBUG    | __main__:trials:24 - Trial = 4526/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.133 | DEBUG    | __main__:trials:29 - Trial = 4526/30000 | Total reward = 39.46
2022-01-26 14:16:46.137 | DEBUG    | __main__:trials:24 - Trial = 4527/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.137 | DEBUG    | __main__:trials:29 - Trial = 4527/30000 | Total reward = 44.88
2022-01-26 14:16:46.141 | DEBUG    | __main__:trials:26 - Trial = 4528/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.143 | DEBUG    | __main__:trials:29 - Trial = 4528/30000 | Total reward = 22.85
2022-01-26 14:16:46.147 | DEBUG    | __main__:trials:24 - Trial = 4529/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.147 | DEBUG    | __main__:trials:29 - Trial = 4529/30000 | Total reward = 48.54
2022-01-26 14:16:46.152 | DEBUG    | __main__:trials:24 - Trial = 4530/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.154 | DEBUG    | __main__:trials:29 - Trial = 4530/30000 | Total reward = 35.56
2022-01-26 14:16:46.157 | DEBUG    | __main__:trials:24 - Trial = 4531/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.158 | DEBUG    | __main__:trials:29 - Trial = 4531/30000 | Total reward = 48.47
2022-01-26 14:16:46.162 | DEBUG    | __main__:trials:24 - Trial = 4532/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.164 | DEBUG    | __main__:trials:29 - Trial = 4532/30000 | Total reward = 52.54
2022-01-26 14:16:46.167 | DEBUG    | __main__:trials:24 - Trial = 4533/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.168 | DEBUG    | __main__:trials:29 - Trial = 4533/30000 | Total reward = 49.55
2022-01-26 14:16:46.172 | DEBUG    | __main__:trials:24 - Trial = 4534/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.173 | DEBUG    | __main__:trials:29 - Trial = 4534/30000 | Total reward = 49.67
2022-01-26 14:16:46.178 | DEBUG    | __main__:trials:24 - Trial = 4535/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.179 | DEBUG    | __main__:trials:29 - Trial = 4535/30000 | Total reward = 36.35
2022-01-26 14:16:46.183 | DEBUG    | __main__:trials:24 - Trial = 4536/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.184 | DEBUG    | __main__:trials:29 - Trial = 4536/30000 | Total reward = 50.32
2022-01-26 14:16:46.188 | DEBUG    | __main__:trials:24 - Trial = 4537/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.190 | DEBUG    | __main__:trials:29 - Trial = 4537/30000 | Total reward = 51.91
2022-01-26 14:16:46.193 | DEBUG    | __main__:trials:24 - Trial = 4538/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.194 | DEBUG    | __main__:trials:29 - Trial = 4538/30000 | Total reward = 49.67
2022-01-26 14:16:46.198 | DEBUG    | __main__:trials:24 - Trial = 4539/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.200 | DEBUG    | __main__:trials:29 - Trial = 4539/30000 | Total reward = 35.87
2022-01-26 14:16:46.203 | DEBUG    | __main__:trials:24 - Trial = 4540/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.205 | DEBUG    | __main__:trials:29 - Trial = 4540/30000 | Total reward = 49.27
2022-01-26 14:16:46.208 | DEBUG    | __main__:trials:24 - Trial = 4541/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.209 | DEBUG    | __main__:trials:29 - Trial = 4541/30000 | Total reward = 47.56
2022-01-26 14:16:46.212 | DEBUG    | __main__:trials:24 - Trial = 4542/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.214 | DEBUG    | __main__:trials:29 - Trial = 4542/30000 | Total reward = 49.67
2022-01-26 14:16:46.217 | DEBUG    | __main__:trials:24 - Trial = 4543/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.219 | DEBUG    | __main__:trials:29 - Trial = 4543/30000 | Total reward = 44.35
2022-01-26 14:16:46.222 | DEBUG    | __main__:trials:24 - Trial = 4544/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.224 | DEBUG    | __main__:trials:29 - Trial = 4544/30000 | Total reward = 46.67
2022-01-26 14:16:46.226 | DEBUG    | __main__:trials:24 - Trial = 4545/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.228 | DEBUG    | __main__:trials:29 - Trial = 4545/30000 | Total reward = 49.50
2022-01-26 14:16:46.231 | DEBUG    | __main__:trials:24 - Trial = 4546/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.233 | DEBUG    | __main__:trials:29 - Trial = 4546/30000 | Total reward = 42.56
2022-01-26 14:16:46.236 | DEBUG    | __main__:trials:24 - Trial = 4547/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.238 | DEBUG    | __main__:trials:29 - Trial = 4547/30000 | Total reward = 52.36
2022-01-26 14:16:46.242 | DEBUG    | __main__:trials:24 - Trial = 4548/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.243 | DEBUG    | __main__:trials:29 - Trial = 4548/30000 | Total reward = 28.91
2022-01-26 14:16:46.247 | DEBUG    | __main__:trials:24 - Trial = 4549/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.248 | DEBUG    | __main__:trials:29 - Trial = 4549/30000 | Total reward = 29.65
2022-01-26 14:16:46.252 | DEBUG    | __main__:trials:24 - Trial = 4550/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.254 | DEBUG    | __main__:trials:29 - Trial = 4550/30000 | Total reward = 56.46
2022-01-26 14:16:46.257 | DEBUG    | __main__:trials:24 - Trial = 4551/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.258 | DEBUG    | __main__:trials:29 - Trial = 4551/30000 | Total reward = 50.72
2022-01-26 14:16:46.263 | DEBUG    | __main__:trials:24 - Trial = 4552/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.264 | DEBUG    | __main__:trials:29 - Trial = 4552/30000 | Total reward = 46.52
2022-01-26 14:16:46.268 | DEBUG    | __main__:trials:24 - Trial = 4553/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.268 | DEBUG    | __main__:trials:29 - Trial = 4553/30000 | Total reward = 47.04
2022-01-26 14:16:46.272 | DEBUG    | __main__:trials:24 - Trial = 4554/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.274 | DEBUG    | __main__:trials:29 - Trial = 4554/30000 | Total reward = 48.22
2022-01-26 14:16:46.277 | DEBUG    | __main__:trials:24 - Trial = 4555/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.278 | DEBUG    | __main__:trials:29 - Trial = 4555/30000 | Total reward = 39.30
2022-01-26 14:16:46.282 | DEBUG    | __main__:trials:24 - Trial = 4556/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.284 | DEBUG    | __main__:trials:29 - Trial = 4556/30000 | Total reward = 27.11
2022-01-26 14:16:46.288 | DEBUG    | __main__:trials:24 - Trial = 4557/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.288 | DEBUG    | __main__:trials:29 - Trial = 4557/30000 | Total reward = 65.04
2022-01-26 14:16:46.291 | DEBUG    | __main__:trials:26 - Trial = 4558/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.292 | DEBUG    | __main__:trials:29 - Trial = 4558/30000 | Total reward = 18.50
2022-01-26 14:16:46.295 | DEBUG    | __main__:trials:24 - Trial = 4559/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.297 | DEBUG    | __main__:trials:29 - Trial = 4559/30000 | Total reward = 53.98
2022-01-26 14:16:46.301 | DEBUG    | __main__:trials:24 - Trial = 4560/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.302 | DEBUG    | __main__:trials:29 - Trial = 4560/30000 | Total reward = 47.35
2022-01-26 14:16:46.306 | DEBUG    | __main__:trials:24 - Trial = 4561/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.307 | DEBUG    | __main__:trials:29 - Trial = 4561/30000 | Total reward = 33.77
2022-01-26 14:16:46.311 | DEBUG    | __main__:trials:24 - Trial = 4562/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.312 | DEBUG    | __main__:trials:29 - Trial = 4562/30000 | Total reward = 45.31
2022-01-26 14:16:46.316 | DEBUG    | __main__:trials:24 - Trial = 4563/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.317 | DEBUG    | __main__:trials:29 - Trial = 4563/30000 | Total reward = 56.03
2022-01-26 14:16:46.321 | DEBUG    | __main__:trials:24 - Trial = 4564/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.322 | DEBUG    | __main__:trials:29 - Trial = 4564/30000 | Total reward = 59.47
2022-01-26 14:16:46.326 | DEBUG    | __main__:trials:24 - Trial = 4565/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.328 | DEBUG    | __main__:trials:29 - Trial = 4565/30000 | Total reward = 56.10
2022-01-26 14:16:46.331 | DEBUG    | __main__:trials:24 - Trial = 4566/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.333 | DEBUG    | __main__:trials:29 - Trial = 4566/30000 | Total reward = 38.59
2022-01-26 14:16:46.336 | DEBUG    | __main__:trials:24 - Trial = 4567/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.337 | DEBUG    | __main__:trials:29 - Trial = 4567/30000 | Total reward = 28.74
2022-01-26 14:16:46.342 | DEBUG    | __main__:trials:24 - Trial = 4568/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.343 | DEBUG    | __main__:trials:29 - Trial = 4568/30000 | Total reward = 57.90
2022-01-26 14:16:46.346 | DEBUG    | __main__:trials:24 - Trial = 4569/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.348 | DEBUG    | __main__:trials:29 - Trial = 4569/30000 | Total reward = 53.67
2022-01-26 14:16:46.352 | DEBUG    | __main__:trials:24 - Trial = 4570/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.352 | DEBUG    | __main__:trials:29 - Trial = 4570/30000 | Total reward = 44.33
2022-01-26 14:16:46.357 | DEBUG    | __main__:trials:24 - Trial = 4571/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.358 | DEBUG    | __main__:trials:29 - Trial = 4571/30000 | Total reward = 43.84
2022-01-26 14:16:46.362 | DEBUG    | __main__:trials:24 - Trial = 4572/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.363 | DEBUG    | __main__:trials:29 - Trial = 4572/30000 | Total reward = 46.70
2022-01-26 14:16:46.367 | DEBUG    | __main__:trials:24 - Trial = 4573/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.368 | DEBUG    | __main__:trials:29 - Trial = 4573/30000 | Total reward = 52.70
2022-01-26 14:16:46.372 | DEBUG    | __main__:trials:24 - Trial = 4574/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.373 | DEBUG    | __main__:trials:29 - Trial = 4574/30000 | Total reward = 30.01
2022-01-26 14:16:46.376 | DEBUG    | __main__:trials:24 - Trial = 4575/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.378 | DEBUG    | __main__:trials:29 - Trial = 4575/30000 | Total reward = 36.42
2022-01-26 14:16:46.382 | DEBUG    | __main__:trials:24 - Trial = 4576/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.383 | DEBUG    | __main__:trials:29 - Trial = 4576/30000 | Total reward = 24.85
2022-01-26 14:16:46.387 | DEBUG    | __main__:trials:24 - Trial = 4577/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.389 | DEBUG    | __main__:trials:29 - Trial = 4577/30000 | Total reward = 31.59
2022-01-26 14:16:46.393 | DEBUG    | __main__:trials:24 - Trial = 4578/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.394 | DEBUG    | __main__:trials:29 - Trial = 4578/30000 | Total reward = 46.46
2022-01-26 14:16:46.398 | DEBUG    | __main__:trials:24 - Trial = 4579/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.399 | DEBUG    | __main__:trials:29 - Trial = 4579/30000 | Total reward = 30.79
2022-01-26 14:16:46.402 | DEBUG    | __main__:trials:24 - Trial = 4580/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.404 | DEBUG    | __main__:trials:29 - Trial = 4580/30000 | Total reward = 43.48
2022-01-26 14:16:46.408 | DEBUG    | __main__:trials:24 - Trial = 4581/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.409 | DEBUG    | __main__:trials:29 - Trial = 4581/30000 | Total reward = 48.25
2022-01-26 14:16:46.411 | DEBUG    | __main__:trials:26 - Trial = 4582/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.413 | DEBUG    | __main__:trials:29 - Trial = 4582/30000 | Total reward = 11.92
2022-01-26 14:16:46.417 | DEBUG    | __main__:trials:24 - Trial = 4583/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.418 | DEBUG    | __main__:trials:29 - Trial = 4583/30000 | Total reward = 42.17
2022-01-26 14:16:46.421 | DEBUG    | __main__:trials:24 - Trial = 4584/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.423 | DEBUG    | __main__:trials:29 - Trial = 4584/30000 | Total reward = 51.83
2022-01-26 14:16:46.427 | DEBUG    | __main__:trials:24 - Trial = 4585/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.428 | DEBUG    | __main__:trials:29 - Trial = 4585/30000 | Total reward = 44.49
2022-01-26 14:16:46.432 | DEBUG    | __main__:trials:24 - Trial = 4586/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.433 | DEBUG    | __main__:trials:29 - Trial = 4586/30000 | Total reward = 46.30
2022-01-26 14:16:46.437 | DEBUG    | __main__:trials:24 - Trial = 4587/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.439 | DEBUG    | __main__:trials:29 - Trial = 4587/30000 | Total reward = 57.85
2022-01-26 14:16:46.442 | DEBUG    | __main__:trials:24 - Trial = 4588/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.443 | DEBUG    | __main__:trials:29 - Trial = 4588/30000 | Total reward = 38.81
2022-01-26 14:16:46.447 | DEBUG    | __main__:trials:24 - Trial = 4589/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.448 | DEBUG    | __main__:trials:29 - Trial = 4589/30000 | Total reward = 44.34
2022-01-26 14:16:46.453 | DEBUG    | __main__:trials:24 - Trial = 4590/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.453 | DEBUG    | __main__:trials:29 - Trial = 4590/30000 | Total reward = 49.93
2022-01-26 14:16:46.456 | DEBUG    | __main__:trials:24 - Trial = 4591/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.458 | DEBUG    | __main__:trials:29 - Trial = 4591/30000 | Total reward = 53.49
2022-01-26 14:16:46.461 | DEBUG    | __main__:trials:24 - Trial = 4592/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.461 | DEBUG    | __main__:trials:29 - Trial = 4592/30000 | Total reward = 40.69
2022-01-26 14:16:46.465 | DEBUG    | __main__:trials:24 - Trial = 4593/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.465 | DEBUG    | __main__:trials:29 - Trial = 4593/30000 | Total reward = 29.59
2022-01-26 14:16:46.470 | DEBUG    | __main__:trials:24 - Trial = 4594/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.471 | DEBUG    | __main__:trials:29 - Trial = 4594/30000 | Total reward = 28.80
2022-01-26 14:16:46.475 | DEBUG    | __main__:trials:24 - Trial = 4595/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.477 | DEBUG    | __main__:trials:29 - Trial = 4595/30000 | Total reward = 47.97
2022-01-26 14:16:46.480 | DEBUG    | __main__:trials:24 - Trial = 4596/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.482 | DEBUG    | __main__:trials:29 - Trial = 4596/30000 | Total reward = 51.04
2022-01-26 14:16:46.485 | DEBUG    | __main__:trials:24 - Trial = 4597/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.486 | DEBUG    | __main__:trials:29 - Trial = 4597/30000 | Total reward = 42.98
2022-01-26 14:16:46.490 | DEBUG    | __main__:trials:24 - Trial = 4598/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.492 | DEBUG    | __main__:trials:29 - Trial = 4598/30000 | Total reward = 48.38
2022-01-26 14:16:46.495 | DEBUG    | __main__:trials:24 - Trial = 4599/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.497 | DEBUG    | __main__:trials:29 - Trial = 4599/30000 | Total reward = 43.96
2022-01-26 14:16:46.499 | DEBUG    | __main__:trials:26 - Trial = 4600/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.501 | DEBUG    | __main__:trials:29 - Trial = 4600/30000 | Total reward = 17.85
2022-01-26 14:16:46.505 | DEBUG    | __main__:trials:24 - Trial = 4601/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.506 | DEBUG    | __main__:trials:29 - Trial = 4601/30000 | Total reward = 49.48
2022-01-26 14:16:46.509 | DEBUG    | __main__:trials:24 - Trial = 4602/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.510 | DEBUG    | __main__:trials:29 - Trial = 4602/30000 | Total reward = 46.97
2022-01-26 14:16:46.513 | DEBUG    | __main__:trials:24 - Trial = 4603/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.515 | DEBUG    | __main__:trials:29 - Trial = 4603/30000 | Total reward = 50.61
2022-01-26 14:16:46.519 | DEBUG    | __main__:trials:24 - Trial = 4604/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.519 | DEBUG    | __main__:trials:29 - Trial = 4604/30000 | Total reward = 27.18
2022-01-26 14:16:46.523 | DEBUG    | __main__:trials:26 - Trial = 4605/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.525 | DEBUG    | __main__:trials:29 - Trial = 4605/30000 | Total reward = 28.45
2022-01-26 14:16:46.528 | DEBUG    | __main__:trials:24 - Trial = 4606/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.529 | DEBUG    | __main__:trials:29 - Trial = 4606/30000 | Total reward = 44.45
2022-01-26 14:16:46.532 | DEBUG    | __main__:trials:26 - Trial = 4607/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.532 | DEBUG    | __main__:trials:29 - Trial = 4607/30000 | Total reward = 17.85
2022-01-26 14:16:46.536 | DEBUG    | __main__:trials:24 - Trial = 4608/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.536 | DEBUG    | __main__:trials:29 - Trial = 4608/30000 | Total reward = 42.12
2022-01-26 14:16:46.540 | DEBUG    | __main__:trials:24 - Trial = 4609/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.540 | DEBUG    | __main__:trials:29 - Trial = 4609/30000 | Total reward = 50.79
2022-01-26 14:16:46.544 | DEBUG    | __main__:trials:24 - Trial = 4610/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.545 | DEBUG    | __main__:trials:29 - Trial = 4610/30000 | Total reward = 43.15
2022-01-26 14:16:46.548 | DEBUG    | __main__:trials:24 - Trial = 4611/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.550 | DEBUG    | __main__:trials:29 - Trial = 4611/30000 | Total reward = 40.88
2022-01-26 14:16:46.554 | DEBUG    | __main__:trials:24 - Trial = 4612/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.554 | DEBUG    | __main__:trials:29 - Trial = 4612/30000 | Total reward = 48.77
2022-01-26 14:16:46.559 | DEBUG    | __main__:trials:24 - Trial = 4613/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.560 | DEBUG    | __main__:trials:29 - Trial = 4613/30000 | Total reward = 49.55
2022-01-26 14:16:46.564 | DEBUG    | __main__:trials:24 - Trial = 4614/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.566 | DEBUG    | __main__:trials:29 - Trial = 4614/30000 | Total reward = 36.28
2022-01-26 14:16:46.570 | DEBUG    | __main__:trials:24 - Trial = 4615/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.571 | DEBUG    | __main__:trials:29 - Trial = 4615/30000 | Total reward = 60.47
2022-01-26 14:16:46.574 | DEBUG    | __main__:trials:24 - Trial = 4616/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.576 | DEBUG    | __main__:trials:29 - Trial = 4616/30000 | Total reward = 53.21
2022-01-26 14:16:46.580 | DEBUG    | __main__:trials:24 - Trial = 4617/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.581 | DEBUG    | __main__:trials:29 - Trial = 4617/30000 | Total reward = 46.83
2022-01-26 14:16:46.585 | DEBUG    | __main__:trials:24 - Trial = 4618/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.587 | DEBUG    | __main__:trials:29 - Trial = 4618/30000 | Total reward = 46.87
2022-01-26 14:16:46.590 | DEBUG    | __main__:trials:24 - Trial = 4619/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.591 | DEBUG    | __main__:trials:29 - Trial = 4619/30000 | Total reward = 34.04
2022-01-26 14:16:46.596 | DEBUG    | __main__:trials:24 - Trial = 4620/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.596 | DEBUG    | __main__:trials:29 - Trial = 4620/30000 | Total reward = 42.61
2022-01-26 14:16:46.600 | DEBUG    | __main__:trials:24 - Trial = 4621/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.601 | DEBUG    | __main__:trials:29 - Trial = 4621/30000 | Total reward = 52.16
2022-01-26 14:16:46.604 | DEBUG    | __main__:trials:24 - Trial = 4622/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.605 | DEBUG    | __main__:trials:29 - Trial = 4622/30000 | Total reward = 48.25
2022-01-26 14:16:46.609 | DEBUG    | __main__:trials:24 - Trial = 4623/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.610 | DEBUG    | __main__:trials:29 - Trial = 4623/30000 | Total reward = 41.71
2022-01-26 14:16:46.613 | DEBUG    | __main__:trials:24 - Trial = 4624/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.615 | DEBUG    | __main__:trials:29 - Trial = 4624/30000 | Total reward = 39.71
2022-01-26 14:16:46.618 | DEBUG    | __main__:trials:24 - Trial = 4625/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.620 | DEBUG    | __main__:trials:29 - Trial = 4625/30000 | Total reward = 43.30
2022-01-26 14:16:46.624 | DEBUG    | __main__:trials:24 - Trial = 4626/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.625 | DEBUG    | __main__:trials:29 - Trial = 4626/30000 | Total reward = 47.24
2022-01-26 14:16:46.628 | DEBUG    | __main__:trials:26 - Trial = 4627/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.630 | DEBUG    | __main__:trials:29 - Trial = 4627/30000 | Total reward = 13.78
2022-01-26 14:16:46.633 | DEBUG    | __main__:trials:24 - Trial = 4628/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.635 | DEBUG    | __main__:trials:29 - Trial = 4628/30000 | Total reward = 53.23
2022-01-26 14:16:46.638 | DEBUG    | __main__:trials:24 - Trial = 4629/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.640 | DEBUG    | __main__:trials:29 - Trial = 4629/30000 | Total reward = 52.20
2022-01-26 14:16:46.643 | DEBUG    | __main__:trials:24 - Trial = 4630/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.644 | DEBUG    | __main__:trials:29 - Trial = 4630/30000 | Total reward = 46.30
2022-01-26 14:16:46.647 | DEBUG    | __main__:trials:24 - Trial = 4631/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.649 | DEBUG    | __main__:trials:29 - Trial = 4631/30000 | Total reward = 46.26
2022-01-26 14:16:46.652 | DEBUG    | __main__:trials:24 - Trial = 4632/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.654 | DEBUG    | __main__:trials:29 - Trial = 4632/30000 | Total reward = 46.58
2022-01-26 14:16:46.658 | DEBUG    | __main__:trials:24 - Trial = 4633/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.659 | DEBUG    | __main__:trials:29 - Trial = 4633/30000 | Total reward = 52.67
2022-01-26 14:16:46.663 | DEBUG    | __main__:trials:24 - Trial = 4634/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.665 | DEBUG    | __main__:trials:29 - Trial = 4634/30000 | Total reward = 27.51
2022-01-26 14:16:46.668 | DEBUG    | __main__:trials:24 - Trial = 4635/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.670 | DEBUG    | __main__:trials:29 - Trial = 4635/30000 | Total reward = 50.42
2022-01-26 14:16:46.674 | DEBUG    | __main__:trials:24 - Trial = 4636/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.676 | DEBUG    | __main__:trials:29 - Trial = 4636/30000 | Total reward = 53.45
2022-01-26 14:16:46.679 | DEBUG    | __main__:trials:24 - Trial = 4637/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.681 | DEBUG    | __main__:trials:29 - Trial = 4637/30000 | Total reward = 46.70
2022-01-26 14:16:46.684 | DEBUG    | __main__:trials:24 - Trial = 4638/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.686 | DEBUG    | __main__:trials:29 - Trial = 4638/30000 | Total reward = 43.83
2022-01-26 14:16:46.689 | DEBUG    | __main__:trials:24 - Trial = 4639/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.690 | DEBUG    | __main__:trials:29 - Trial = 4639/30000 | Total reward = 44.29
2022-01-26 14:16:46.694 | DEBUG    | __main__:trials:24 - Trial = 4640/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.695 | DEBUG    | __main__:trials:29 - Trial = 4640/30000 | Total reward = 48.77
2022-01-26 14:16:46.699 | DEBUG    | __main__:trials:24 - Trial = 4641/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.700 | DEBUG    | __main__:trials:29 - Trial = 4641/30000 | Total reward = 24.09
2022-01-26 14:16:46.704 | DEBUG    | __main__:trials:24 - Trial = 4642/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.705 | DEBUG    | __main__:trials:29 - Trial = 4642/30000 | Total reward = 47.14
2022-01-26 14:16:46.709 | DEBUG    | __main__:trials:24 - Trial = 4643/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.710 | DEBUG    | __main__:trials:29 - Trial = 4643/30000 | Total reward = 45.81
2022-01-26 14:16:46.714 | DEBUG    | __main__:trials:24 - Trial = 4644/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.716 | DEBUG    | __main__:trials:29 - Trial = 4644/30000 | Total reward = 45.84
2022-01-26 14:16:46.719 | DEBUG    | __main__:trials:24 - Trial = 4645/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.720 | DEBUG    | __main__:trials:29 - Trial = 4645/30000 | Total reward = 52.65
2022-01-26 14:16:46.724 | DEBUG    | __main__:trials:24 - Trial = 4646/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.726 | DEBUG    | __main__:trials:29 - Trial = 4646/30000 | Total reward = 41.51
2022-01-26 14:16:46.730 | DEBUG    | __main__:trials:24 - Trial = 4647/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.732 | DEBUG    | __main__:trials:29 - Trial = 4647/30000 | Total reward = 57.52
2022-01-26 14:16:46.734 | DEBUG    | __main__:trials:24 - Trial = 4648/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.736 | DEBUG    | __main__:trials:29 - Trial = 4648/30000 | Total reward = 48.05
2022-01-26 14:16:46.739 | DEBUG    | __main__:trials:24 - Trial = 4649/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.741 | DEBUG    | __main__:trials:29 - Trial = 4649/30000 | Total reward = 49.50
2022-01-26 14:16:46.744 | DEBUG    | __main__:trials:24 - Trial = 4650/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.746 | DEBUG    | __main__:trials:29 - Trial = 4650/30000 | Total reward = 49.53
2022-01-26 14:16:46.750 | DEBUG    | __main__:trials:24 - Trial = 4651/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.751 | DEBUG    | __main__:trials:29 - Trial = 4651/30000 | Total reward = 50.72
2022-01-26 14:16:46.755 | DEBUG    | __main__:trials:24 - Trial = 4652/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.757 | DEBUG    | __main__:trials:29 - Trial = 4652/30000 | Total reward = 32.33
2022-01-26 14:16:46.759 | DEBUG    | __main__:trials:24 - Trial = 4653/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.760 | DEBUG    | __main__:trials:29 - Trial = 4653/30000 | Total reward = 47.88
2022-01-26 14:16:46.764 | DEBUG    | __main__:trials:24 - Trial = 4654/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.765 | DEBUG    | __main__:trials:29 - Trial = 4654/30000 | Total reward = 43.51
2022-01-26 14:16:46.769 | DEBUG    | __main__:trials:24 - Trial = 4655/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.770 | DEBUG    | __main__:trials:29 - Trial = 4655/30000 | Total reward = 23.35
2022-01-26 14:16:46.774 | DEBUG    | __main__:trials:26 - Trial = 4656/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.774 | DEBUG    | __main__:trials:29 - Trial = 4656/30000 | Total reward = 26.86
2022-01-26 14:16:46.779 | DEBUG    | __main__:trials:24 - Trial = 4657/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.779 | DEBUG    | __main__:trials:29 - Trial = 4657/30000 | Total reward = 35.36
2022-01-26 14:16:46.784 | DEBUG    | __main__:trials:24 - Trial = 4658/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.786 | DEBUG    | __main__:trials:29 - Trial = 4658/30000 | Total reward = 33.23
2022-01-26 14:16:46.790 | DEBUG    | __main__:trials:24 - Trial = 4659/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.791 | DEBUG    | __main__:trials:29 - Trial = 4659/30000 | Total reward = 49.09
2022-01-26 14:16:46.794 | DEBUG    | __main__:trials:24 - Trial = 4660/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.797 | DEBUG    | __main__:trials:29 - Trial = 4660/30000 | Total reward = 57.07
2022-01-26 14:16:46.800 | DEBUG    | __main__:trials:24 - Trial = 4661/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.802 | DEBUG    | __main__:trials:29 - Trial = 4661/30000 | Total reward = 49.62
2022-01-26 14:16:46.805 | DEBUG    | __main__:trials:24 - Trial = 4662/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.807 | DEBUG    | __main__:trials:29 - Trial = 4662/30000 | Total reward = 44.03
2022-01-26 14:16:46.811 | DEBUG    | __main__:trials:24 - Trial = 4663/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.812 | DEBUG    | __main__:trials:29 - Trial = 4663/30000 | Total reward = 35.55
2022-01-26 14:16:46.816 | DEBUG    | __main__:trials:24 - Trial = 4664/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.818 | DEBUG    | __main__:trials:29 - Trial = 4664/30000 | Total reward = 42.96
2022-01-26 14:16:46.821 | DEBUG    | __main__:trials:26 - Trial = 4665/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.822 | DEBUG    | __main__:trials:29 - Trial = 4665/30000 | Total reward = 17.85
2022-01-26 14:16:46.825 | DEBUG    | __main__:trials:24 - Trial = 4666/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.826 | DEBUG    | __main__:trials:29 - Trial = 4666/30000 | Total reward = 46.98
2022-01-26 14:16:46.829 | DEBUG    | __main__:trials:24 - Trial = 4667/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.831 | DEBUG    | __main__:trials:29 - Trial = 4667/30000 | Total reward = 48.07
2022-01-26 14:16:46.834 | DEBUG    | __main__:trials:24 - Trial = 4668/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.836 | DEBUG    | __main__:trials:29 - Trial = 4668/30000 | Total reward = 52.94
2022-01-26 14:16:46.839 | DEBUG    | __main__:trials:24 - Trial = 4669/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.841 | DEBUG    | __main__:trials:29 - Trial = 4669/30000 | Total reward = 40.81
2022-01-26 14:16:46.844 | DEBUG    | __main__:trials:24 - Trial = 4670/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.846 | DEBUG    | __main__:trials:29 - Trial = 4670/30000 | Total reward = 48.30
2022-01-26 14:16:46.850 | DEBUG    | __main__:trials:24 - Trial = 4671/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.851 | DEBUG    | __main__:trials:29 - Trial = 4671/30000 | Total reward = 44.30
2022-01-26 14:16:46.854 | DEBUG    | __main__:trials:24 - Trial = 4672/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.857 | DEBUG    | __main__:trials:29 - Trial = 4672/30000 | Total reward = 47.03
2022-01-26 14:16:46.860 | DEBUG    | __main__:trials:24 - Trial = 4673/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.862 | DEBUG    | __main__:trials:29 - Trial = 4673/30000 | Total reward = 54.59
2022-01-26 14:16:46.866 | DEBUG    | __main__:trials:24 - Trial = 4674/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.867 | DEBUG    | __main__:trials:29 - Trial = 4674/30000 | Total reward = 46.53
2022-01-26 14:16:46.871 | DEBUG    | __main__:trials:24 - Trial = 4675/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.873 | DEBUG    | __main__:trials:29 - Trial = 4675/30000 | Total reward = 57.10
2022-01-26 14:16:46.876 | DEBUG    | __main__:trials:24 - Trial = 4676/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.878 | DEBUG    | __main__:trials:29 - Trial = 4676/30000 | Total reward = 28.57
2022-01-26 14:16:46.881 | DEBUG    | __main__:trials:24 - Trial = 4677/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.882 | DEBUG    | __main__:trials:29 - Trial = 4677/30000 | Total reward = 43.26
2022-01-26 14:16:46.886 | DEBUG    | __main__:trials:24 - Trial = 4678/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.888 | DEBUG    | __main__:trials:29 - Trial = 4678/30000 | Total reward = 54.04
2022-01-26 14:16:46.892 | DEBUG    | __main__:trials:24 - Trial = 4679/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.893 | DEBUG    | __main__:trials:29 - Trial = 4679/30000 | Total reward = 43.44
2022-01-26 14:16:46.897 | DEBUG    | __main__:trials:24 - Trial = 4680/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.898 | DEBUG    | __main__:trials:29 - Trial = 4680/30000 | Total reward = 49.26
2022-01-26 14:16:46.902 | DEBUG    | __main__:trials:24 - Trial = 4681/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.904 | DEBUG    | __main__:trials:29 - Trial = 4681/30000 | Total reward = 38.92
2022-01-26 14:16:46.907 | DEBUG    | __main__:trials:26 - Trial = 4682/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.908 | DEBUG    | __main__:trials:29 - Trial = 4682/30000 | Total reward = 18.85
2022-01-26 14:16:46.912 | DEBUG    | __main__:trials:24 - Trial = 4683/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.913 | DEBUG    | __main__:trials:29 - Trial = 4683/30000 | Total reward = 46.66
2022-01-26 14:16:46.916 | DEBUG    | __main__:trials:24 - Trial = 4684/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.918 | DEBUG    | __main__:trials:29 - Trial = 4684/30000 | Total reward = 44.01
2022-01-26 14:16:46.920 | DEBUG    | __main__:trials:26 - Trial = 4685/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.922 | DEBUG    | __main__:trials:29 - Trial = 4685/30000 | Total reward = 21.28
2022-01-26 14:16:46.926 | DEBUG    | __main__:trials:24 - Trial = 4686/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.927 | DEBUG    | __main__:trials:29 - Trial = 4686/30000 | Total reward = 51.74
2022-01-26 14:16:46.930 | DEBUG    | __main__:trials:26 - Trial = 4687/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.932 | DEBUG    | __main__:trials:29 - Trial = 4687/30000 | Total reward = 19.33
2022-01-26 14:16:46.935 | DEBUG    | __main__:trials:26 - Trial = 4688/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:46.937 | DEBUG    | __main__:trials:29 - Trial = 4688/30000 | Total reward = 34.46
2022-01-26 14:16:46.940 | DEBUG    | __main__:trials:24 - Trial = 4689/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.942 | DEBUG    | __main__:trials:29 - Trial = 4689/30000 | Total reward = 47.49
2022-01-26 14:16:46.946 | DEBUG    | __main__:trials:24 - Trial = 4690/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.947 | DEBUG    | __main__:trials:29 - Trial = 4690/30000 | Total reward = 47.93
2022-01-26 14:16:46.951 | DEBUG    | __main__:trials:24 - Trial = 4691/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.953 | DEBUG    | __main__:trials:29 - Trial = 4691/30000 | Total reward = 45.89
2022-01-26 14:16:46.956 | DEBUG    | __main__:trials:24 - Trial = 4692/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.958 | DEBUG    | __main__:trials:29 - Trial = 4692/30000 | Total reward = 61.69
2022-01-26 14:16:46.962 | DEBUG    | __main__:trials:24 - Trial = 4693/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.963 | DEBUG    | __main__:trials:29 - Trial = 4693/30000 | Total reward = 39.86
2022-01-26 14:16:46.966 | DEBUG    | __main__:trials:24 - Trial = 4694/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.968 | DEBUG    | __main__:trials:29 - Trial = 4694/30000 | Total reward = 40.85
2022-01-26 14:16:46.971 | DEBUG    | __main__:trials:24 - Trial = 4695/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.973 | DEBUG    | __main__:trials:29 - Trial = 4695/30000 | Total reward = 31.99
2022-01-26 14:16:46.977 | DEBUG    | __main__:trials:24 - Trial = 4696/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.979 | DEBUG    | __main__:trials:29 - Trial = 4696/30000 | Total reward = 55.60
2022-01-26 14:16:46.983 | DEBUG    | __main__:trials:24 - Trial = 4697/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.984 | DEBUG    | __main__:trials:29 - Trial = 4697/30000 | Total reward = 49.09
2022-01-26 14:16:46.988 | DEBUG    | __main__:trials:24 - Trial = 4698/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.990 | DEBUG    | __main__:trials:29 - Trial = 4698/30000 | Total reward = 42.93
2022-01-26 14:16:46.993 | DEBUG    | __main__:trials:24 - Trial = 4699/30000 | Max number of steps (20) reached
2022-01-26 14:16:46.995 | DEBUG    | __main__:trials:29 - Trial = 4699/30000 | Total reward = 45.19
2022-01-26 14:16:46.999 | DEBUG    | __main__:trials:24 - Trial = 4700/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.000 | DEBUG    | __main__:trials:29 - Trial = 4700/30000 | Total reward = 50.25
2022-01-26 14:16:47.004 | DEBUG    | __main__:trials:24 - Trial = 4701/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.005 | DEBUG    | __main__:trials:29 - Trial = 4701/30000 | Total reward = 47.69
2022-01-26 14:16:47.009 | DEBUG    | __main__:trials:24 - Trial = 4702/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.011 | DEBUG    | __main__:trials:29 - Trial = 4702/30000 | Total reward = 52.22
2022-01-26 14:16:47.015 | DEBUG    | __main__:trials:24 - Trial = 4703/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.016 | DEBUG    | __main__:trials:29 - Trial = 4703/30000 | Total reward = 38.79
2022-01-26 14:16:47.020 | DEBUG    | __main__:trials:24 - Trial = 4704/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.022 | DEBUG    | __main__:trials:29 - Trial = 4704/30000 | Total reward = 30.86
2022-01-26 14:16:47.025 | DEBUG    | __main__:trials:24 - Trial = 4705/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.026 | DEBUG    | __main__:trials:29 - Trial = 4705/30000 | Total reward = 44.11
2022-01-26 14:16:47.029 | DEBUG    | __main__:trials:24 - Trial = 4706/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.031 | DEBUG    | __main__:trials:29 - Trial = 4706/30000 | Total reward = 52.83
2022-01-26 14:16:47.035 | DEBUG    | __main__:trials:24 - Trial = 4707/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.036 | DEBUG    | __main__:trials:29 - Trial = 4707/30000 | Total reward = 47.24
2022-01-26 14:16:47.040 | DEBUG    | __main__:trials:24 - Trial = 4708/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.041 | DEBUG    | __main__:trials:29 - Trial = 4708/30000 | Total reward = 46.78
2022-01-26 14:16:47.044 | DEBUG    | __main__:trials:24 - Trial = 4709/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.046 | DEBUG    | __main__:trials:29 - Trial = 4709/30000 | Total reward = 47.74
2022-01-26 14:16:47.050 | DEBUG    | __main__:trials:24 - Trial = 4710/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.051 | DEBUG    | __main__:trials:29 - Trial = 4710/30000 | Total reward = 48.92
2022-01-26 14:16:47.055 | DEBUG    | __main__:trials:24 - Trial = 4711/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.057 | DEBUG    | __main__:trials:29 - Trial = 4711/30000 | Total reward = 57.63
2022-01-26 14:16:47.060 | DEBUG    | __main__:trials:24 - Trial = 4712/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.062 | DEBUG    | __main__:trials:29 - Trial = 4712/30000 | Total reward = 38.11
2022-01-26 14:16:47.065 | DEBUG    | __main__:trials:24 - Trial = 4713/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.067 | DEBUG    | __main__:trials:29 - Trial = 4713/30000 | Total reward = 46.27
2022-01-26 14:16:47.071 | DEBUG    | __main__:trials:24 - Trial = 4714/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.072 | DEBUG    | __main__:trials:29 - Trial = 4714/30000 | Total reward = 45.98
2022-01-26 14:16:47.076 | DEBUG    | __main__:trials:24 - Trial = 4715/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.077 | DEBUG    | __main__:trials:29 - Trial = 4715/30000 | Total reward = 46.70
2022-01-26 14:16:47.081 | DEBUG    | __main__:trials:24 - Trial = 4716/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.084 | DEBUG    | __main__:trials:29 - Trial = 4716/30000 | Total reward = 48.25
2022-01-26 14:16:47.087 | DEBUG    | __main__:trials:24 - Trial = 4717/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.089 | DEBUG    | __main__:trials:29 - Trial = 4717/30000 | Total reward = 46.07
2022-01-26 14:16:47.093 | DEBUG    | __main__:trials:24 - Trial = 4718/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.095 | DEBUG    | __main__:trials:29 - Trial = 4718/30000 | Total reward = 38.62
2022-01-26 14:16:47.098 | DEBUG    | __main__:trials:24 - Trial = 4719/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.102 | DEBUG    | __main__:trials:29 - Trial = 4719/30000 | Total reward = 26.05
2022-01-26 14:16:47.105 | DEBUG    | __main__:trials:24 - Trial = 4720/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.106 | DEBUG    | __main__:trials:29 - Trial = 4720/30000 | Total reward = 25.51
2022-01-26 14:16:47.109 | DEBUG    | __main__:trials:24 - Trial = 4721/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.110 | DEBUG    | __main__:trials:29 - Trial = 4721/30000 | Total reward = 33.98
2022-01-26 14:16:47.114 | DEBUG    | __main__:trials:24 - Trial = 4722/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.115 | DEBUG    | __main__:trials:29 - Trial = 4722/30000 | Total reward = 36.36
2022-01-26 14:16:47.119 | DEBUG    | __main__:trials:24 - Trial = 4723/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.121 | DEBUG    | __main__:trials:29 - Trial = 4723/30000 | Total reward = 42.66
2022-01-26 14:16:47.124 | DEBUG    | __main__:trials:24 - Trial = 4724/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.125 | DEBUG    | __main__:trials:29 - Trial = 4724/30000 | Total reward = 46.81
2022-01-26 14:16:47.129 | DEBUG    | __main__:trials:24 - Trial = 4725/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.131 | DEBUG    | __main__:trials:29 - Trial = 4725/30000 | Total reward = 38.45
2022-01-26 14:16:47.135 | DEBUG    | __main__:trials:24 - Trial = 4726/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.136 | DEBUG    | __main__:trials:29 - Trial = 4726/30000 | Total reward = 58.51
2022-01-26 14:16:47.140 | DEBUG    | __main__:trials:24 - Trial = 4727/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.142 | DEBUG    | __main__:trials:29 - Trial = 4727/30000 | Total reward = 46.70
2022-01-26 14:16:47.145 | DEBUG    | __main__:trials:24 - Trial = 4728/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.147 | DEBUG    | __main__:trials:29 - Trial = 4728/30000 | Total reward = 51.97
2022-01-26 14:16:47.150 | DEBUG    | __main__:trials:24 - Trial = 4729/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.152 | DEBUG    | __main__:trials:29 - Trial = 4729/30000 | Total reward = 51.23
2022-01-26 14:16:47.155 | DEBUG    | __main__:trials:24 - Trial = 4730/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.157 | DEBUG    | __main__:trials:29 - Trial = 4730/30000 | Total reward = 52.37
2022-01-26 14:16:47.161 | DEBUG    | __main__:trials:24 - Trial = 4731/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.162 | DEBUG    | __main__:trials:29 - Trial = 4731/30000 | Total reward = 52.94
2022-01-26 14:16:47.165 | DEBUG    | __main__:trials:24 - Trial = 4732/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.166 | DEBUG    | __main__:trials:29 - Trial = 4732/30000 | Total reward = 47.34
2022-01-26 14:16:47.170 | DEBUG    | __main__:trials:24 - Trial = 4733/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.170 | DEBUG    | __main__:trials:29 - Trial = 4733/30000 | Total reward = 44.89
2022-01-26 14:16:47.174 | DEBUG    | __main__:trials:24 - Trial = 4734/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.175 | DEBUG    | __main__:trials:29 - Trial = 4734/30000 | Total reward = 24.16
2022-01-26 14:16:47.179 | DEBUG    | __main__:trials:24 - Trial = 4735/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.180 | DEBUG    | __main__:trials:29 - Trial = 4735/30000 | Total reward = 44.86
2022-01-26 14:16:47.184 | DEBUG    | __main__:trials:24 - Trial = 4736/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.185 | DEBUG    | __main__:trials:29 - Trial = 4736/30000 | Total reward = 35.97
2022-01-26 14:16:47.188 | DEBUG    | __main__:trials:24 - Trial = 4737/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.190 | DEBUG    | __main__:trials:29 - Trial = 4737/30000 | Total reward = 45.42
2022-01-26 14:16:47.193 | DEBUG    | __main__:trials:24 - Trial = 4738/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.194 | DEBUG    | __main__:trials:29 - Trial = 4738/30000 | Total reward = 41.66
2022-01-26 14:16:47.197 | DEBUG    | __main__:trials:24 - Trial = 4739/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.198 | DEBUG    | __main__:trials:29 - Trial = 4739/30000 | Total reward = 44.67
2022-01-26 14:16:47.202 | DEBUG    | __main__:trials:24 - Trial = 4740/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.203 | DEBUG    | __main__:trials:29 - Trial = 4740/30000 | Total reward = 48.46
2022-01-26 14:16:47.207 | DEBUG    | __main__:trials:24 - Trial = 4741/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.209 | DEBUG    | __main__:trials:29 - Trial = 4741/30000 | Total reward = 45.30
2022-01-26 14:16:47.212 | DEBUG    | __main__:trials:24 - Trial = 4742/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.213 | DEBUG    | __main__:trials:29 - Trial = 4742/30000 | Total reward = 47.23
2022-01-26 14:16:47.216 | DEBUG    | __main__:trials:24 - Trial = 4743/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.217 | DEBUG    | __main__:trials:29 - Trial = 4743/30000 | Total reward = 45.23
2022-01-26 14:16:47.221 | DEBUG    | __main__:trials:24 - Trial = 4744/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.221 | DEBUG    | __main__:trials:29 - Trial = 4744/30000 | Total reward = 46.70
2022-01-26 14:16:47.225 | DEBUG    | __main__:trials:24 - Trial = 4745/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.227 | DEBUG    | __main__:trials:29 - Trial = 4745/30000 | Total reward = 31.53
2022-01-26 14:16:47.231 | DEBUG    | __main__:trials:24 - Trial = 4746/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.232 | DEBUG    | __main__:trials:29 - Trial = 4746/30000 | Total reward = 42.75
2022-01-26 14:16:47.236 | DEBUG    | __main__:trials:24 - Trial = 4747/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.237 | DEBUG    | __main__:trials:29 - Trial = 4747/30000 | Total reward = 42.37
2022-01-26 14:16:47.241 | DEBUG    | __main__:trials:24 - Trial = 4748/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.242 | DEBUG    | __main__:trials:29 - Trial = 4748/30000 | Total reward = 44.36
2022-01-26 14:16:47.245 | DEBUG    | __main__:trials:24 - Trial = 4749/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.247 | DEBUG    | __main__:trials:29 - Trial = 4749/30000 | Total reward = 29.00
2022-01-26 14:16:47.251 | DEBUG    | __main__:trials:24 - Trial = 4750/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.253 | DEBUG    | __main__:trials:29 - Trial = 4750/30000 | Total reward = 27.95
2022-01-26 14:16:47.256 | DEBUG    | __main__:trials:24 - Trial = 4751/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.258 | DEBUG    | __main__:trials:29 - Trial = 4751/30000 | Total reward = 48.56
2022-01-26 14:16:47.262 | DEBUG    | __main__:trials:24 - Trial = 4752/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.264 | DEBUG    | __main__:trials:29 - Trial = 4752/30000 | Total reward = 27.07
2022-01-26 14:16:47.267 | DEBUG    | __main__:trials:24 - Trial = 4753/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.269 | DEBUG    | __main__:trials:29 - Trial = 4753/30000 | Total reward = 48.33
2022-01-26 14:16:47.273 | DEBUG    | __main__:trials:24 - Trial = 4754/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.273 | DEBUG    | __main__:trials:29 - Trial = 4754/30000 | Total reward = 55.92
2022-01-26 14:16:47.278 | DEBUG    | __main__:trials:24 - Trial = 4755/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.279 | DEBUG    | __main__:trials:29 - Trial = 4755/30000 | Total reward = 43.61
2022-01-26 14:16:47.282 | DEBUG    | __main__:trials:24 - Trial = 4756/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.284 | DEBUG    | __main__:trials:29 - Trial = 4756/30000 | Total reward = 27.59
2022-01-26 14:16:47.288 | DEBUG    | __main__:trials:24 - Trial = 4757/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.290 | DEBUG    | __main__:trials:29 - Trial = 4757/30000 | Total reward = 47.11
2022-01-26 14:16:47.293 | DEBUG    | __main__:trials:24 - Trial = 4758/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.295 | DEBUG    | __main__:trials:29 - Trial = 4758/30000 | Total reward = 48.32
2022-01-26 14:16:47.299 | DEBUG    | __main__:trials:24 - Trial = 4759/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.301 | DEBUG    | __main__:trials:29 - Trial = 4759/30000 | Total reward = 56.65
2022-01-26 14:16:47.304 | DEBUG    | __main__:trials:24 - Trial = 4760/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.306 | DEBUG    | __main__:trials:29 - Trial = 4760/30000 | Total reward = 48.43
2022-01-26 14:16:47.310 | DEBUG    | __main__:trials:24 - Trial = 4761/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.311 | DEBUG    | __main__:trials:29 - Trial = 4761/30000 | Total reward = 43.20
2022-01-26 14:16:47.315 | DEBUG    | __main__:trials:24 - Trial = 4762/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.317 | DEBUG    | __main__:trials:29 - Trial = 4762/30000 | Total reward = 44.64
2022-01-26 14:16:47.320 | DEBUG    | __main__:trials:24 - Trial = 4763/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.322 | DEBUG    | __main__:trials:29 - Trial = 4763/30000 | Total reward = 46.44
2022-01-26 14:16:47.326 | DEBUG    | __main__:trials:24 - Trial = 4764/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.327 | DEBUG    | __main__:trials:29 - Trial = 4764/30000 | Total reward = 33.05
2022-01-26 14:16:47.329 | DEBUG    | __main__:trials:26 - Trial = 4765/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.330 | DEBUG    | __main__:trials:29 - Trial = 4765/30000 | Total reward = 14.30
2022-01-26 14:16:47.334 | DEBUG    | __main__:trials:24 - Trial = 4766/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.334 | DEBUG    | __main__:trials:29 - Trial = 4766/30000 | Total reward = 59.69
2022-01-26 14:16:47.338 | DEBUG    | __main__:trials:24 - Trial = 4767/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.339 | DEBUG    | __main__:trials:29 - Trial = 4767/30000 | Total reward = 44.68
2022-01-26 14:16:47.343 | DEBUG    | __main__:trials:24 - Trial = 4768/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.345 | DEBUG    | __main__:trials:29 - Trial = 4768/30000 | Total reward = 46.70
2022-01-26 14:16:47.348 | DEBUG    | __main__:trials:24 - Trial = 4769/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.350 | DEBUG    | __main__:trials:29 - Trial = 4769/30000 | Total reward = 47.44
2022-01-26 14:16:47.354 | DEBUG    | __main__:trials:24 - Trial = 4770/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.355 | DEBUG    | __main__:trials:29 - Trial = 4770/30000 | Total reward = 48.87
2022-01-26 14:16:47.359 | DEBUG    | __main__:trials:24 - Trial = 4771/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.361 | DEBUG    | __main__:trials:29 - Trial = 4771/30000 | Total reward = 48.97
2022-01-26 14:16:47.364 | DEBUG    | __main__:trials:24 - Trial = 4772/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.366 | DEBUG    | __main__:trials:29 - Trial = 4772/30000 | Total reward = 47.00
2022-01-26 14:16:47.370 | DEBUG    | __main__:trials:24 - Trial = 4773/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.371 | DEBUG    | __main__:trials:29 - Trial = 4773/30000 | Total reward = 48.86
2022-01-26 14:16:47.375 | DEBUG    | __main__:trials:24 - Trial = 4774/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.375 | DEBUG    | __main__:trials:29 - Trial = 4774/30000 | Total reward = 43.26
2022-01-26 14:16:47.380 | DEBUG    | __main__:trials:24 - Trial = 4775/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.381 | DEBUG    | __main__:trials:29 - Trial = 4775/30000 | Total reward = 45.29
2022-01-26 14:16:47.385 | DEBUG    | __main__:trials:24 - Trial = 4776/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.386 | DEBUG    | __main__:trials:29 - Trial = 4776/30000 | Total reward = 38.77
2022-01-26 14:16:47.390 | DEBUG    | __main__:trials:24 - Trial = 4777/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.392 | DEBUG    | __main__:trials:29 - Trial = 4777/30000 | Total reward = 42.65
2022-01-26 14:16:47.395 | DEBUG    | __main__:trials:24 - Trial = 4778/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.396 | DEBUG    | __main__:trials:29 - Trial = 4778/30000 | Total reward = 53.51
2022-01-26 14:16:47.400 | DEBUG    | __main__:trials:24 - Trial = 4779/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.402 | DEBUG    | __main__:trials:29 - Trial = 4779/30000 | Total reward = 51.45
2022-01-26 14:16:47.406 | DEBUG    | __main__:trials:24 - Trial = 4780/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.406 | DEBUG    | __main__:trials:29 - Trial = 4780/30000 | Total reward = 40.92
2022-01-26 14:16:47.411 | DEBUG    | __main__:trials:24 - Trial = 4781/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.412 | DEBUG    | __main__:trials:29 - Trial = 4781/30000 | Total reward = 48.32
2022-01-26 14:16:47.416 | DEBUG    | __main__:trials:24 - Trial = 4782/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.417 | DEBUG    | __main__:trials:29 - Trial = 4782/30000 | Total reward = 53.56
2022-01-26 14:16:47.421 | DEBUG    | __main__:trials:24 - Trial = 4783/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.422 | DEBUG    | __main__:trials:29 - Trial = 4783/30000 | Total reward = 47.22
2022-01-26 14:16:47.425 | DEBUG    | __main__:trials:24 - Trial = 4784/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.427 | DEBUG    | __main__:trials:29 - Trial = 4784/30000 | Total reward = 46.25
2022-01-26 14:16:47.431 | DEBUG    | __main__:trials:24 - Trial = 4785/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.432 | DEBUG    | __main__:trials:29 - Trial = 4785/30000 | Total reward = 42.03
2022-01-26 14:16:47.436 | DEBUG    | __main__:trials:24 - Trial = 4786/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.437 | DEBUG    | __main__:trials:29 - Trial = 4786/30000 | Total reward = 42.20
2022-01-26 14:16:47.441 | DEBUG    | __main__:trials:24 - Trial = 4787/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.443 | DEBUG    | __main__:trials:29 - Trial = 4787/30000 | Total reward = 47.58
2022-01-26 14:16:47.447 | DEBUG    | __main__:trials:24 - Trial = 4788/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.448 | DEBUG    | __main__:trials:29 - Trial = 4788/30000 | Total reward = 39.48
2022-01-26 14:16:47.452 | DEBUG    | __main__:trials:24 - Trial = 4789/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.454 | DEBUG    | __main__:trials:29 - Trial = 4789/30000 | Total reward = 44.93
2022-01-26 14:16:47.458 | DEBUG    | __main__:trials:24 - Trial = 4790/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.460 | DEBUG    | __main__:trials:29 - Trial = 4790/30000 | Total reward = 62.74
2022-01-26 14:16:47.463 | DEBUG    | __main__:trials:24 - Trial = 4791/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.465 | DEBUG    | __main__:trials:29 - Trial = 4791/30000 | Total reward = 52.24
2022-01-26 14:16:47.469 | DEBUG    | __main__:trials:24 - Trial = 4792/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.471 | DEBUG    | __main__:trials:29 - Trial = 4792/30000 | Total reward = 37.04
2022-01-26 14:16:47.474 | DEBUG    | __main__:trials:24 - Trial = 4793/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.476 | DEBUG    | __main__:trials:29 - Trial = 4793/30000 | Total reward = 51.34
2022-01-26 14:16:47.479 | DEBUG    | __main__:trials:24 - Trial = 4794/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.480 | DEBUG    | __main__:trials:29 - Trial = 4794/30000 | Total reward = 41.62
2022-01-26 14:16:47.484 | DEBUG    | __main__:trials:26 - Trial = 4795/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.486 | DEBUG    | __main__:trials:29 - Trial = 4795/30000 | Total reward = 21.22
2022-01-26 14:16:47.489 | DEBUG    | __main__:trials:24 - Trial = 4796/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.490 | DEBUG    | __main__:trials:29 - Trial = 4796/30000 | Total reward = 47.72
2022-01-26 14:16:47.495 | DEBUG    | __main__:trials:24 - Trial = 4797/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.496 | DEBUG    | __main__:trials:29 - Trial = 4797/30000 | Total reward = 52.46
2022-01-26 14:16:47.499 | DEBUG    | __main__:trials:26 - Trial = 4798/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.501 | DEBUG    | __main__:trials:29 - Trial = 4798/30000 | Total reward = 33.37
2022-01-26 14:16:47.505 | DEBUG    | __main__:trials:24 - Trial = 4799/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.506 | DEBUG    | __main__:trials:29 - Trial = 4799/30000 | Total reward = 49.13
2022-01-26 14:16:47.510 | DEBUG    | __main__:trials:24 - Trial = 4800/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.511 | DEBUG    | __main__:trials:29 - Trial = 4800/30000 | Total reward = 42.76
2022-01-26 14:16:47.515 | DEBUG    | __main__:trials:24 - Trial = 4801/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.517 | DEBUG    | __main__:trials:29 - Trial = 4801/30000 | Total reward = 50.72
2022-01-26 14:16:47.521 | DEBUG    | __main__:trials:24 - Trial = 4802/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.522 | DEBUG    | __main__:trials:29 - Trial = 4802/30000 | Total reward = 35.28
2022-01-26 14:16:47.525 | DEBUG    | __main__:trials:24 - Trial = 4803/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.527 | DEBUG    | __main__:trials:29 - Trial = 4803/30000 | Total reward = 46.59
2022-01-26 14:16:47.529 | DEBUG    | __main__:trials:24 - Trial = 4804/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.530 | DEBUG    | __main__:trials:29 - Trial = 4804/30000 | Total reward = 59.76
2022-01-26 14:16:47.534 | DEBUG    | __main__:trials:24 - Trial = 4805/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.535 | DEBUG    | __main__:trials:29 - Trial = 4805/30000 | Total reward = 43.64
2022-01-26 14:16:47.539 | DEBUG    | __main__:trials:24 - Trial = 4806/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.540 | DEBUG    | __main__:trials:29 - Trial = 4806/30000 | Total reward = 58.53
2022-01-26 14:16:47.544 | DEBUG    | __main__:trials:24 - Trial = 4807/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.546 | DEBUG    | __main__:trials:29 - Trial = 4807/30000 | Total reward = 41.83
2022-01-26 14:16:47.549 | DEBUG    | __main__:trials:26 - Trial = 4808/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.550 | DEBUG    | __main__:trials:29 - Trial = 4808/30000 | Total reward = 27.74
2022-01-26 14:16:47.554 | DEBUG    | __main__:trials:24 - Trial = 4809/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.555 | DEBUG    | __main__:trials:29 - Trial = 4809/30000 | Total reward = 43.96
2022-01-26 14:16:47.559 | DEBUG    | __main__:trials:24 - Trial = 4810/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.560 | DEBUG    | __main__:trials:29 - Trial = 4810/30000 | Total reward = 44.46
2022-01-26 14:16:47.563 | DEBUG    | __main__:trials:24 - Trial = 4811/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.565 | DEBUG    | __main__:trials:29 - Trial = 4811/30000 | Total reward = 50.54
2022-01-26 14:16:47.569 | DEBUG    | __main__:trials:24 - Trial = 4812/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.571 | DEBUG    | __main__:trials:29 - Trial = 4812/30000 | Total reward = 51.22
2022-01-26 14:16:47.574 | DEBUG    | __main__:trials:24 - Trial = 4813/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.575 | DEBUG    | __main__:trials:29 - Trial = 4813/30000 | Total reward = 49.89
2022-01-26 14:16:47.579 | DEBUG    | __main__:trials:24 - Trial = 4814/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.580 | DEBUG    | __main__:trials:29 - Trial = 4814/30000 | Total reward = 43.43
2022-01-26 14:16:47.584 | DEBUG    | __main__:trials:24 - Trial = 4815/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.586 | DEBUG    | __main__:trials:29 - Trial = 4815/30000 | Total reward = 42.82
2022-01-26 14:16:47.589 | DEBUG    | __main__:trials:24 - Trial = 4816/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.590 | DEBUG    | __main__:trials:29 - Trial = 4816/30000 | Total reward = 43.96
2022-01-26 14:16:47.592 | DEBUG    | __main__:trials:26 - Trial = 4817/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.593 | DEBUG    | __main__:trials:29 - Trial = 4817/30000 | Total reward = 10.78
2022-01-26 14:16:47.597 | DEBUG    | __main__:trials:26 - Trial = 4818/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.598 | DEBUG    | __main__:trials:29 - Trial = 4818/30000 | Total reward = 41.70
2022-01-26 14:16:47.602 | DEBUG    | __main__:trials:24 - Trial = 4819/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.604 | DEBUG    | __main__:trials:29 - Trial = 4819/30000 | Total reward = 50.89
2022-01-26 14:16:47.608 | DEBUG    | __main__:trials:24 - Trial = 4820/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.609 | DEBUG    | __main__:trials:29 - Trial = 4820/30000 | Total reward = 47.55
2022-01-26 14:16:47.614 | DEBUG    | __main__:trials:24 - Trial = 4821/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.616 | DEBUG    | __main__:trials:29 - Trial = 4821/30000 | Total reward = 53.45
2022-01-26 14:16:47.619 | DEBUG    | __main__:trials:26 - Trial = 4822/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.620 | DEBUG    | __main__:trials:29 - Trial = 4822/30000 | Total reward = 37.06
2022-01-26 14:16:47.624 | DEBUG    | __main__:trials:24 - Trial = 4823/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.625 | DEBUG    | __main__:trials:29 - Trial = 4823/30000 | Total reward = 56.25
2022-01-26 14:16:47.630 | DEBUG    | __main__:trials:24 - Trial = 4824/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.632 | DEBUG    | __main__:trials:29 - Trial = 4824/30000 | Total reward = 49.95
2022-01-26 14:16:47.636 | DEBUG    | __main__:trials:24 - Trial = 4825/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.637 | DEBUG    | __main__:trials:29 - Trial = 4825/30000 | Total reward = 39.44
2022-01-26 14:16:47.640 | DEBUG    | __main__:trials:24 - Trial = 4826/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.642 | DEBUG    | __main__:trials:29 - Trial = 4826/30000 | Total reward = 43.30
2022-01-26 14:16:47.646 | DEBUG    | __main__:trials:24 - Trial = 4827/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.648 | DEBUG    | __main__:trials:29 - Trial = 4827/30000 | Total reward = 49.57
2022-01-26 14:16:47.651 | DEBUG    | __main__:trials:26 - Trial = 4828/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.651 | DEBUG    | __main__:trials:29 - Trial = 4828/30000 | Total reward = 24.19
2022-01-26 14:16:47.656 | DEBUG    | __main__:trials:24 - Trial = 4829/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.658 | DEBUG    | __main__:trials:29 - Trial = 4829/30000 | Total reward = 44.10
2022-01-26 14:16:47.661 | DEBUG    | __main__:trials:24 - Trial = 4830/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.662 | DEBUG    | __main__:trials:29 - Trial = 4830/30000 | Total reward = 51.88
2022-01-26 14:16:47.667 | DEBUG    | __main__:trials:24 - Trial = 4831/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.669 | DEBUG    | __main__:trials:29 - Trial = 4831/30000 | Total reward = 19.50
2022-01-26 14:16:47.672 | DEBUG    | __main__:trials:24 - Trial = 4832/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.673 | DEBUG    | __main__:trials:29 - Trial = 4832/30000 | Total reward = 51.08
2022-01-26 14:16:47.676 | DEBUG    | __main__:trials:24 - Trial = 4833/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.678 | DEBUG    | __main__:trials:29 - Trial = 4833/30000 | Total reward = 43.59
2022-01-26 14:16:47.682 | DEBUG    | __main__:trials:24 - Trial = 4834/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.683 | DEBUG    | __main__:trials:29 - Trial = 4834/30000 | Total reward = 58.55
2022-01-26 14:16:47.687 | DEBUG    | __main__:trials:24 - Trial = 4835/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.689 | DEBUG    | __main__:trials:29 - Trial = 4835/30000 | Total reward = 46.55
2022-01-26 14:16:47.692 | DEBUG    | __main__:trials:24 - Trial = 4836/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.693 | DEBUG    | __main__:trials:29 - Trial = 4836/30000 | Total reward = 49.23
2022-01-26 14:16:47.698 | DEBUG    | __main__:trials:24 - Trial = 4837/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.699 | DEBUG    | __main__:trials:29 - Trial = 4837/30000 | Total reward = 57.25
2022-01-26 14:16:47.702 | DEBUG    | __main__:trials:24 - Trial = 4838/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.704 | DEBUG    | __main__:trials:29 - Trial = 4838/30000 | Total reward = 48.69
2022-01-26 14:16:47.707 | DEBUG    | __main__:trials:24 - Trial = 4839/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.709 | DEBUG    | __main__:trials:29 - Trial = 4839/30000 | Total reward = 43.62
2022-01-26 14:16:47.713 | DEBUG    | __main__:trials:24 - Trial = 4840/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.714 | DEBUG    | __main__:trials:29 - Trial = 4840/30000 | Total reward = 34.34
2022-01-26 14:16:47.718 | DEBUG    | __main__:trials:24 - Trial = 4841/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.720 | DEBUG    | __main__:trials:29 - Trial = 4841/30000 | Total reward = 46.62
2022-01-26 14:16:47.724 | DEBUG    | __main__:trials:24 - Trial = 4842/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.725 | DEBUG    | __main__:trials:29 - Trial = 4842/30000 | Total reward = 58.11
2022-01-26 14:16:47.728 | DEBUG    | __main__:trials:24 - Trial = 4843/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.729 | DEBUG    | __main__:trials:29 - Trial = 4843/30000 | Total reward = 47.09
2022-01-26 14:16:47.734 | DEBUG    | __main__:trials:24 - Trial = 4844/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.734 | DEBUG    | __main__:trials:29 - Trial = 4844/30000 | Total reward = 41.37
2022-01-26 14:16:47.738 | DEBUG    | __main__:trials:24 - Trial = 4845/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.739 | DEBUG    | __main__:trials:29 - Trial = 4845/30000 | Total reward = 42.66
2022-01-26 14:16:47.744 | DEBUG    | __main__:trials:24 - Trial = 4846/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.745 | DEBUG    | __main__:trials:29 - Trial = 4846/30000 | Total reward = 49.86
2022-01-26 14:16:47.749 | DEBUG    | __main__:trials:24 - Trial = 4847/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.750 | DEBUG    | __main__:trials:29 - Trial = 4847/30000 | Total reward = 49.68
2022-01-26 14:16:47.754 | DEBUG    | __main__:trials:24 - Trial = 4848/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.755 | DEBUG    | __main__:trials:29 - Trial = 4848/30000 | Total reward = 41.59
2022-01-26 14:16:47.759 | DEBUG    | __main__:trials:24 - Trial = 4849/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.760 | DEBUG    | __main__:trials:29 - Trial = 4849/30000 | Total reward = 55.91
2022-01-26 14:16:47.765 | DEBUG    | __main__:trials:24 - Trial = 4850/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.766 | DEBUG    | __main__:trials:29 - Trial = 4850/30000 | Total reward = 47.61
2022-01-26 14:16:47.769 | DEBUG    | __main__:trials:24 - Trial = 4851/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.771 | DEBUG    | __main__:trials:29 - Trial = 4851/30000 | Total reward = 36.10
2022-01-26 14:16:47.775 | DEBUG    | __main__:trials:24 - Trial = 4852/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.776 | DEBUG    | __main__:trials:29 - Trial = 4852/30000 | Total reward = 38.98
2022-01-26 14:16:47.780 | DEBUG    | __main__:trials:24 - Trial = 4853/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.783 | DEBUG    | __main__:trials:29 - Trial = 4853/30000 | Total reward = 58.60
2022-01-26 14:16:47.786 | DEBUG    | __main__:trials:24 - Trial = 4854/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.787 | DEBUG    | __main__:trials:29 - Trial = 4854/30000 | Total reward = 38.19
2022-01-26 14:16:47.791 | DEBUG    | __main__:trials:24 - Trial = 4855/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.792 | DEBUG    | __main__:trials:29 - Trial = 4855/30000 | Total reward = 48.78
2022-01-26 14:16:47.796 | DEBUG    | __main__:trials:24 - Trial = 4856/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.796 | DEBUG    | __main__:trials:29 - Trial = 4856/30000 | Total reward = 31.65
2022-01-26 14:16:47.800 | DEBUG    | __main__:trials:24 - Trial = 4857/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.802 | DEBUG    | __main__:trials:29 - Trial = 4857/30000 | Total reward = 49.53
2022-01-26 14:16:47.805 | DEBUG    | __main__:trials:24 - Trial = 4858/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.807 | DEBUG    | __main__:trials:29 - Trial = 4858/30000 | Total reward = 37.41
2022-01-26 14:16:47.811 | DEBUG    | __main__:trials:24 - Trial = 4859/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.813 | DEBUG    | __main__:trials:29 - Trial = 4859/30000 | Total reward = 47.95
2022-01-26 14:16:47.816 | DEBUG    | __main__:trials:24 - Trial = 4860/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.818 | DEBUG    | __main__:trials:29 - Trial = 4860/30000 | Total reward = 37.63
2022-01-26 14:16:47.822 | DEBUG    | __main__:trials:24 - Trial = 4861/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.823 | DEBUG    | __main__:trials:29 - Trial = 4861/30000 | Total reward = 54.49
2022-01-26 14:16:47.827 | DEBUG    | __main__:trials:24 - Trial = 4862/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.828 | DEBUG    | __main__:trials:29 - Trial = 4862/30000 | Total reward = 43.22
2022-01-26 14:16:47.832 | DEBUG    | __main__:trials:24 - Trial = 4863/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.833 | DEBUG    | __main__:trials:29 - Trial = 4863/30000 | Total reward = 44.71
2022-01-26 14:16:47.837 | DEBUG    | __main__:trials:24 - Trial = 4864/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.838 | DEBUG    | __main__:trials:29 - Trial = 4864/30000 | Total reward = 49.34
2022-01-26 14:16:47.842 | DEBUG    | __main__:trials:24 - Trial = 4865/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.844 | DEBUG    | __main__:trials:29 - Trial = 4865/30000 | Total reward = 34.73
2022-01-26 14:16:47.847 | DEBUG    | __main__:trials:24 - Trial = 4866/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.849 | DEBUG    | __main__:trials:29 - Trial = 4866/30000 | Total reward = 46.39
2022-01-26 14:16:47.852 | DEBUG    | __main__:trials:24 - Trial = 4867/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.854 | DEBUG    | __main__:trials:29 - Trial = 4867/30000 | Total reward = 32.19
2022-01-26 14:16:47.857 | DEBUG    | __main__:trials:24 - Trial = 4868/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.858 | DEBUG    | __main__:trials:29 - Trial = 4868/30000 | Total reward = 46.25
2022-01-26 14:16:47.861 | DEBUG    | __main__:trials:24 - Trial = 4869/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.862 | DEBUG    | __main__:trials:29 - Trial = 4869/30000 | Total reward = 46.21
2022-01-26 14:16:47.866 | DEBUG    | __main__:trials:24 - Trial = 4870/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.866 | DEBUG    | __main__:trials:29 - Trial = 4870/30000 | Total reward = 43.66
2022-01-26 14:16:47.870 | DEBUG    | __main__:trials:24 - Trial = 4871/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.871 | DEBUG    | __main__:trials:29 - Trial = 4871/30000 | Total reward = 43.02
2022-01-26 14:16:47.874 | DEBUG    | __main__:trials:26 - Trial = 4872/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:47.875 | DEBUG    | __main__:trials:29 - Trial = 4872/30000 | Total reward = 22.99
2022-01-26 14:16:47.878 | DEBUG    | __main__:trials:24 - Trial = 4873/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.879 | DEBUG    | __main__:trials:29 - Trial = 4873/30000 | Total reward = 49.24
2022-01-26 14:16:47.883 | DEBUG    | __main__:trials:24 - Trial = 4874/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.883 | DEBUG    | __main__:trials:29 - Trial = 4874/30000 | Total reward = 52.90
2022-01-26 14:16:47.887 | DEBUG    | __main__:trials:24 - Trial = 4875/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.888 | DEBUG    | __main__:trials:29 - Trial = 4875/30000 | Total reward = 45.03
2022-01-26 14:16:47.892 | DEBUG    | __main__:trials:24 - Trial = 4876/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.893 | DEBUG    | __main__:trials:29 - Trial = 4876/30000 | Total reward = 31.76
2022-01-26 14:16:47.897 | DEBUG    | __main__:trials:24 - Trial = 4877/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.898 | DEBUG    | __main__:trials:29 - Trial = 4877/30000 | Total reward = 32.93
2022-01-26 14:16:47.902 | DEBUG    | __main__:trials:24 - Trial = 4878/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.904 | DEBUG    | __main__:trials:29 - Trial = 4878/30000 | Total reward = 47.03
2022-01-26 14:16:47.907 | DEBUG    | __main__:trials:24 - Trial = 4879/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.909 | DEBUG    | __main__:trials:29 - Trial = 4879/30000 | Total reward = 49.24
2022-01-26 14:16:47.912 | DEBUG    | __main__:trials:24 - Trial = 4880/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.914 | DEBUG    | __main__:trials:29 - Trial = 4880/30000 | Total reward = 51.95
2022-01-26 14:16:47.918 | DEBUG    | __main__:trials:24 - Trial = 4881/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.919 | DEBUG    | __main__:trials:29 - Trial = 4881/30000 | Total reward = 60.03
2022-01-26 14:16:47.922 | DEBUG    | __main__:trials:24 - Trial = 4882/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.924 | DEBUG    | __main__:trials:29 - Trial = 4882/30000 | Total reward = 48.29
2022-01-26 14:16:47.928 | DEBUG    | __main__:trials:24 - Trial = 4883/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.929 | DEBUG    | __main__:trials:29 - Trial = 4883/30000 | Total reward = 44.16
2022-01-26 14:16:47.933 | DEBUG    | __main__:trials:24 - Trial = 4884/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.933 | DEBUG    | __main__:trials:29 - Trial = 4884/30000 | Total reward = 38.47
2022-01-26 14:16:47.937 | DEBUG    | __main__:trials:24 - Trial = 4885/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.937 | DEBUG    | __main__:trials:29 - Trial = 4885/30000 | Total reward = 32.61
2022-01-26 14:16:47.942 | DEBUG    | __main__:trials:24 - Trial = 4886/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.943 | DEBUG    | __main__:trials:29 - Trial = 4886/30000 | Total reward = 41.88
2022-01-26 14:16:47.947 | DEBUG    | __main__:trials:24 - Trial = 4887/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.949 | DEBUG    | __main__:trials:29 - Trial = 4887/30000 | Total reward = 49.84
2022-01-26 14:16:47.952 | DEBUG    | __main__:trials:24 - Trial = 4888/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.953 | DEBUG    | __main__:trials:29 - Trial = 4888/30000 | Total reward = 34.58
2022-01-26 14:16:47.956 | DEBUG    | __main__:trials:24 - Trial = 4889/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.958 | DEBUG    | __main__:trials:29 - Trial = 4889/30000 | Total reward = 48.59
2022-01-26 14:16:47.961 | DEBUG    | __main__:trials:24 - Trial = 4890/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.963 | DEBUG    | __main__:trials:29 - Trial = 4890/30000 | Total reward = 42.16
2022-01-26 14:16:47.966 | DEBUG    | __main__:trials:24 - Trial = 4891/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.967 | DEBUG    | __main__:trials:29 - Trial = 4891/30000 | Total reward = 48.59
2022-01-26 14:16:47.970 | DEBUG    | __main__:trials:24 - Trial = 4892/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.972 | DEBUG    | __main__:trials:29 - Trial = 4892/30000 | Total reward = 36.85
2022-01-26 14:16:47.975 | DEBUG    | __main__:trials:24 - Trial = 4893/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.977 | DEBUG    | __main__:trials:29 - Trial = 4893/30000 | Total reward = 51.98
2022-01-26 14:16:47.980 | DEBUG    | __main__:trials:24 - Trial = 4894/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.981 | DEBUG    | __main__:trials:29 - Trial = 4894/30000 | Total reward = 48.98
2022-01-26 14:16:47.984 | DEBUG    | __main__:trials:24 - Trial = 4895/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.985 | DEBUG    | __main__:trials:29 - Trial = 4895/30000 | Total reward = 48.40
2022-01-26 14:16:47.988 | DEBUG    | __main__:trials:24 - Trial = 4896/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.989 | DEBUG    | __main__:trials:29 - Trial = 4896/30000 | Total reward = 44.66
2022-01-26 14:16:47.992 | DEBUG    | __main__:trials:24 - Trial = 4897/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.994 | DEBUG    | __main__:trials:29 - Trial = 4897/30000 | Total reward = 47.24
2022-01-26 14:16:47.997 | DEBUG    | __main__:trials:24 - Trial = 4898/30000 | Max number of steps (20) reached
2022-01-26 14:16:47.998 | DEBUG    | __main__:trials:29 - Trial = 4898/30000 | Total reward = 44.55
2022-01-26 14:16:48.001 | DEBUG    | __main__:trials:24 - Trial = 4899/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.003 | DEBUG    | __main__:trials:29 - Trial = 4899/30000 | Total reward = 43.29
2022-01-26 14:16:48.006 | DEBUG    | __main__:trials:24 - Trial = 4900/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.008 | DEBUG    | __main__:trials:29 - Trial = 4900/30000 | Total reward = 41.94
2022-01-26 14:16:48.012 | DEBUG    | __main__:trials:24 - Trial = 4901/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.012 | DEBUG    | __main__:trials:29 - Trial = 4901/30000 | Total reward = 46.06
2022-01-26 14:16:48.017 | DEBUG    | __main__:trials:24 - Trial = 4902/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.018 | DEBUG    | __main__:trials:29 - Trial = 4902/30000 | Total reward = 49.82
2022-01-26 14:16:48.021 | DEBUG    | __main__:trials:24 - Trial = 4903/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.023 | DEBUG    | __main__:trials:29 - Trial = 4903/30000 | Total reward = 46.80
2022-01-26 14:16:48.027 | DEBUG    | __main__:trials:24 - Trial = 4904/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.028 | DEBUG    | __main__:trials:29 - Trial = 4904/30000 | Total reward = 48.05
2022-01-26 14:16:48.032 | DEBUG    | __main__:trials:24 - Trial = 4905/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.032 | DEBUG    | __main__:trials:29 - Trial = 4905/30000 | Total reward = 43.10
2022-01-26 14:16:48.037 | DEBUG    | __main__:trials:24 - Trial = 4906/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.038 | DEBUG    | __main__:trials:29 - Trial = 4906/30000 | Total reward = 43.68
2022-01-26 14:16:48.042 | DEBUG    | __main__:trials:24 - Trial = 4907/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.044 | DEBUG    | __main__:trials:29 - Trial = 4907/30000 | Total reward = 40.90
2022-01-26 14:16:48.047 | DEBUG    | __main__:trials:24 - Trial = 4908/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.049 | DEBUG    | __main__:trials:29 - Trial = 4908/30000 | Total reward = 35.86
2022-01-26 14:16:48.052 | DEBUG    | __main__:trials:24 - Trial = 4909/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.053 | DEBUG    | __main__:trials:29 - Trial = 4909/30000 | Total reward = 48.52
2022-01-26 14:16:48.057 | DEBUG    | __main__:trials:24 - Trial = 4910/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.058 | DEBUG    | __main__:trials:29 - Trial = 4910/30000 | Total reward = 47.31
2022-01-26 14:16:48.061 | DEBUG    | __main__:trials:24 - Trial = 4911/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.063 | DEBUG    | __main__:trials:29 - Trial = 4911/30000 | Total reward = 51.17
2022-01-26 14:16:48.066 | DEBUG    | __main__:trials:24 - Trial = 4912/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.068 | DEBUG    | __main__:trials:29 - Trial = 4912/30000 | Total reward = 53.48
2022-01-26 14:16:48.072 | DEBUG    | __main__:trials:24 - Trial = 4913/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.073 | DEBUG    | __main__:trials:29 - Trial = 4913/30000 | Total reward = 39.98
2022-01-26 14:16:48.077 | DEBUG    | __main__:trials:24 - Trial = 4914/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.078 | DEBUG    | __main__:trials:29 - Trial = 4914/30000 | Total reward = 46.26
2022-01-26 14:16:48.082 | DEBUG    | __main__:trials:24 - Trial = 4915/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.084 | DEBUG    | __main__:trials:29 - Trial = 4915/30000 | Total reward = 49.11
2022-01-26 14:16:48.088 | DEBUG    | __main__:trials:24 - Trial = 4916/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.090 | DEBUG    | __main__:trials:29 - Trial = 4916/30000 | Total reward = 31.06
2022-01-26 14:16:48.093 | DEBUG    | __main__:trials:24 - Trial = 4917/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.095 | DEBUG    | __main__:trials:29 - Trial = 4917/30000 | Total reward = 47.08
2022-01-26 14:16:48.098 | DEBUG    | __main__:trials:26 - Trial = 4918/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:48.099 | DEBUG    | __main__:trials:29 - Trial = 4918/30000 | Total reward = 28.05
2022-01-26 14:16:48.103 | DEBUG    | __main__:trials:24 - Trial = 4919/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.104 | DEBUG    | __main__:trials:29 - Trial = 4919/30000 | Total reward = 50.26
2022-01-26 14:16:48.109 | DEBUG    | __main__:trials:24 - Trial = 4920/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.110 | DEBUG    | __main__:trials:29 - Trial = 4920/30000 | Total reward = 49.44
2022-01-26 14:16:48.114 | DEBUG    | __main__:trials:24 - Trial = 4921/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.116 | DEBUG    | __main__:trials:29 - Trial = 4921/30000 | Total reward = 53.75
2022-01-26 14:16:48.119 | DEBUG    | __main__:trials:24 - Trial = 4922/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.121 | DEBUG    | __main__:trials:29 - Trial = 4922/30000 | Total reward = 33.17
2022-01-26 14:16:48.125 | DEBUG    | __main__:trials:24 - Trial = 4923/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.126 | DEBUG    | __main__:trials:29 - Trial = 4923/30000 | Total reward = 44.47
2022-01-26 14:16:48.130 | DEBUG    | __main__:trials:24 - Trial = 4924/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.131 | DEBUG    | __main__:trials:29 - Trial = 4924/30000 | Total reward = 50.19
2022-01-26 14:16:48.134 | DEBUG    | __main__:trials:24 - Trial = 4925/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.136 | DEBUG    | __main__:trials:29 - Trial = 4925/30000 | Total reward = 46.14
2022-01-26 14:16:48.139 | DEBUG    | __main__:trials:24 - Trial = 4926/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.141 | DEBUG    | __main__:trials:29 - Trial = 4926/30000 | Total reward = 49.92
2022-01-26 14:16:48.144 | DEBUG    | __main__:trials:24 - Trial = 4927/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.145 | DEBUG    | __main__:trials:29 - Trial = 4927/30000 | Total reward = 44.87
2022-01-26 14:16:48.150 | DEBUG    | __main__:trials:24 - Trial = 4928/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.151 | DEBUG    | __main__:trials:29 - Trial = 4928/30000 | Total reward = 53.49
2022-01-26 14:16:48.154 | DEBUG    | __main__:trials:24 - Trial = 4929/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.156 | DEBUG    | __main__:trials:29 - Trial = 4929/30000 | Total reward = 48.22
2022-01-26 14:16:48.159 | DEBUG    | __main__:trials:24 - Trial = 4930/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.161 | DEBUG    | __main__:trials:29 - Trial = 4930/30000 | Total reward = 32.94
2022-01-26 14:16:48.164 | DEBUG    | __main__:trials:24 - Trial = 4931/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.166 | DEBUG    | __main__:trials:29 - Trial = 4931/30000 | Total reward = 48.78
2022-01-26 14:16:48.169 | DEBUG    | __main__:trials:26 - Trial = 4932/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:48.171 | DEBUG    | __main__:trials:29 - Trial = 4932/30000 | Total reward = 14.46
2022-01-26 14:16:48.174 | DEBUG    | __main__:trials:24 - Trial = 4933/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.176 | DEBUG    | __main__:trials:29 - Trial = 4933/30000 | Total reward = 48.94
2022-01-26 14:16:48.180 | DEBUG    | __main__:trials:24 - Trial = 4934/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.180 | DEBUG    | __main__:trials:29 - Trial = 4934/30000 | Total reward = 64.00
2022-01-26 14:16:48.185 | DEBUG    | __main__:trials:24 - Trial = 4935/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.186 | DEBUG    | __main__:trials:29 - Trial = 4935/30000 | Total reward = 51.82
2022-01-26 14:16:48.189 | DEBUG    | __main__:trials:24 - Trial = 4936/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.189 | DEBUG    | __main__:trials:29 - Trial = 4936/30000 | Total reward = 44.12
2022-01-26 14:16:48.193 | DEBUG    | __main__:trials:24 - Trial = 4937/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.194 | DEBUG    | __main__:trials:29 - Trial = 4937/30000 | Total reward = 53.95
2022-01-26 14:16:48.198 | DEBUG    | __main__:trials:24 - Trial = 4938/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.199 | DEBUG    | __main__:trials:29 - Trial = 4938/30000 | Total reward = 30.53
2022-01-26 14:16:48.203 | DEBUG    | __main__:trials:24 - Trial = 4939/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.204 | DEBUG    | __main__:trials:29 - Trial = 4939/30000 | Total reward = 38.99
2022-01-26 14:16:48.207 | DEBUG    | __main__:trials:24 - Trial = 4940/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.209 | DEBUG    | __main__:trials:29 - Trial = 4940/30000 | Total reward = 52.60
2022-01-26 14:16:48.213 | DEBUG    | __main__:trials:24 - Trial = 4941/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.213 | DEBUG    | __main__:trials:29 - Trial = 4941/30000 | Total reward = 53.57
2022-01-26 14:16:48.217 | DEBUG    | __main__:trials:24 - Trial = 4942/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.218 | DEBUG    | __main__:trials:29 - Trial = 4942/30000 | Total reward = 48.61
2022-01-26 14:16:48.223 | DEBUG    | __main__:trials:24 - Trial = 4943/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.224 | DEBUG    | __main__:trials:29 - Trial = 4943/30000 | Total reward = 50.52
2022-01-26 14:16:48.228 | DEBUG    | __main__:trials:24 - Trial = 4944/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.230 | DEBUG    | __main__:trials:29 - Trial = 4944/30000 | Total reward = 54.24
2022-01-26 14:16:48.233 | DEBUG    | __main__:trials:24 - Trial = 4945/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.234 | DEBUG    | __main__:trials:29 - Trial = 4945/30000 | Total reward = 48.19
2022-01-26 14:16:48.239 | DEBUG    | __main__:trials:24 - Trial = 4946/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.240 | DEBUG    | __main__:trials:29 - Trial = 4946/30000 | Total reward = 49.42
2022-01-26 14:16:48.244 | DEBUG    | __main__:trials:24 - Trial = 4947/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.245 | DEBUG    | __main__:trials:29 - Trial = 4947/30000 | Total reward = 43.33
2022-01-26 14:16:48.249 | DEBUG    | __main__:trials:24 - Trial = 4948/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.250 | DEBUG    | __main__:trials:29 - Trial = 4948/30000 | Total reward = 48.07
2022-01-26 14:16:48.254 | DEBUG    | __main__:trials:24 - Trial = 4949/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.255 | DEBUG    | __main__:trials:29 - Trial = 4949/30000 | Total reward = 58.23
2022-01-26 14:16:48.259 | DEBUG    | __main__:trials:24 - Trial = 4950/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.261 | DEBUG    | __main__:trials:29 - Trial = 4950/30000 | Total reward = 49.94
2022-01-26 14:16:48.264 | DEBUG    | __main__:trials:24 - Trial = 4951/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.265 | DEBUG    | __main__:trials:29 - Trial = 4951/30000 | Total reward = 44.39
2022-01-26 14:16:48.270 | DEBUG    | __main__:trials:24 - Trial = 4952/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.271 | DEBUG    | __main__:trials:29 - Trial = 4952/30000 | Total reward = 43.12
2022-01-26 14:16:48.274 | DEBUG    | __main__:trials:24 - Trial = 4953/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.276 | DEBUG    | __main__:trials:29 - Trial = 4953/30000 | Total reward = 50.75
2022-01-26 14:16:48.279 | DEBUG    | __main__:trials:24 - Trial = 4954/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.280 | DEBUG    | __main__:trials:29 - Trial = 4954/30000 | Total reward = 31.66
2022-01-26 14:16:48.283 | DEBUG    | __main__:trials:24 - Trial = 4955/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.285 | DEBUG    | __main__:trials:29 - Trial = 4955/30000 | Total reward = 51.60
2022-01-26 14:16:48.288 | DEBUG    | __main__:trials:24 - Trial = 4956/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.290 | DEBUG    | __main__:trials:29 - Trial = 4956/30000 | Total reward = 49.75
2022-01-26 14:16:48.294 | DEBUG    | __main__:trials:24 - Trial = 4957/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.295 | DEBUG    | __main__:trials:29 - Trial = 4957/30000 | Total reward = 50.61
2022-01-26 14:16:48.299 | DEBUG    | __main__:trials:24 - Trial = 4958/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.300 | DEBUG    | __main__:trials:29 - Trial = 4958/30000 | Total reward = 61.99
2022-01-26 14:16:48.303 | DEBUG    | __main__:trials:24 - Trial = 4959/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.305 | DEBUG    | __main__:trials:29 - Trial = 4959/30000 | Total reward = 49.96
2022-01-26 14:16:48.309 | DEBUG    | __main__:trials:24 - Trial = 4960/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.310 | DEBUG    | __main__:trials:29 - Trial = 4960/30000 | Total reward = 53.70
2022-01-26 14:16:48.314 | DEBUG    | __main__:trials:24 - Trial = 4961/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.315 | DEBUG    | __main__:trials:29 - Trial = 4961/30000 | Total reward = 60.08
2022-01-26 14:16:48.319 | DEBUG    | __main__:trials:24 - Trial = 4962/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.319 | DEBUG    | __main__:trials:29 - Trial = 4962/30000 | Total reward = 48.64
2022-01-26 14:16:48.324 | DEBUG    | __main__:trials:24 - Trial = 4963/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.325 | DEBUG    | __main__:trials:29 - Trial = 4963/30000 | Total reward = 49.28
2022-01-26 14:16:48.328 | DEBUG    | __main__:trials:24 - Trial = 4964/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.330 | DEBUG    | __main__:trials:29 - Trial = 4964/30000 | Total reward = 50.71
2022-01-26 14:16:48.334 | DEBUG    | __main__:trials:24 - Trial = 4965/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.335 | DEBUG    | __main__:trials:29 - Trial = 4965/30000 | Total reward = 49.11
2022-01-26 14:16:48.339 | DEBUG    | __main__:trials:24 - Trial = 4966/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.341 | DEBUG    | __main__:trials:29 - Trial = 4966/30000 | Total reward = 49.15
2022-01-26 14:16:48.345 | DEBUG    | __main__:trials:24 - Trial = 4967/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.346 | DEBUG    | __main__:trials:29 - Trial = 4967/30000 | Total reward = 49.06
2022-01-26 14:16:48.349 | DEBUG    | __main__:trials:24 - Trial = 4968/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.350 | DEBUG    | __main__:trials:29 - Trial = 4968/30000 | Total reward = 44.76
2022-01-26 14:16:48.354 | DEBUG    | __main__:trials:24 - Trial = 4969/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.356 | DEBUG    | __main__:trials:29 - Trial = 4969/30000 | Total reward = 47.42
2022-01-26 14:16:48.359 | DEBUG    | __main__:trials:24 - Trial = 4970/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.361 | DEBUG    | __main__:trials:29 - Trial = 4970/30000 | Total reward = 41.71
2022-01-26 14:16:48.363 | DEBUG    | __main__:trials:24 - Trial = 4971/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.365 | DEBUG    | __main__:trials:29 - Trial = 4971/30000 | Total reward = 50.81
2022-01-26 14:16:48.368 | DEBUG    | __main__:trials:24 - Trial = 4972/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.370 | DEBUG    | __main__:trials:29 - Trial = 4972/30000 | Total reward = 52.31
2022-01-26 14:16:48.374 | DEBUG    | __main__:trials:24 - Trial = 4973/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.374 | DEBUG    | __main__:trials:29 - Trial = 4973/30000 | Total reward = 41.49
2022-01-26 14:16:48.378 | DEBUG    | __main__:trials:24 - Trial = 4974/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.379 | DEBUG    | __main__:trials:29 - Trial = 4974/30000 | Total reward = 49.40
2022-01-26 14:16:48.383 | DEBUG    | __main__:trials:24 - Trial = 4975/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.385 | DEBUG    | __main__:trials:29 - Trial = 4975/30000 | Total reward = 49.78
2022-01-26 14:16:48.388 | DEBUG    | __main__:trials:24 - Trial = 4976/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.389 | DEBUG    | __main__:trials:29 - Trial = 4976/30000 | Total reward = 48.61
2022-01-26 14:16:48.394 | DEBUG    | __main__:trials:24 - Trial = 4977/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.395 | DEBUG    | __main__:trials:29 - Trial = 4977/30000 | Total reward = 47.08
2022-01-26 14:16:48.398 | DEBUG    | __main__:trials:24 - Trial = 4978/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.400 | DEBUG    | __main__:trials:29 - Trial = 4978/30000 | Total reward = 30.27
2022-01-26 14:16:48.403 | DEBUG    | __main__:trials:26 - Trial = 4979/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:48.404 | DEBUG    | __main__:trials:29 - Trial = 4979/30000 | Total reward = 15.30
2022-01-26 14:16:48.408 | DEBUG    | __main__:trials:24 - Trial = 4980/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.408 | DEBUG    | __main__:trials:29 - Trial = 4980/30000 | Total reward = 49.49
2022-01-26 14:16:48.413 | DEBUG    | __main__:trials:24 - Trial = 4981/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.414 | DEBUG    | __main__:trials:29 - Trial = 4981/30000 | Total reward = 47.42
2022-01-26 14:16:48.418 | DEBUG    | __main__:trials:24 - Trial = 4982/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.420 | DEBUG    | __main__:trials:29 - Trial = 4982/30000 | Total reward = 46.50
2022-01-26 14:16:48.423 | DEBUG    | __main__:trials:24 - Trial = 4983/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.424 | DEBUG    | __main__:trials:29 - Trial = 4983/30000 | Total reward = 39.78
2022-01-26 14:16:48.428 | DEBUG    | __main__:trials:24 - Trial = 4984/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.430 | DEBUG    | __main__:trials:29 - Trial = 4984/30000 | Total reward = 47.69
2022-01-26 14:16:48.434 | DEBUG    | __main__:trials:24 - Trial = 4985/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.435 | DEBUG    | __main__:trials:29 - Trial = 4985/30000 | Total reward = 51.60
2022-01-26 14:16:48.439 | DEBUG    | __main__:trials:24 - Trial = 4986/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.439 | DEBUG    | __main__:trials:29 - Trial = 4986/30000 | Total reward = 34.77
2022-01-26 14:16:48.443 | DEBUG    | __main__:trials:24 - Trial = 4987/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.445 | DEBUG    | __main__:trials:29 - Trial = 4987/30000 | Total reward = 66.48
2022-01-26 14:16:48.448 | DEBUG    | __main__:trials:24 - Trial = 4988/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.449 | DEBUG    | __main__:trials:29 - Trial = 4988/30000 | Total reward = 48.39
2022-01-26 14:16:48.453 | DEBUG    | __main__:trials:24 - Trial = 4989/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.454 | DEBUG    | __main__:trials:29 - Trial = 4989/30000 | Total reward = 41.20
2022-01-26 14:16:48.458 | DEBUG    | __main__:trials:24 - Trial = 4990/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.460 | DEBUG    | __main__:trials:29 - Trial = 4990/30000 | Total reward = 44.75
2022-01-26 14:16:48.463 | DEBUG    | __main__:trials:24 - Trial = 4991/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.465 | DEBUG    | __main__:trials:29 - Trial = 4991/30000 | Total reward = 49.25
2022-01-26 14:16:48.468 | DEBUG    | __main__:trials:24 - Trial = 4992/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.470 | DEBUG    | __main__:trials:29 - Trial = 4992/30000 | Total reward = 53.42
2022-01-26 14:16:48.473 | DEBUG    | __main__:trials:24 - Trial = 4993/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.474 | DEBUG    | __main__:trials:29 - Trial = 4993/30000 | Total reward = 48.53
2022-01-26 14:16:48.478 | DEBUG    | __main__:trials:24 - Trial = 4994/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.480 | DEBUG    | __main__:trials:29 - Trial = 4994/30000 | Total reward = 36.10
2022-01-26 14:16:48.483 | DEBUG    | __main__:trials:24 - Trial = 4995/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.485 | DEBUG    | __main__:trials:29 - Trial = 4995/30000 | Total reward = 51.76
2022-01-26 14:16:48.488 | DEBUG    | __main__:trials:24 - Trial = 4996/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.490 | DEBUG    | __main__:trials:29 - Trial = 4996/30000 | Total reward = 49.16
2022-01-26 14:16:48.493 | DEBUG    | __main__:trials:26 - Trial = 4997/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:48.495 | DEBUG    | __main__:trials:29 - Trial = 4997/30000 | Total reward = 27.74
2022-01-26 14:16:48.499 | DEBUG    | __main__:trials:24 - Trial = 4998/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.500 | DEBUG    | __main__:trials:29 - Trial = 4998/30000 | Total reward = 53.24
2022-01-26 14:16:48.503 | DEBUG    | __main__:trials:24 - Trial = 4999/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.505 | DEBUG    | __main__:trials:29 - Trial = 4999/30000 | Total reward = 52.73
2022-01-26 14:16:48.508 | DEBUG    | __main__:trials:24 - Trial = 5000/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.509 | DEBUG    | __main__:trials:29 - Trial = 5000/30000 | Total reward = 29.97
2022-01-26 14:16:48.513 | DEBUG    | __main__:trials:24 - Trial = 5001/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.514 | DEBUG    | __main__:trials:29 - Trial = 5001/30000 | Total reward = 44.17
2022-01-26 14:16:48.519 | DEBUG    | __main__:trials:24 - Trial = 5002/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.519 | DEBUG    | __main__:trials:29 - Trial = 5002/30000 | Total reward = 50.19
2022-01-26 14:16:48.524 | DEBUG    | __main__:trials:24 - Trial = 5003/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.525 | DEBUG    | __main__:trials:29 - Trial = 5003/30000 | Total reward = 46.56
2022-01-26 14:16:48.529 | DEBUG    | __main__:trials:24 - Trial = 5004/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.530 | DEBUG    | __main__:trials:29 - Trial = 5004/30000 | Total reward = 46.74
2022-01-26 14:16:48.534 | DEBUG    | __main__:trials:24 - Trial = 5005/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.536 | DEBUG    | __main__:trials:29 - Trial = 5005/30000 | Total reward = 49.40
2022-01-26 14:16:48.539 | DEBUG    | __main__:trials:24 - Trial = 5006/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.541 | DEBUG    | __main__:trials:29 - Trial = 5006/30000 | Total reward = 43.91
2022-01-26 14:16:48.544 | DEBUG    | __main__:trials:24 - Trial = 5007/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.545 | DEBUG    | __main__:trials:29 - Trial = 5007/30000 | Total reward = 46.74
2022-01-26 14:16:48.549 | DEBUG    | __main__:trials:24 - Trial = 5008/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.550 | DEBUG    | __main__:trials:29 - Trial = 5008/30000 | Total reward = 44.34
2022-01-26 14:16:48.554 | DEBUG    | __main__:trials:24 - Trial = 5009/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.554 | DEBUG    | __main__:trials:29 - Trial = 5009/30000 | Total reward = 36.48
2022-01-26 14:16:48.558 | DEBUG    | __main__:trials:24 - Trial = 5010/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.559 | DEBUG    | __main__:trials:29 - Trial = 5010/30000 | Total reward = 51.49
2022-01-26 14:16:48.564 | DEBUG    | __main__:trials:24 - Trial = 5011/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.565 | DEBUG    | __main__:trials:29 - Trial = 5011/30000 | Total reward = 35.63
2022-01-26 14:16:48.568 | DEBUG    | __main__:trials:24 - Trial = 5012/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.570 | DEBUG    | __main__:trials:29 - Trial = 5012/30000 | Total reward = 46.98
2022-01-26 14:16:48.573 | DEBUG    | __main__:trials:24 - Trial = 5013/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.574 | DEBUG    | __main__:trials:29 - Trial = 5013/30000 | Total reward = 55.42
2022-01-26 14:16:48.578 | DEBUG    | __main__:trials:24 - Trial = 5014/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.579 | DEBUG    | __main__:trials:29 - Trial = 5014/30000 | Total reward = 44.73
2022-01-26 14:16:48.583 | DEBUG    | __main__:trials:24 - Trial = 5015/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.584 | DEBUG    | __main__:trials:29 - Trial = 5015/30000 | Total reward = 45.68
2022-01-26 14:16:48.587 | DEBUG    | __main__:trials:24 - Trial = 5016/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.589 | DEBUG    | __main__:trials:29 - Trial = 5016/30000 | Total reward = 43.98
2022-01-26 14:16:48.592 | DEBUG    | __main__:trials:24 - Trial = 5017/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.594 | DEBUG    | __main__:trials:29 - Trial = 5017/30000 | Total reward = 49.30
2022-01-26 14:16:48.597 | DEBUG    | __main__:trials:24 - Trial = 5018/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.598 | DEBUG    | __main__:trials:29 - Trial = 5018/30000 | Total reward = 50.06
2022-01-26 14:16:48.602 | DEBUG    | __main__:trials:24 - Trial = 5019/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.603 | DEBUG    | __main__:trials:29 - Trial = 5019/30000 | Total reward = 45.27
2022-01-26 14:16:48.607 | DEBUG    | __main__:trials:24 - Trial = 5020/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.608 | DEBUG    | __main__:trials:29 - Trial = 5020/30000 | Total reward = 40.79
2022-01-26 14:16:48.612 | DEBUG    | __main__:trials:24 - Trial = 5021/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.614 | DEBUG    | __main__:trials:29 - Trial = 5021/30000 | Total reward = 49.79
2022-01-26 14:16:48.617 | DEBUG    | __main__:trials:24 - Trial = 5022/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.618 | DEBUG    | __main__:trials:29 - Trial = 5022/30000 | Total reward = 49.45
2022-01-26 14:16:48.622 | DEBUG    | __main__:trials:24 - Trial = 5023/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.624 | DEBUG    | __main__:trials:29 - Trial = 5023/30000 | Total reward = 46.54
2022-01-26 14:16:48.628 | DEBUG    | __main__:trials:24 - Trial = 5024/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.629 | DEBUG    | __main__:trials:29 - Trial = 5024/30000 | Total reward = 51.02
2022-01-26 14:16:48.633 | DEBUG    | __main__:trials:24 - Trial = 5025/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.633 | DEBUG    | __main__:trials:29 - Trial = 5025/30000 | Total reward = 54.28
2022-01-26 14:16:48.638 | DEBUG    | __main__:trials:24 - Trial = 5026/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.639 | DEBUG    | __main__:trials:29 - Trial = 5026/30000 | Total reward = 46.44
2022-01-26 14:16:48.643 | DEBUG    | __main__:trials:24 - Trial = 5027/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.644 | DEBUG    | __main__:trials:29 - Trial = 5027/30000 | Total reward = 52.16
2022-01-26 14:16:48.649 | DEBUG    | __main__:trials:24 - Trial = 5028/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.649 | DEBUG    | __main__:trials:29 - Trial = 5028/30000 | Total reward = 52.72
2022-01-26 14:16:48.652 | DEBUG    | __main__:trials:24 - Trial = 5029/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.654 | DEBUG    | __main__:trials:29 - Trial = 5029/30000 | Total reward = 48.78
2022-01-26 14:16:48.658 | DEBUG    | __main__:trials:24 - Trial = 5030/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.658 | DEBUG    | __main__:trials:29 - Trial = 5030/30000 | Total reward = 43.38
2022-01-26 14:16:48.662 | DEBUG    | __main__:trials:24 - Trial = 5031/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.662 | DEBUG    | __main__:trials:29 - Trial = 5031/30000 | Total reward = 47.33
2022-01-26 14:16:48.666 | DEBUG    | __main__:trials:24 - Trial = 5032/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.668 | DEBUG    | __main__:trials:29 - Trial = 5032/30000 | Total reward = 54.06
2022-01-26 14:16:48.671 | DEBUG    | __main__:trials:24 - Trial = 5033/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.672 | DEBUG    | __main__:trials:29 - Trial = 5033/30000 | Total reward = 48.82
2022-01-26 14:16:48.675 | DEBUG    | __main__:trials:24 - Trial = 5034/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.677 | DEBUG    | __main__:trials:29 - Trial = 5034/30000 | Total reward = 30.52
2022-01-26 14:16:48.680 | DEBUG    | __main__:trials:24 - Trial = 5035/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.682 | DEBUG    | __main__:trials:29 - Trial = 5035/30000 | Total reward = 49.11
2022-01-26 14:16:48.685 | DEBUG    | __main__:trials:24 - Trial = 5036/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.687 | DEBUG    | __main__:trials:29 - Trial = 5036/30000 | Total reward = 48.52
2022-01-26 14:16:48.691 | DEBUG    | __main__:trials:24 - Trial = 5037/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.692 | DEBUG    | __main__:trials:29 - Trial = 5037/30000 | Total reward = 49.02
2022-01-26 14:16:48.696 | DEBUG    | __main__:trials:24 - Trial = 5038/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.698 | DEBUG    | __main__:trials:29 - Trial = 5038/30000 | Total reward = 48.78
2022-01-26 14:16:48.701 | DEBUG    | __main__:trials:24 - Trial = 5039/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.702 | DEBUG    | __main__:trials:29 - Trial = 5039/30000 | Total reward = 49.25
2022-01-26 14:16:48.706 | DEBUG    | __main__:trials:24 - Trial = 5040/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.708 | DEBUG    | __main__:trials:29 - Trial = 5040/30000 | Total reward = 48.45
2022-01-26 14:16:48.711 | DEBUG    | __main__:trials:24 - Trial = 5041/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.713 | DEBUG    | __main__:trials:29 - Trial = 5041/30000 | Total reward = 40.18
2022-01-26 14:16:48.716 | DEBUG    | __main__:trials:24 - Trial = 5042/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.718 | DEBUG    | __main__:trials:29 - Trial = 5042/30000 | Total reward = 45.70
2022-01-26 14:16:48.722 | DEBUG    | __main__:trials:24 - Trial = 5043/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.723 | DEBUG    | __main__:trials:29 - Trial = 5043/30000 | Total reward = 51.44
2022-01-26 14:16:48.727 | DEBUG    | __main__:trials:24 - Trial = 5044/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.728 | DEBUG    | __main__:trials:29 - Trial = 5044/30000 | Total reward = 56.63
2022-01-26 14:16:48.732 | DEBUG    | __main__:trials:24 - Trial = 5045/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.734 | DEBUG    | __main__:trials:29 - Trial = 5045/30000 | Total reward = 46.03
2022-01-26 14:16:48.737 | DEBUG    | __main__:trials:24 - Trial = 5046/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.738 | DEBUG    | __main__:trials:29 - Trial = 5046/30000 | Total reward = 48.02
2022-01-26 14:16:48.743 | DEBUG    | __main__:trials:24 - Trial = 5047/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.745 | DEBUG    | __main__:trials:29 - Trial = 5047/30000 | Total reward = 38.58
2022-01-26 14:16:48.748 | DEBUG    | __main__:trials:24 - Trial = 5048/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.749 | DEBUG    | __main__:trials:29 - Trial = 5048/30000 | Total reward = 52.81
2022-01-26 14:16:48.752 | DEBUG    | __main__:trials:24 - Trial = 5049/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.754 | DEBUG    | __main__:trials:29 - Trial = 5049/30000 | Total reward = 44.98
2022-01-26 14:16:48.758 | DEBUG    | __main__:trials:24 - Trial = 5050/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.759 | DEBUG    | __main__:trials:29 - Trial = 5050/30000 | Total reward = 54.82
2022-01-26 14:16:48.763 | DEBUG    | __main__:trials:24 - Trial = 5051/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.765 | DEBUG    | __main__:trials:29 - Trial = 5051/30000 | Total reward = 52.27
2022-01-26 14:16:48.768 | DEBUG    | __main__:trials:24 - Trial = 5052/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.769 | DEBUG    | __main__:trials:29 - Trial = 5052/30000 | Total reward = 58.23
2022-01-26 14:16:48.773 | DEBUG    | __main__:trials:24 - Trial = 5053/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.774 | DEBUG    | __main__:trials:29 - Trial = 5053/30000 | Total reward = 48.94
2022-01-26 14:16:48.778 | DEBUG    | __main__:trials:24 - Trial = 5054/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.778 | DEBUG    | __main__:trials:29 - Trial = 5054/30000 | Total reward = 40.66
2022-01-26 14:16:48.782 | DEBUG    | __main__:trials:24 - Trial = 5055/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.784 | DEBUG    | __main__:trials:29 - Trial = 5055/30000 | Total reward = 45.16
2022-01-26 14:16:48.787 | DEBUG    | __main__:trials:24 - Trial = 5056/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.789 | DEBUG    | __main__:trials:29 - Trial = 5056/30000 | Total reward = 52.36
2022-01-26 14:16:48.793 | DEBUG    | __main__:trials:24 - Trial = 5057/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.794 | DEBUG    | __main__:trials:29 - Trial = 5057/30000 | Total reward = 40.73
2022-01-26 14:16:48.798 | DEBUG    | __main__:trials:24 - Trial = 5058/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.799 | DEBUG    | __main__:trials:29 - Trial = 5058/30000 | Total reward = 55.32
2022-01-26 14:16:48.803 | DEBUG    | __main__:trials:24 - Trial = 5059/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.804 | DEBUG    | __main__:trials:29 - Trial = 5059/30000 | Total reward = 47.90
2022-01-26 14:16:48.808 | DEBUG    | __main__:trials:24 - Trial = 5060/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.809 | DEBUG    | __main__:trials:29 - Trial = 5060/30000 | Total reward = 50.52
2022-01-26 14:16:48.813 | DEBUG    | __main__:trials:24 - Trial = 5061/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.815 | DEBUG    | __main__:trials:29 - Trial = 5061/30000 | Total reward = 52.51
2022-01-26 14:16:48.818 | DEBUG    | __main__:trials:24 - Trial = 5062/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.820 | DEBUG    | __main__:trials:29 - Trial = 5062/30000 | Total reward = 41.30
2022-01-26 14:16:48.824 | DEBUG    | __main__:trials:24 - Trial = 5063/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.824 | DEBUG    | __main__:trials:29 - Trial = 5063/30000 | Total reward = 52.85
2022-01-26 14:16:48.829 | DEBUG    | __main__:trials:24 - Trial = 5064/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.830 | DEBUG    | __main__:trials:29 - Trial = 5064/30000 | Total reward = 53.45
2022-01-26 14:16:48.834 | DEBUG    | __main__:trials:24 - Trial = 5065/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.836 | DEBUG    | __main__:trials:29 - Trial = 5065/30000 | Total reward = 46.07
2022-01-26 14:16:48.839 | DEBUG    | __main__:trials:24 - Trial = 5066/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.841 | DEBUG    | __main__:trials:29 - Trial = 5066/30000 | Total reward = 48.32
2022-01-26 14:16:48.844 | DEBUG    | __main__:trials:24 - Trial = 5067/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.846 | DEBUG    | __main__:trials:29 - Trial = 5067/30000 | Total reward = 45.70
2022-01-26 14:16:48.849 | DEBUG    | __main__:trials:24 - Trial = 5068/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.851 | DEBUG    | __main__:trials:29 - Trial = 5068/30000 | Total reward = 41.22
2022-01-26 14:16:48.854 | DEBUG    | __main__:trials:24 - Trial = 5069/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.856 | DEBUG    | __main__:trials:29 - Trial = 5069/30000 | Total reward = 54.27
2022-01-26 14:16:48.859 | DEBUG    | __main__:trials:24 - Trial = 5070/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.859 | DEBUG    | __main__:trials:29 - Trial = 5070/30000 | Total reward = 57.91
2022-01-26 14:16:48.863 | DEBUG    | __main__:trials:24 - Trial = 5071/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.863 | DEBUG    | __main__:trials:29 - Trial = 5071/30000 | Total reward = 53.34
2022-01-26 14:16:48.867 | DEBUG    | __main__:trials:24 - Trial = 5072/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.867 | DEBUG    | __main__:trials:29 - Trial = 5072/30000 | Total reward = 44.93
2022-01-26 14:16:48.871 | DEBUG    | __main__:trials:24 - Trial = 5073/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.871 | DEBUG    | __main__:trials:29 - Trial = 5073/30000 | Total reward = 50.97
2022-01-26 14:16:48.875 | DEBUG    | __main__:trials:24 - Trial = 5074/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.876 | DEBUG    | __main__:trials:29 - Trial = 5074/30000 | Total reward = 52.79
2022-01-26 14:16:48.880 | DEBUG    | __main__:trials:24 - Trial = 5075/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.882 | DEBUG    | __main__:trials:29 - Trial = 5075/30000 | Total reward = 51.05
2022-01-26 14:16:48.885 | DEBUG    | __main__:trials:24 - Trial = 5076/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.887 | DEBUG    | __main__:trials:29 - Trial = 5076/30000 | Total reward = 50.29
2022-01-26 14:16:48.890 | DEBUG    | __main__:trials:24 - Trial = 5077/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.891 | DEBUG    | __main__:trials:29 - Trial = 5077/30000 | Total reward = 41.39
2022-01-26 14:16:48.894 | DEBUG    | __main__:trials:24 - Trial = 5078/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.896 | DEBUG    | __main__:trials:29 - Trial = 5078/30000 | Total reward = 47.44
2022-01-26 14:16:48.900 | DEBUG    | __main__:trials:24 - Trial = 5079/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.901 | DEBUG    | __main__:trials:29 - Trial = 5079/30000 | Total reward = 25.08
2022-01-26 14:16:48.905 | DEBUG    | __main__:trials:24 - Trial = 5080/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.906 | DEBUG    | __main__:trials:29 - Trial = 5080/30000 | Total reward = 57.68
2022-01-26 14:16:48.910 | DEBUG    | __main__:trials:24 - Trial = 5081/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.912 | DEBUG    | __main__:trials:29 - Trial = 5081/30000 | Total reward = 49.00
2022-01-26 14:16:48.916 | DEBUG    | __main__:trials:24 - Trial = 5082/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.917 | DEBUG    | __main__:trials:29 - Trial = 5082/30000 | Total reward = 49.74
2022-01-26 14:16:48.921 | DEBUG    | __main__:trials:24 - Trial = 5083/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.922 | DEBUG    | __main__:trials:29 - Trial = 5083/30000 | Total reward = 18.07
2022-01-26 14:16:48.926 | DEBUG    | __main__:trials:24 - Trial = 5084/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.928 | DEBUG    | __main__:trials:29 - Trial = 5084/30000 | Total reward = 57.32
2022-01-26 14:16:48.932 | DEBUG    | __main__:trials:24 - Trial = 5085/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.934 | DEBUG    | __main__:trials:29 - Trial = 5085/30000 | Total reward = 24.69
2022-01-26 14:16:48.937 | DEBUG    | __main__:trials:24 - Trial = 5086/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.938 | DEBUG    | __main__:trials:29 - Trial = 5086/30000 | Total reward = 54.70
2022-01-26 14:16:48.942 | DEBUG    | __main__:trials:24 - Trial = 5087/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.943 | DEBUG    | __main__:trials:29 - Trial = 5087/30000 | Total reward = 48.91
2022-01-26 14:16:48.947 | DEBUG    | __main__:trials:24 - Trial = 5088/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.949 | DEBUG    | __main__:trials:29 - Trial = 5088/30000 | Total reward = 47.79
2022-01-26 14:16:48.952 | DEBUG    | __main__:trials:24 - Trial = 5089/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.953 | DEBUG    | __main__:trials:29 - Trial = 5089/30000 | Total reward = 34.74
2022-01-26 14:16:48.956 | DEBUG    | __main__:trials:24 - Trial = 5090/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.957 | DEBUG    | __main__:trials:29 - Trial = 5090/30000 | Total reward = 51.74
2022-01-26 14:16:48.962 | DEBUG    | __main__:trials:24 - Trial = 5091/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.963 | DEBUG    | __main__:trials:29 - Trial = 5091/30000 | Total reward = 54.75
2022-01-26 14:16:48.967 | DEBUG    | __main__:trials:24 - Trial = 5092/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.969 | DEBUG    | __main__:trials:29 - Trial = 5092/30000 | Total reward = 52.03
2022-01-26 14:16:48.972 | DEBUG    | __main__:trials:24 - Trial = 5093/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.974 | DEBUG    | __main__:trials:29 - Trial = 5093/30000 | Total reward = 53.08
2022-01-26 14:16:48.977 | DEBUG    | __main__:trials:24 - Trial = 5094/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.978 | DEBUG    | __main__:trials:29 - Trial = 5094/30000 | Total reward = 49.73
2022-01-26 14:16:48.983 | DEBUG    | __main__:trials:24 - Trial = 5095/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.983 | DEBUG    | __main__:trials:29 - Trial = 5095/30000 | Total reward = 42.19
2022-01-26 14:16:48.988 | DEBUG    | __main__:trials:24 - Trial = 5096/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.989 | DEBUG    | __main__:trials:29 - Trial = 5096/30000 | Total reward = 53.20
2022-01-26 14:16:48.993 | DEBUG    | __main__:trials:24 - Trial = 5097/30000 | Max number of steps (20) reached
2022-01-26 14:16:48.994 | DEBUG    | __main__:trials:29 - Trial = 5097/30000 | Total reward = 43.00
2022-01-26 14:16:48.998 | DEBUG    | __main__:trials:24 - Trial = 5098/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.000 | DEBUG    | __main__:trials:29 - Trial = 5098/30000 | Total reward = 49.63
2022-01-26 14:16:49.003 | DEBUG    | __main__:trials:24 - Trial = 5099/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.005 | DEBUG    | __main__:trials:29 - Trial = 5099/30000 | Total reward = 43.97
2022-01-26 14:16:49.008 | DEBUG    | __main__:trials:24 - Trial = 5100/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.009 | DEBUG    | __main__:trials:29 - Trial = 5100/30000 | Total reward = 20.51
2022-01-26 14:16:49.013 | DEBUG    | __main__:trials:24 - Trial = 5101/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.014 | DEBUG    | __main__:trials:29 - Trial = 5101/30000 | Total reward = 49.14
2022-01-26 14:16:49.018 | DEBUG    | __main__:trials:24 - Trial = 5102/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.020 | DEBUG    | __main__:trials:29 - Trial = 5102/30000 | Total reward = 36.61
2022-01-26 14:16:49.023 | DEBUG    | __main__:trials:24 - Trial = 5103/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.024 | DEBUG    | __main__:trials:29 - Trial = 5103/30000 | Total reward = 47.26
2022-01-26 14:16:49.028 | DEBUG    | __main__:trials:24 - Trial = 5104/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.029 | DEBUG    | __main__:trials:29 - Trial = 5104/30000 | Total reward = 39.43
2022-01-26 14:16:49.034 | DEBUG    | __main__:trials:24 - Trial = 5105/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.034 | DEBUG    | __main__:trials:29 - Trial = 5105/30000 | Total reward = 36.37
2022-01-26 14:16:49.039 | DEBUG    | __main__:trials:24 - Trial = 5106/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.040 | DEBUG    | __main__:trials:29 - Trial = 5106/30000 | Total reward = 47.53
2022-01-26 14:16:49.044 | DEBUG    | __main__:trials:24 - Trial = 5107/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.045 | DEBUG    | __main__:trials:29 - Trial = 5107/30000 | Total reward = 44.39
2022-01-26 14:16:49.049 | DEBUG    | __main__:trials:24 - Trial = 5108/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.051 | DEBUG    | __main__:trials:29 - Trial = 5108/30000 | Total reward = 51.02
2022-01-26 14:16:49.054 | DEBUG    | __main__:trials:24 - Trial = 5109/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.055 | DEBUG    | __main__:trials:29 - Trial = 5109/30000 | Total reward = 46.67
2022-01-26 14:16:49.059 | DEBUG    | __main__:trials:24 - Trial = 5110/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.061 | DEBUG    | __main__:trials:29 - Trial = 5110/30000 | Total reward = 41.92
2022-01-26 14:16:49.065 | DEBUG    | __main__:trials:24 - Trial = 5111/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.067 | DEBUG    | __main__:trials:29 - Trial = 5111/30000 | Total reward = 54.97
2022-01-26 14:16:49.070 | DEBUG    | __main__:trials:24 - Trial = 5112/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.071 | DEBUG    | __main__:trials:29 - Trial = 5112/30000 | Total reward = 49.41
2022-01-26 14:16:49.076 | DEBUG    | __main__:trials:24 - Trial = 5113/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.077 | DEBUG    | __main__:trials:29 - Trial = 5113/30000 | Total reward = 42.25
2022-01-26 14:16:49.080 | DEBUG    | __main__:trials:24 - Trial = 5114/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.081 | DEBUG    | __main__:trials:29 - Trial = 5114/30000 | Total reward = 48.19
2022-01-26 14:16:49.086 | DEBUG    | __main__:trials:24 - Trial = 5115/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.087 | DEBUG    | __main__:trials:29 - Trial = 5115/30000 | Total reward = 35.53
2022-01-26 14:16:49.091 | DEBUG    | __main__:trials:24 - Trial = 5116/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.093 | DEBUG    | __main__:trials:29 - Trial = 5116/30000 | Total reward = 28.55
2022-01-26 14:16:49.096 | DEBUG    | __main__:trials:24 - Trial = 5117/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.098 | DEBUG    | __main__:trials:29 - Trial = 5117/30000 | Total reward = 41.04
2022-01-26 14:16:49.102 | DEBUG    | __main__:trials:24 - Trial = 5118/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.102 | DEBUG    | __main__:trials:29 - Trial = 5118/30000 | Total reward = 52.92
2022-01-26 14:16:49.106 | DEBUG    | __main__:trials:24 - Trial = 5119/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.107 | DEBUG    | __main__:trials:29 - Trial = 5119/30000 | Total reward = 54.28
2022-01-26 14:16:49.112 | DEBUG    | __main__:trials:24 - Trial = 5120/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.112 | DEBUG    | __main__:trials:29 - Trial = 5120/30000 | Total reward = 43.38
2022-01-26 14:16:49.117 | DEBUG    | __main__:trials:24 - Trial = 5121/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.118 | DEBUG    | __main__:trials:29 - Trial = 5121/30000 | Total reward = 48.14
2022-01-26 14:16:49.122 | DEBUG    | __main__:trials:24 - Trial = 5122/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.123 | DEBUG    | __main__:trials:29 - Trial = 5122/30000 | Total reward = 50.44
2022-01-26 14:16:49.127 | DEBUG    | __main__:trials:24 - Trial = 5123/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.128 | DEBUG    | __main__:trials:29 - Trial = 5123/30000 | Total reward = 51.02
2022-01-26 14:16:49.132 | DEBUG    | __main__:trials:24 - Trial = 5124/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.133 | DEBUG    | __main__:trials:29 - Trial = 5124/30000 | Total reward = 47.92
2022-01-26 14:16:49.137 | DEBUG    | __main__:trials:24 - Trial = 5125/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.138 | DEBUG    | __main__:trials:29 - Trial = 5125/30000 | Total reward = 53.68
2022-01-26 14:16:49.143 | DEBUG    | __main__:trials:24 - Trial = 5126/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.143 | DEBUG    | __main__:trials:29 - Trial = 5126/30000 | Total reward = 36.52
2022-01-26 14:16:49.147 | DEBUG    | __main__:trials:26 - Trial = 5127/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.149 | DEBUG    | __main__:trials:29 - Trial = 5127/30000 | Total reward = 34.87
2022-01-26 14:16:49.152 | DEBUG    | __main__:trials:24 - Trial = 5128/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.153 | DEBUG    | __main__:trials:29 - Trial = 5128/30000 | Total reward = 51.02
2022-01-26 14:16:49.157 | DEBUG    | __main__:trials:24 - Trial = 5129/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.158 | DEBUG    | __main__:trials:29 - Trial = 5129/30000 | Total reward = 35.83
2022-01-26 14:16:49.162 | DEBUG    | __main__:trials:24 - Trial = 5130/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.163 | DEBUG    | __main__:trials:29 - Trial = 5130/30000 | Total reward = 49.87
2022-01-26 14:16:49.167 | DEBUG    | __main__:trials:24 - Trial = 5131/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.169 | DEBUG    | __main__:trials:29 - Trial = 5131/30000 | Total reward = 53.48
2022-01-26 14:16:49.172 | DEBUG    | __main__:trials:24 - Trial = 5132/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.173 | DEBUG    | __main__:trials:29 - Trial = 5132/30000 | Total reward = 48.59
2022-01-26 14:16:49.176 | DEBUG    | __main__:trials:24 - Trial = 5133/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.177 | DEBUG    | __main__:trials:29 - Trial = 5133/30000 | Total reward = 51.12
2022-01-26 14:16:49.181 | DEBUG    | __main__:trials:24 - Trial = 5134/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.182 | DEBUG    | __main__:trials:29 - Trial = 5134/30000 | Total reward = 49.71
2022-01-26 14:16:49.186 | DEBUG    | __main__:trials:24 - Trial = 5135/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.188 | DEBUG    | __main__:trials:29 - Trial = 5135/30000 | Total reward = 51.02
2022-01-26 14:16:49.190 | DEBUG    | __main__:trials:24 - Trial = 5136/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.192 | DEBUG    | __main__:trials:29 - Trial = 5136/30000 | Total reward = 31.33
2022-01-26 14:16:49.196 | DEBUG    | __main__:trials:24 - Trial = 5137/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.197 | DEBUG    | __main__:trials:29 - Trial = 5137/30000 | Total reward = 46.31
2022-01-26 14:16:49.200 | DEBUG    | __main__:trials:24 - Trial = 5138/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.202 | DEBUG    | __main__:trials:29 - Trial = 5138/30000 | Total reward = 52.70
2022-01-26 14:16:49.206 | DEBUG    | __main__:trials:24 - Trial = 5139/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.207 | DEBUG    | __main__:trials:29 - Trial = 5139/30000 | Total reward = 50.12
2022-01-26 14:16:49.211 | DEBUG    | __main__:trials:24 - Trial = 5140/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.212 | DEBUG    | __main__:trials:29 - Trial = 5140/30000 | Total reward = 48.70
2022-01-26 14:16:49.216 | DEBUG    | __main__:trials:24 - Trial = 5141/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.218 | DEBUG    | __main__:trials:29 - Trial = 5141/30000 | Total reward = 56.97
2022-01-26 14:16:49.222 | DEBUG    | __main__:trials:24 - Trial = 5142/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.222 | DEBUG    | __main__:trials:29 - Trial = 5142/30000 | Total reward = 39.51
2022-01-26 14:16:49.226 | DEBUG    | __main__:trials:24 - Trial = 5143/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.227 | DEBUG    | __main__:trials:29 - Trial = 5143/30000 | Total reward = 50.33
2022-01-26 14:16:49.232 | DEBUG    | __main__:trials:24 - Trial = 5144/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.232 | DEBUG    | __main__:trials:29 - Trial = 5144/30000 | Total reward = 58.90
2022-01-26 14:16:49.237 | DEBUG    | __main__:trials:24 - Trial = 5145/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.238 | DEBUG    | __main__:trials:29 - Trial = 5145/30000 | Total reward = 51.48
2022-01-26 14:16:49.241 | DEBUG    | __main__:trials:26 - Trial = 5146/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.242 | DEBUG    | __main__:trials:29 - Trial = 5146/30000 | Total reward = 26.06
2022-01-26 14:16:49.246 | DEBUG    | __main__:trials:24 - Trial = 5147/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.247 | DEBUG    | __main__:trials:29 - Trial = 5147/30000 | Total reward = 44.35
2022-01-26 14:16:49.251 | DEBUG    | __main__:trials:24 - Trial = 5148/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.253 | DEBUG    | __main__:trials:29 - Trial = 5148/30000 | Total reward = 48.47
2022-01-26 14:16:49.257 | DEBUG    | __main__:trials:24 - Trial = 5149/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.258 | DEBUG    | __main__:trials:29 - Trial = 5149/30000 | Total reward = 49.71
2022-01-26 14:16:49.262 | DEBUG    | __main__:trials:24 - Trial = 5150/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.263 | DEBUG    | __main__:trials:29 - Trial = 5150/30000 | Total reward = 51.30
2022-01-26 14:16:49.267 | DEBUG    | __main__:trials:24 - Trial = 5151/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.268 | DEBUG    | __main__:trials:29 - Trial = 5151/30000 | Total reward = 49.45
2022-01-26 14:16:49.272 | DEBUG    | __main__:trials:24 - Trial = 5152/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.274 | DEBUG    | __main__:trials:29 - Trial = 5152/30000 | Total reward = 50.23
2022-01-26 14:16:49.278 | DEBUG    | __main__:trials:24 - Trial = 5153/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.279 | DEBUG    | __main__:trials:29 - Trial = 5153/30000 | Total reward = 47.14
2022-01-26 14:16:49.283 | DEBUG    | __main__:trials:24 - Trial = 5154/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.284 | DEBUG    | __main__:trials:29 - Trial = 5154/30000 | Total reward = 54.15
2022-01-26 14:16:49.288 | DEBUG    | __main__:trials:24 - Trial = 5155/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.289 | DEBUG    | __main__:trials:29 - Trial = 5155/30000 | Total reward = 37.80
2022-01-26 14:16:49.294 | DEBUG    | __main__:trials:24 - Trial = 5156/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.295 | DEBUG    | __main__:trials:29 - Trial = 5156/30000 | Total reward = 50.47
2022-01-26 14:16:49.298 | DEBUG    | __main__:trials:24 - Trial = 5157/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.300 | DEBUG    | __main__:trials:29 - Trial = 5157/30000 | Total reward = 47.96
2022-01-26 14:16:49.303 | DEBUG    | __main__:trials:24 - Trial = 5158/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.305 | DEBUG    | __main__:trials:29 - Trial = 5158/30000 | Total reward = 52.86
2022-01-26 14:16:49.309 | DEBUG    | __main__:trials:24 - Trial = 5159/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.310 | DEBUG    | __main__:trials:29 - Trial = 5159/30000 | Total reward = 43.06
2022-01-26 14:16:49.314 | DEBUG    | __main__:trials:24 - Trial = 5160/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.315 | DEBUG    | __main__:trials:29 - Trial = 5160/30000 | Total reward = 45.10
2022-01-26 14:16:49.319 | DEBUG    | __main__:trials:26 - Trial = 5161/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.321 | DEBUG    | __main__:trials:29 - Trial = 5161/30000 | Total reward = 27.32
2022-01-26 14:16:49.324 | DEBUG    | __main__:trials:26 - Trial = 5162/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.325 | DEBUG    | __main__:trials:29 - Trial = 5162/30000 | Total reward = 27.32
2022-01-26 14:16:49.329 | DEBUG    | __main__:trials:24 - Trial = 5163/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.330 | DEBUG    | __main__:trials:29 - Trial = 5163/30000 | Total reward = 50.10
2022-01-26 14:16:49.334 | DEBUG    | __main__:trials:24 - Trial = 5164/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.336 | DEBUG    | __main__:trials:29 - Trial = 5164/30000 | Total reward = 61.08
2022-01-26 14:16:49.340 | DEBUG    | __main__:trials:24 - Trial = 5165/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.340 | DEBUG    | __main__:trials:29 - Trial = 5165/30000 | Total reward = 49.44
2022-01-26 14:16:49.345 | DEBUG    | __main__:trials:24 - Trial = 5166/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.346 | DEBUG    | __main__:trials:29 - Trial = 5166/30000 | Total reward = 45.51
2022-01-26 14:16:49.350 | DEBUG    | __main__:trials:24 - Trial = 5167/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.351 | DEBUG    | __main__:trials:29 - Trial = 5167/30000 | Total reward = 49.47
2022-01-26 14:16:49.355 | DEBUG    | __main__:trials:24 - Trial = 5168/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.356 | DEBUG    | __main__:trials:29 - Trial = 5168/30000 | Total reward = 49.91
2022-01-26 14:16:49.359 | DEBUG    | __main__:trials:24 - Trial = 5169/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.361 | DEBUG    | __main__:trials:29 - Trial = 5169/30000 | Total reward = 49.29
2022-01-26 14:16:49.364 | DEBUG    | __main__:trials:24 - Trial = 5170/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.366 | DEBUG    | __main__:trials:29 - Trial = 5170/30000 | Total reward = 37.09
2022-01-26 14:16:49.369 | DEBUG    | __main__:trials:24 - Trial = 5171/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.371 | DEBUG    | __main__:trials:29 - Trial = 5171/30000 | Total reward = 43.06
2022-01-26 14:16:49.374 | DEBUG    | __main__:trials:24 - Trial = 5172/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.376 | DEBUG    | __main__:trials:29 - Trial = 5172/30000 | Total reward = 59.47
2022-01-26 14:16:49.379 | DEBUG    | __main__:trials:26 - Trial = 5173/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.380 | DEBUG    | __main__:trials:29 - Trial = 5173/30000 | Total reward = 18.64
2022-01-26 14:16:49.384 | DEBUG    | __main__:trials:24 - Trial = 5174/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.386 | DEBUG    | __main__:trials:29 - Trial = 5174/30000 | Total reward = 40.11
2022-01-26 14:16:49.389 | DEBUG    | __main__:trials:24 - Trial = 5175/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.390 | DEBUG    | __main__:trials:29 - Trial = 5175/30000 | Total reward = 53.38
2022-01-26 14:16:49.394 | DEBUG    | __main__:trials:26 - Trial = 5176/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.395 | DEBUG    | __main__:trials:29 - Trial = 5176/30000 | Total reward = 12.98
2022-01-26 14:16:49.398 | DEBUG    | __main__:trials:24 - Trial = 5177/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.400 | DEBUG    | __main__:trials:29 - Trial = 5177/30000 | Total reward = 58.16
2022-01-26 14:16:49.404 | DEBUG    | __main__:trials:24 - Trial = 5178/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.406 | DEBUG    | __main__:trials:29 - Trial = 5178/30000 | Total reward = 44.66
2022-01-26 14:16:49.409 | DEBUG    | __main__:trials:24 - Trial = 5179/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.411 | DEBUG    | __main__:trials:29 - Trial = 5179/30000 | Total reward = 62.52
2022-01-26 14:16:49.415 | DEBUG    | __main__:trials:24 - Trial = 5180/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.416 | DEBUG    | __main__:trials:29 - Trial = 5180/30000 | Total reward = 40.09
2022-01-26 14:16:49.420 | DEBUG    | __main__:trials:24 - Trial = 5181/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.422 | DEBUG    | __main__:trials:29 - Trial = 5181/30000 | Total reward = 49.15
2022-01-26 14:16:49.425 | DEBUG    | __main__:trials:24 - Trial = 5182/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.427 | DEBUG    | __main__:trials:29 - Trial = 5182/30000 | Total reward = 39.44
2022-01-26 14:16:49.430 | DEBUG    | __main__:trials:24 - Trial = 5183/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.432 | DEBUG    | __main__:trials:29 - Trial = 5183/30000 | Total reward = 24.12
2022-01-26 14:16:49.435 | DEBUG    | __main__:trials:24 - Trial = 5184/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.437 | DEBUG    | __main__:trials:29 - Trial = 5184/30000 | Total reward = 48.22
2022-01-26 14:16:49.439 | DEBUG    | __main__:trials:24 - Trial = 5185/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.441 | DEBUG    | __main__:trials:29 - Trial = 5185/30000 | Total reward = 50.65
2022-01-26 14:16:49.445 | DEBUG    | __main__:trials:24 - Trial = 5186/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.446 | DEBUG    | __main__:trials:29 - Trial = 5186/30000 | Total reward = 50.61
2022-01-26 14:16:49.450 | DEBUG    | __main__:trials:24 - Trial = 5187/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.452 | DEBUG    | __main__:trials:29 - Trial = 5187/30000 | Total reward = 48.85
2022-01-26 14:16:49.455 | DEBUG    | __main__:trials:24 - Trial = 5188/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.456 | DEBUG    | __main__:trials:29 - Trial = 5188/30000 | Total reward = 40.33
2022-01-26 14:16:49.460 | DEBUG    | __main__:trials:24 - Trial = 5189/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.462 | DEBUG    | __main__:trials:29 - Trial = 5189/30000 | Total reward = 52.48
2022-01-26 14:16:49.465 | DEBUG    | __main__:trials:24 - Trial = 5190/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.466 | DEBUG    | __main__:trials:29 - Trial = 5190/30000 | Total reward = 51.30
2022-01-26 14:16:49.471 | DEBUG    | __main__:trials:24 - Trial = 5191/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.472 | DEBUG    | __main__:trials:29 - Trial = 5191/30000 | Total reward = 49.09
2022-01-26 14:16:49.476 | DEBUG    | __main__:trials:24 - Trial = 5192/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.478 | DEBUG    | __main__:trials:29 - Trial = 5192/30000 | Total reward = 53.79
2022-01-26 14:16:49.481 | DEBUG    | __main__:trials:24 - Trial = 5193/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.482 | DEBUG    | __main__:trials:29 - Trial = 5193/30000 | Total reward = 50.53
2022-01-26 14:16:49.486 | DEBUG    | __main__:trials:24 - Trial = 5194/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.487 | DEBUG    | __main__:trials:29 - Trial = 5194/30000 | Total reward = 46.64
2022-01-26 14:16:49.491 | DEBUG    | __main__:trials:24 - Trial = 5195/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.493 | DEBUG    | __main__:trials:29 - Trial = 5195/30000 | Total reward = 47.53
2022-01-26 14:16:49.496 | DEBUG    | __main__:trials:24 - Trial = 5196/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.498 | DEBUG    | __main__:trials:29 - Trial = 5196/30000 | Total reward = 50.48
2022-01-26 14:16:49.501 | DEBUG    | __main__:trials:24 - Trial = 5197/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.502 | DEBUG    | __main__:trials:29 - Trial = 5197/30000 | Total reward = 48.85
2022-01-26 14:16:49.505 | DEBUG    | __main__:trials:24 - Trial = 5198/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.507 | DEBUG    | __main__:trials:29 - Trial = 5198/30000 | Total reward = 50.39
2022-01-26 14:16:49.510 | DEBUG    | __main__:trials:24 - Trial = 5199/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.510 | DEBUG    | __main__:trials:29 - Trial = 5199/30000 | Total reward = 44.91
2022-01-26 14:16:49.514 | DEBUG    | __main__:trials:24 - Trial = 5200/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.515 | DEBUG    | __main__:trials:29 - Trial = 5200/30000 | Total reward = 47.27
2022-01-26 14:16:49.519 | DEBUG    | __main__:trials:24 - Trial = 5201/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.520 | DEBUG    | __main__:trials:29 - Trial = 5201/30000 | Total reward = 50.38
2022-01-26 14:16:49.524 | DEBUG    | __main__:trials:24 - Trial = 5202/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.526 | DEBUG    | __main__:trials:29 - Trial = 5202/30000 | Total reward = 40.31
2022-01-26 14:16:49.529 | DEBUG    | __main__:trials:24 - Trial = 5203/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.530 | DEBUG    | __main__:trials:29 - Trial = 5203/30000 | Total reward = 48.72
2022-01-26 14:16:49.534 | DEBUG    | __main__:trials:24 - Trial = 5204/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.534 | DEBUG    | __main__:trials:29 - Trial = 5204/30000 | Total reward = 36.23
2022-01-26 14:16:49.539 | DEBUG    | __main__:trials:24 - Trial = 5205/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.540 | DEBUG    | __main__:trials:29 - Trial = 5205/30000 | Total reward = 45.98
2022-01-26 14:16:49.544 | DEBUG    | __main__:trials:24 - Trial = 5206/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.546 | DEBUG    | __main__:trials:29 - Trial = 5206/30000 | Total reward = 49.20
2022-01-26 14:16:49.549 | DEBUG    | __main__:trials:24 - Trial = 5207/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.550 | DEBUG    | __main__:trials:29 - Trial = 5207/30000 | Total reward = 45.19
2022-01-26 14:16:49.555 | DEBUG    | __main__:trials:24 - Trial = 5208/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.555 | DEBUG    | __main__:trials:29 - Trial = 5208/30000 | Total reward = 44.11
2022-01-26 14:16:49.558 | DEBUG    | __main__:trials:26 - Trial = 5209/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.559 | DEBUG    | __main__:trials:29 - Trial = 5209/30000 | Total reward = 9.16
2022-01-26 14:16:49.562 | DEBUG    | __main__:trials:26 - Trial = 5210/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.564 | DEBUG    | __main__:trials:29 - Trial = 5210/30000 | Total reward = 22.06
2022-01-26 14:16:49.567 | DEBUG    | __main__:trials:26 - Trial = 5211/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.567 | DEBUG    | __main__:trials:29 - Trial = 5211/30000 | Total reward = 25.32
2022-01-26 14:16:49.571 | DEBUG    | __main__:trials:24 - Trial = 5212/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.573 | DEBUG    | __main__:trials:29 - Trial = 5212/30000 | Total reward = 40.31
2022-01-26 14:16:49.577 | DEBUG    | __main__:trials:24 - Trial = 5213/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.577 | DEBUG    | __main__:trials:29 - Trial = 5213/30000 | Total reward = 48.84
2022-01-26 14:16:49.581 | DEBUG    | __main__:trials:24 - Trial = 5214/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.582 | DEBUG    | __main__:trials:29 - Trial = 5214/30000 | Total reward = 41.88
2022-01-26 14:16:49.585 | DEBUG    | __main__:trials:24 - Trial = 5215/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.587 | DEBUG    | __main__:trials:29 - Trial = 5215/30000 | Total reward = 22.33
2022-01-26 14:16:49.591 | DEBUG    | __main__:trials:24 - Trial = 5216/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.592 | DEBUG    | __main__:trials:29 - Trial = 5216/30000 | Total reward = 47.94
2022-01-26 14:16:49.596 | DEBUG    | __main__:trials:24 - Trial = 5217/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.598 | DEBUG    | __main__:trials:29 - Trial = 5217/30000 | Total reward = 49.82
2022-01-26 14:16:49.602 | DEBUG    | __main__:trials:24 - Trial = 5218/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.602 | DEBUG    | __main__:trials:29 - Trial = 5218/30000 | Total reward = 49.22
2022-01-26 14:16:49.607 | DEBUG    | __main__:trials:24 - Trial = 5219/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.607 | DEBUG    | __main__:trials:29 - Trial = 5219/30000 | Total reward = 46.36
2022-01-26 14:16:49.612 | DEBUG    | __main__:trials:24 - Trial = 5220/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.612 | DEBUG    | __main__:trials:29 - Trial = 5220/30000 | Total reward = 50.94
2022-01-26 14:16:49.616 | DEBUG    | __main__:trials:24 - Trial = 5221/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.617 | DEBUG    | __main__:trials:29 - Trial = 5221/30000 | Total reward = 59.70
2022-01-26 14:16:49.621 | DEBUG    | __main__:trials:24 - Trial = 5222/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.622 | DEBUG    | __main__:trials:29 - Trial = 5222/30000 | Total reward = 49.85
2022-01-26 14:16:49.625 | DEBUG    | __main__:trials:26 - Trial = 5223/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.626 | DEBUG    | __main__:trials:29 - Trial = 5223/30000 | Total reward = 31.73
2022-01-26 14:16:49.630 | DEBUG    | __main__:trials:24 - Trial = 5224/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.630 | DEBUG    | __main__:trials:29 - Trial = 5224/30000 | Total reward = 59.97
2022-01-26 14:16:49.634 | DEBUG    | __main__:trials:24 - Trial = 5225/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.635 | DEBUG    | __main__:trials:29 - Trial = 5225/30000 | Total reward = 58.60
2022-01-26 14:16:49.640 | DEBUG    | __main__:trials:24 - Trial = 5226/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.641 | DEBUG    | __main__:trials:29 - Trial = 5226/30000 | Total reward = 43.85
2022-01-26 14:16:49.645 | DEBUG    | __main__:trials:24 - Trial = 5227/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.646 | DEBUG    | __main__:trials:29 - Trial = 5227/30000 | Total reward = 15.96
2022-01-26 14:16:49.650 | DEBUG    | __main__:trials:24 - Trial = 5228/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.651 | DEBUG    | __main__:trials:29 - Trial = 5228/30000 | Total reward = 54.70
2022-01-26 14:16:49.655 | DEBUG    | __main__:trials:24 - Trial = 5229/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.657 | DEBUG    | __main__:trials:29 - Trial = 5229/30000 | Total reward = 47.54
2022-01-26 14:16:49.660 | DEBUG    | __main__:trials:24 - Trial = 5230/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.662 | DEBUG    | __main__:trials:29 - Trial = 5230/30000 | Total reward = 54.73
2022-01-26 14:16:49.666 | DEBUG    | __main__:trials:24 - Trial = 5231/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.667 | DEBUG    | __main__:trials:29 - Trial = 5231/30000 | Total reward = 30.98
2022-01-26 14:16:49.671 | DEBUG    | __main__:trials:24 - Trial = 5232/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.673 | DEBUG    | __main__:trials:29 - Trial = 5232/30000 | Total reward = 38.80
2022-01-26 14:16:49.676 | DEBUG    | __main__:trials:26 - Trial = 5233/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:49.677 | DEBUG    | __main__:trials:29 - Trial = 5233/30000 | Total reward = 19.77
2022-01-26 14:16:49.680 | DEBUG    | __main__:trials:24 - Trial = 5234/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.681 | DEBUG    | __main__:trials:29 - Trial = 5234/30000 | Total reward = 51.32
2022-01-26 14:16:49.684 | DEBUG    | __main__:trials:24 - Trial = 5235/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.685 | DEBUG    | __main__:trials:29 - Trial = 5235/30000 | Total reward = 55.34
2022-01-26 14:16:49.689 | DEBUG    | __main__:trials:24 - Trial = 5236/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.690 | DEBUG    | __main__:trials:29 - Trial = 5236/30000 | Total reward = 39.52
2022-01-26 14:16:49.694 | DEBUG    | __main__:trials:24 - Trial = 5237/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.695 | DEBUG    | __main__:trials:29 - Trial = 5237/30000 | Total reward = 49.10
2022-01-26 14:16:49.699 | DEBUG    | __main__:trials:24 - Trial = 5238/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.701 | DEBUG    | __main__:trials:29 - Trial = 5238/30000 | Total reward = 48.94
2022-01-26 14:16:49.704 | DEBUG    | __main__:trials:24 - Trial = 5239/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.706 | DEBUG    | __main__:trials:29 - Trial = 5239/30000 | Total reward = 49.69
2022-01-26 14:16:49.710 | DEBUG    | __main__:trials:24 - Trial = 5240/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.710 | DEBUG    | __main__:trials:29 - Trial = 5240/30000 | Total reward = 50.23
2022-01-26 14:16:49.715 | DEBUG    | __main__:trials:24 - Trial = 5241/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.715 | DEBUG    | __main__:trials:29 - Trial = 5241/30000 | Total reward = 48.76
2022-01-26 14:16:49.720 | DEBUG    | __main__:trials:24 - Trial = 5242/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.721 | DEBUG    | __main__:trials:29 - Trial = 5242/30000 | Total reward = 42.53
2022-01-26 14:16:49.725 | DEBUG    | __main__:trials:24 - Trial = 5243/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.726 | DEBUG    | __main__:trials:29 - Trial = 5243/30000 | Total reward = 5.14
2022-01-26 14:16:49.729 | DEBUG    | __main__:trials:24 - Trial = 5244/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.730 | DEBUG    | __main__:trials:29 - Trial = 5244/30000 | Total reward = 48.05
2022-01-26 14:16:49.734 | DEBUG    | __main__:trials:24 - Trial = 5245/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.735 | DEBUG    | __main__:trials:29 - Trial = 5245/30000 | Total reward = 50.33
2022-01-26 14:16:49.739 | DEBUG    | __main__:trials:24 - Trial = 5246/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.740 | DEBUG    | __main__:trials:29 - Trial = 5246/30000 | Total reward = 49.38
2022-01-26 14:16:49.743 | DEBUG    | __main__:trials:24 - Trial = 5247/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.745 | DEBUG    | __main__:trials:29 - Trial = 5247/30000 | Total reward = 44.94
2022-01-26 14:16:49.748 | DEBUG    | __main__:trials:24 - Trial = 5248/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.748 | DEBUG    | __main__:trials:29 - Trial = 5248/30000 | Total reward = 33.00
2022-01-26 14:16:49.752 | DEBUG    | __main__:trials:24 - Trial = 5249/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.753 | DEBUG    | __main__:trials:29 - Trial = 5249/30000 | Total reward = 47.82
2022-01-26 14:16:49.757 | DEBUG    | __main__:trials:24 - Trial = 5250/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.759 | DEBUG    | __main__:trials:29 - Trial = 5250/30000 | Total reward = 48.77
2022-01-26 14:16:49.762 | DEBUG    | __main__:trials:24 - Trial = 5251/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.763 | DEBUG    | __main__:trials:29 - Trial = 5251/30000 | Total reward = 50.32
2022-01-26 14:16:49.768 | DEBUG    | __main__:trials:24 - Trial = 5252/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.768 | DEBUG    | __main__:trials:29 - Trial = 5252/30000 | Total reward = 20.45
2022-01-26 14:16:49.772 | DEBUG    | __main__:trials:24 - Trial = 5253/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.774 | DEBUG    | __main__:trials:29 - Trial = 5253/30000 | Total reward = 49.69
2022-01-26 14:16:49.777 | DEBUG    | __main__:trials:24 - Trial = 5254/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.779 | DEBUG    | __main__:trials:29 - Trial = 5254/30000 | Total reward = 49.36
2022-01-26 14:16:49.782 | DEBUG    | __main__:trials:24 - Trial = 5255/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.784 | DEBUG    | __main__:trials:29 - Trial = 5255/30000 | Total reward = 50.53
2022-01-26 14:16:49.787 | DEBUG    | __main__:trials:24 - Trial = 5256/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.788 | DEBUG    | __main__:trials:29 - Trial = 5256/30000 | Total reward = 49.56
2022-01-26 14:16:49.791 | DEBUG    | __main__:trials:24 - Trial = 5257/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.793 | DEBUG    | __main__:trials:29 - Trial = 5257/30000 | Total reward = 37.38
2022-01-26 14:16:49.796 | DEBUG    | __main__:trials:24 - Trial = 5258/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.798 | DEBUG    | __main__:trials:29 - Trial = 5258/30000 | Total reward = 48.35
2022-01-26 14:16:49.802 | DEBUG    | __main__:trials:24 - Trial = 5259/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.802 | DEBUG    | __main__:trials:29 - Trial = 5259/30000 | Total reward = 44.61
2022-01-26 14:16:49.807 | DEBUG    | __main__:trials:24 - Trial = 5260/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.809 | DEBUG    | __main__:trials:29 - Trial = 5260/30000 | Total reward = 49.28
2022-01-26 14:16:49.812 | DEBUG    | __main__:trials:24 - Trial = 5261/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.813 | DEBUG    | __main__:trials:29 - Trial = 5261/30000 | Total reward = 50.01
2022-01-26 14:16:49.818 | DEBUG    | __main__:trials:24 - Trial = 5262/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.819 | DEBUG    | __main__:trials:29 - Trial = 5262/30000 | Total reward = 48.71
2022-01-26 14:16:49.822 | DEBUG    | __main__:trials:24 - Trial = 5263/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.824 | DEBUG    | __main__:trials:29 - Trial = 5263/30000 | Total reward = 41.85
2022-01-26 14:16:49.828 | DEBUG    | __main__:trials:24 - Trial = 5264/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.830 | DEBUG    | __main__:trials:29 - Trial = 5264/30000 | Total reward = 46.57
2022-01-26 14:16:49.833 | DEBUG    | __main__:trials:24 - Trial = 5265/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.834 | DEBUG    | __main__:trials:29 - Trial = 5265/30000 | Total reward = 47.48
2022-01-26 14:16:49.838 | DEBUG    | __main__:trials:24 - Trial = 5266/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.840 | DEBUG    | __main__:trials:29 - Trial = 5266/30000 | Total reward = 50.18
2022-01-26 14:16:49.843 | DEBUG    | __main__:trials:24 - Trial = 5267/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.844 | DEBUG    | __main__:trials:29 - Trial = 5267/30000 | Total reward = 45.00
2022-01-26 14:16:49.849 | DEBUG    | __main__:trials:24 - Trial = 5268/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.850 | DEBUG    | __main__:trials:29 - Trial = 5268/30000 | Total reward = 48.77
2022-01-26 14:16:49.854 | DEBUG    | __main__:trials:24 - Trial = 5269/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.855 | DEBUG    | __main__:trials:29 - Trial = 5269/30000 | Total reward = 48.35
2022-01-26 14:16:49.858 | DEBUG    | __main__:trials:24 - Trial = 5270/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.860 | DEBUG    | __main__:trials:29 - Trial = 5270/30000 | Total reward = 45.52
2022-01-26 14:16:49.864 | DEBUG    | __main__:trials:24 - Trial = 5271/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.864 | DEBUG    | __main__:trials:29 - Trial = 5271/30000 | Total reward = 57.84
2022-01-26 14:16:49.868 | DEBUG    | __main__:trials:24 - Trial = 5272/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.870 | DEBUG    | __main__:trials:29 - Trial = 5272/30000 | Total reward = 47.22
2022-01-26 14:16:49.874 | DEBUG    | __main__:trials:24 - Trial = 5273/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.875 | DEBUG    | __main__:trials:29 - Trial = 5273/30000 | Total reward = 51.85
2022-01-26 14:16:49.879 | DEBUG    | __main__:trials:24 - Trial = 5274/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.880 | DEBUG    | __main__:trials:29 - Trial = 5274/30000 | Total reward = 42.04
2022-01-26 14:16:49.884 | DEBUG    | __main__:trials:24 - Trial = 5275/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.885 | DEBUG    | __main__:trials:29 - Trial = 5275/30000 | Total reward = 53.35
2022-01-26 14:16:49.889 | DEBUG    | __main__:trials:24 - Trial = 5276/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.890 | DEBUG    | __main__:trials:29 - Trial = 5276/30000 | Total reward = 43.47
2022-01-26 14:16:49.894 | DEBUG    | __main__:trials:24 - Trial = 5277/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.895 | DEBUG    | __main__:trials:29 - Trial = 5277/30000 | Total reward = 9.17
2022-01-26 14:16:49.900 | DEBUG    | __main__:trials:24 - Trial = 5278/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.901 | DEBUG    | __main__:trials:29 - Trial = 5278/30000 | Total reward = 51.31
2022-01-26 14:16:49.905 | DEBUG    | __main__:trials:24 - Trial = 5279/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.906 | DEBUG    | __main__:trials:29 - Trial = 5279/30000 | Total reward = 47.46
2022-01-26 14:16:49.909 | DEBUG    | __main__:trials:24 - Trial = 5280/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.910 | DEBUG    | __main__:trials:29 - Trial = 5280/30000 | Total reward = 46.70
2022-01-26 14:16:49.913 | DEBUG    | __main__:trials:24 - Trial = 5281/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.915 | DEBUG    | __main__:trials:29 - Trial = 5281/30000 | Total reward = 43.97
2022-01-26 14:16:49.919 | DEBUG    | __main__:trials:24 - Trial = 5282/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.919 | DEBUG    | __main__:trials:29 - Trial = 5282/30000 | Total reward = 47.08
2022-01-26 14:16:49.923 | DEBUG    | __main__:trials:24 - Trial = 5283/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.924 | DEBUG    | __main__:trials:29 - Trial = 5283/30000 | Total reward = 51.86
2022-01-26 14:16:49.927 | DEBUG    | __main__:trials:24 - Trial = 5284/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.928 | DEBUG    | __main__:trials:29 - Trial = 5284/30000 | Total reward = 49.19
2022-01-26 14:16:49.932 | DEBUG    | __main__:trials:24 - Trial = 5285/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.932 | DEBUG    | __main__:trials:29 - Trial = 5285/30000 | Total reward = 49.15
2022-01-26 14:16:49.937 | DEBUG    | __main__:trials:24 - Trial = 5286/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.937 | DEBUG    | __main__:trials:29 - Trial = 5286/30000 | Total reward = 44.51
2022-01-26 14:16:49.942 | DEBUG    | __main__:trials:24 - Trial = 5287/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.944 | DEBUG    | __main__:trials:29 - Trial = 5287/30000 | Total reward = 46.85
2022-01-26 14:16:49.948 | DEBUG    | __main__:trials:24 - Trial = 5288/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.949 | DEBUG    | __main__:trials:29 - Trial = 5288/30000 | Total reward = 56.16
2022-01-26 14:16:49.953 | DEBUG    | __main__:trials:24 - Trial = 5289/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.955 | DEBUG    | __main__:trials:29 - Trial = 5289/30000 | Total reward = 45.02
2022-01-26 14:16:49.958 | DEBUG    | __main__:trials:24 - Trial = 5290/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.960 | DEBUG    | __main__:trials:29 - Trial = 5290/30000 | Total reward = 50.16
2022-01-26 14:16:49.963 | DEBUG    | __main__:trials:24 - Trial = 5291/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.965 | DEBUG    | __main__:trials:29 - Trial = 5291/30000 | Total reward = 48.01
2022-01-26 14:16:49.969 | DEBUG    | __main__:trials:24 - Trial = 5292/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.970 | DEBUG    | __main__:trials:29 - Trial = 5292/30000 | Total reward = 42.64
2022-01-26 14:16:49.974 | DEBUG    | __main__:trials:24 - Trial = 5293/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.975 | DEBUG    | __main__:trials:29 - Trial = 5293/30000 | Total reward = 43.01
2022-01-26 14:16:49.979 | DEBUG    | __main__:trials:24 - Trial = 5294/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.981 | DEBUG    | __main__:trials:29 - Trial = 5294/30000 | Total reward = 31.66
2022-01-26 14:16:49.985 | DEBUG    | __main__:trials:24 - Trial = 5295/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.986 | DEBUG    | __main__:trials:29 - Trial = 5295/30000 | Total reward = 43.81
2022-01-26 14:16:49.990 | DEBUG    | __main__:trials:24 - Trial = 5296/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.992 | DEBUG    | __main__:trials:29 - Trial = 5296/30000 | Total reward = 55.73
2022-01-26 14:16:49.996 | DEBUG    | __main__:trials:24 - Trial = 5297/30000 | Max number of steps (20) reached
2022-01-26 14:16:49.997 | DEBUG    | __main__:trials:29 - Trial = 5297/30000 | Total reward = 46.95
2022-01-26 14:16:50.001 | DEBUG    | __main__:trials:24 - Trial = 5298/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.002 | DEBUG    | __main__:trials:29 - Trial = 5298/30000 | Total reward = 60.48
2022-01-26 14:16:50.006 | DEBUG    | __main__:trials:24 - Trial = 5299/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.007 | DEBUG    | __main__:trials:29 - Trial = 5299/30000 | Total reward = 52.30
2022-01-26 14:16:50.011 | DEBUG    | __main__:trials:24 - Trial = 5300/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.011 | DEBUG    | __main__:trials:29 - Trial = 5300/30000 | Total reward = 48.05
2022-01-26 14:16:50.015 | DEBUG    | __main__:trials:24 - Trial = 5301/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.017 | DEBUG    | __main__:trials:29 - Trial = 5301/30000 | Total reward = 47.34
2022-01-26 14:16:50.020 | DEBUG    | __main__:trials:24 - Trial = 5302/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.021 | DEBUG    | __main__:trials:29 - Trial = 5302/30000 | Total reward = 54.85
2022-01-26 14:16:50.025 | DEBUG    | __main__:trials:24 - Trial = 5303/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.026 | DEBUG    | __main__:trials:29 - Trial = 5303/30000 | Total reward = 34.37
2022-01-26 14:16:50.030 | DEBUG    | __main__:trials:24 - Trial = 5304/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.032 | DEBUG    | __main__:trials:29 - Trial = 5304/30000 | Total reward = 42.82
2022-01-26 14:16:50.036 | DEBUG    | __main__:trials:24 - Trial = 5305/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.036 | DEBUG    | __main__:trials:29 - Trial = 5305/30000 | Total reward = 47.71
2022-01-26 14:16:50.041 | DEBUG    | __main__:trials:24 - Trial = 5306/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.042 | DEBUG    | __main__:trials:29 - Trial = 5306/30000 | Total reward = 48.72
2022-01-26 14:16:50.046 | DEBUG    | __main__:trials:26 - Trial = 5307/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.047 | DEBUG    | __main__:trials:29 - Trial = 5307/30000 | Total reward = 18.29
2022-01-26 14:16:50.051 | DEBUG    | __main__:trials:24 - Trial = 5308/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.053 | DEBUG    | __main__:trials:29 - Trial = 5308/30000 | Total reward = 52.84
2022-01-26 14:16:50.056 | DEBUG    | __main__:trials:24 - Trial = 5309/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.057 | DEBUG    | __main__:trials:29 - Trial = 5309/30000 | Total reward = 38.13
2022-01-26 14:16:50.061 | DEBUG    | __main__:trials:24 - Trial = 5310/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.062 | DEBUG    | __main__:trials:29 - Trial = 5310/30000 | Total reward = 48.89
2022-01-26 14:16:50.066 | DEBUG    | __main__:trials:24 - Trial = 5311/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.067 | DEBUG    | __main__:trials:29 - Trial = 5311/30000 | Total reward = 46.54
2022-01-26 14:16:50.071 | DEBUG    | __main__:trials:24 - Trial = 5312/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.072 | DEBUG    | __main__:trials:29 - Trial = 5312/30000 | Total reward = 50.66
2022-01-26 14:16:50.076 | DEBUG    | __main__:trials:24 - Trial = 5313/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.077 | DEBUG    | __main__:trials:29 - Trial = 5313/30000 | Total reward = 39.68
2022-01-26 14:16:50.082 | DEBUG    | __main__:trials:24 - Trial = 5314/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.083 | DEBUG    | __main__:trials:29 - Trial = 5314/30000 | Total reward = 49.45
2022-01-26 14:16:50.086 | DEBUG    | __main__:trials:24 - Trial = 5315/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.088 | DEBUG    | __main__:trials:29 - Trial = 5315/30000 | Total reward = 54.39
2022-01-26 14:16:50.091 | DEBUG    | __main__:trials:24 - Trial = 5316/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.093 | DEBUG    | __main__:trials:29 - Trial = 5316/30000 | Total reward = 53.63
2022-01-26 14:16:50.096 | DEBUG    | __main__:trials:24 - Trial = 5317/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.097 | DEBUG    | __main__:trials:29 - Trial = 5317/30000 | Total reward = 50.12
2022-01-26 14:16:50.102 | DEBUG    | __main__:trials:24 - Trial = 5318/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.102 | DEBUG    | __main__:trials:29 - Trial = 5318/30000 | Total reward = 52.13
2022-01-26 14:16:50.107 | DEBUG    | __main__:trials:24 - Trial = 5319/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.108 | DEBUG    | __main__:trials:29 - Trial = 5319/30000 | Total reward = 49.69
2022-01-26 14:16:50.112 | DEBUG    | __main__:trials:24 - Trial = 5320/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.113 | DEBUG    | __main__:trials:29 - Trial = 5320/30000 | Total reward = 52.54
2022-01-26 14:16:50.117 | DEBUG    | __main__:trials:24 - Trial = 5321/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.118 | DEBUG    | __main__:trials:29 - Trial = 5321/30000 | Total reward = 52.59
2022-01-26 14:16:50.122 | DEBUG    | __main__:trials:24 - Trial = 5322/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.123 | DEBUG    | __main__:trials:29 - Trial = 5322/30000 | Total reward = 54.54
2022-01-26 14:16:50.127 | DEBUG    | __main__:trials:24 - Trial = 5323/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.128 | DEBUG    | __main__:trials:29 - Trial = 5323/30000 | Total reward = 64.25
2022-01-26 14:16:50.132 | DEBUG    | __main__:trials:24 - Trial = 5324/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.133 | DEBUG    | __main__:trials:29 - Trial = 5324/30000 | Total reward = 45.84
2022-01-26 14:16:50.137 | DEBUG    | __main__:trials:24 - Trial = 5325/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.139 | DEBUG    | __main__:trials:29 - Trial = 5325/30000 | Total reward = 48.16
2022-01-26 14:16:50.143 | DEBUG    | __main__:trials:24 - Trial = 5326/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.144 | DEBUG    | __main__:trials:29 - Trial = 5326/30000 | Total reward = 42.68
2022-01-26 14:16:50.148 | DEBUG    | __main__:trials:24 - Trial = 5327/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.149 | DEBUG    | __main__:trials:29 - Trial = 5327/30000 | Total reward = 49.69
2022-01-26 14:16:50.152 | DEBUG    | __main__:trials:24 - Trial = 5328/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.154 | DEBUG    | __main__:trials:29 - Trial = 5328/30000 | Total reward = 49.06
2022-01-26 14:16:50.157 | DEBUG    | __main__:trials:24 - Trial = 5329/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.157 | DEBUG    | __main__:trials:29 - Trial = 5329/30000 | Total reward = 45.91
2022-01-26 14:16:50.162 | DEBUG    | __main__:trials:24 - Trial = 5330/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.163 | DEBUG    | __main__:trials:29 - Trial = 5330/30000 | Total reward = 49.22
2022-01-26 14:16:50.167 | DEBUG    | __main__:trials:24 - Trial = 5331/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.167 | DEBUG    | __main__:trials:29 - Trial = 5331/30000 | Total reward = 26.67
2022-01-26 14:16:50.171 | DEBUG    | __main__:trials:24 - Trial = 5332/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.173 | DEBUG    | __main__:trials:29 - Trial = 5332/30000 | Total reward = 44.25
2022-01-26 14:16:50.176 | DEBUG    | __main__:trials:24 - Trial = 5333/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.178 | DEBUG    | __main__:trials:29 - Trial = 5333/30000 | Total reward = 49.27
2022-01-26 14:16:50.182 | DEBUG    | __main__:trials:24 - Trial = 5334/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.182 | DEBUG    | __main__:trials:29 - Trial = 5334/30000 | Total reward = 43.02
2022-01-26 14:16:50.186 | DEBUG    | __main__:trials:24 - Trial = 5335/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.188 | DEBUG    | __main__:trials:29 - Trial = 5335/30000 | Total reward = 46.24
2022-01-26 14:16:50.191 | DEBUG    | __main__:trials:24 - Trial = 5336/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.192 | DEBUG    | __main__:trials:29 - Trial = 5336/30000 | Total reward = 28.94
2022-01-26 14:16:50.195 | DEBUG    | __main__:trials:24 - Trial = 5337/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.197 | DEBUG    | __main__:trials:29 - Trial = 5337/30000 | Total reward = 42.88
2022-01-26 14:16:50.200 | DEBUG    | __main__:trials:24 - Trial = 5338/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.202 | DEBUG    | __main__:trials:29 - Trial = 5338/30000 | Total reward = 45.24
2022-01-26 14:16:50.206 | DEBUG    | __main__:trials:24 - Trial = 5339/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.206 | DEBUG    | __main__:trials:29 - Trial = 5339/30000 | Total reward = 48.92
2022-01-26 14:16:50.211 | DEBUG    | __main__:trials:24 - Trial = 5340/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.213 | DEBUG    | __main__:trials:29 - Trial = 5340/30000 | Total reward = 48.44
2022-01-26 14:16:50.216 | DEBUG    | __main__:trials:24 - Trial = 5341/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.217 | DEBUG    | __main__:trials:29 - Trial = 5341/30000 | Total reward = 47.27
2022-01-26 14:16:50.221 | DEBUG    | __main__:trials:24 - Trial = 5342/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.223 | DEBUG    | __main__:trials:29 - Trial = 5342/30000 | Total reward = 46.78
2022-01-26 14:16:50.226 | DEBUG    | __main__:trials:24 - Trial = 5343/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.227 | DEBUG    | __main__:trials:29 - Trial = 5343/30000 | Total reward = 45.18
2022-01-26 14:16:50.231 | DEBUG    | __main__:trials:24 - Trial = 5344/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.233 | DEBUG    | __main__:trials:29 - Trial = 5344/30000 | Total reward = 38.39
2022-01-26 14:16:50.235 | DEBUG    | __main__:trials:26 - Trial = 5345/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.237 | DEBUG    | __main__:trials:29 - Trial = 5345/30000 | Total reward = 16.62
2022-01-26 14:16:50.240 | DEBUG    | __main__:trials:24 - Trial = 5346/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.241 | DEBUG    | __main__:trials:29 - Trial = 5346/30000 | Total reward = 57.13
2022-01-26 14:16:50.245 | DEBUG    | __main__:trials:24 - Trial = 5347/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.245 | DEBUG    | __main__:trials:29 - Trial = 5347/30000 | Total reward = 50.52
2022-01-26 14:16:50.249 | DEBUG    | __main__:trials:24 - Trial = 5348/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.249 | DEBUG    | __main__:trials:29 - Trial = 5348/30000 | Total reward = 48.91
2022-01-26 14:16:50.253 | DEBUG    | __main__:trials:24 - Trial = 5349/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.255 | DEBUG    | __main__:trials:29 - Trial = 5349/30000 | Total reward = 32.89
2022-01-26 14:16:50.259 | DEBUG    | __main__:trials:24 - Trial = 5350/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.260 | DEBUG    | __main__:trials:29 - Trial = 5350/30000 | Total reward = 28.96
2022-01-26 14:16:50.265 | DEBUG    | __main__:trials:24 - Trial = 5351/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.265 | DEBUG    | __main__:trials:29 - Trial = 5351/30000 | Total reward = 59.11
2022-01-26 14:16:50.268 | DEBUG    | __main__:trials:24 - Trial = 5352/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.269 | DEBUG    | __main__:trials:29 - Trial = 5352/30000 | Total reward = 45.25
2022-01-26 14:16:50.273 | DEBUG    | __main__:trials:24 - Trial = 5353/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.273 | DEBUG    | __main__:trials:29 - Trial = 5353/30000 | Total reward = 45.66
2022-01-26 14:16:50.278 | DEBUG    | __main__:trials:24 - Trial = 5354/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.279 | DEBUG    | __main__:trials:29 - Trial = 5354/30000 | Total reward = 13.88
2022-01-26 14:16:50.283 | DEBUG    | __main__:trials:24 - Trial = 5355/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.284 | DEBUG    | __main__:trials:29 - Trial = 5355/30000 | Total reward = 41.13
2022-01-26 14:16:50.288 | DEBUG    | __main__:trials:24 - Trial = 5356/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.290 | DEBUG    | __main__:trials:29 - Trial = 5356/30000 | Total reward = 49.09
2022-01-26 14:16:50.293 | DEBUG    | __main__:trials:24 - Trial = 5357/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.295 | DEBUG    | __main__:trials:29 - Trial = 5357/30000 | Total reward = 50.63
2022-01-26 14:16:50.299 | DEBUG    | __main__:trials:24 - Trial = 5358/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.300 | DEBUG    | __main__:trials:29 - Trial = 5358/30000 | Total reward = 53.39
2022-01-26 14:16:50.304 | DEBUG    | __main__:trials:24 - Trial = 5359/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.306 | DEBUG    | __main__:trials:29 - Trial = 5359/30000 | Total reward = 55.29
2022-01-26 14:16:50.309 | DEBUG    | __main__:trials:24 - Trial = 5360/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.310 | DEBUG    | __main__:trials:29 - Trial = 5360/30000 | Total reward = 50.02
2022-01-26 14:16:50.315 | DEBUG    | __main__:trials:24 - Trial = 5361/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.316 | DEBUG    | __main__:trials:29 - Trial = 5361/30000 | Total reward = 41.36
2022-01-26 14:16:50.320 | DEBUG    | __main__:trials:24 - Trial = 5362/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.321 | DEBUG    | __main__:trials:29 - Trial = 5362/30000 | Total reward = 48.34
2022-01-26 14:16:50.325 | DEBUG    | __main__:trials:24 - Trial = 5363/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.326 | DEBUG    | __main__:trials:29 - Trial = 5363/30000 | Total reward = 50.28
2022-01-26 14:16:50.329 | DEBUG    | __main__:trials:24 - Trial = 5364/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.331 | DEBUG    | __main__:trials:29 - Trial = 5364/30000 | Total reward = 30.14
2022-01-26 14:16:50.334 | DEBUG    | __main__:trials:24 - Trial = 5365/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.336 | DEBUG    | __main__:trials:29 - Trial = 5365/30000 | Total reward = 49.40
2022-01-26 14:16:50.340 | DEBUG    | __main__:trials:24 - Trial = 5366/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.341 | DEBUG    | __main__:trials:29 - Trial = 5366/30000 | Total reward = 21.91
2022-01-26 14:16:50.345 | DEBUG    | __main__:trials:24 - Trial = 5367/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.345 | DEBUG    | __main__:trials:29 - Trial = 5367/30000 | Total reward = 41.12
2022-01-26 14:16:50.350 | DEBUG    | __main__:trials:26 - Trial = 5368/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.351 | DEBUG    | __main__:trials:29 - Trial = 5368/30000 | Total reward = 34.85
2022-01-26 14:16:50.355 | DEBUG    | __main__:trials:24 - Trial = 5369/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.357 | DEBUG    | __main__:trials:29 - Trial = 5369/30000 | Total reward = 51.23
2022-01-26 14:16:50.360 | DEBUG    | __main__:trials:24 - Trial = 5370/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.362 | DEBUG    | __main__:trials:29 - Trial = 5370/30000 | Total reward = 54.47
2022-01-26 14:16:50.366 | DEBUG    | __main__:trials:24 - Trial = 5371/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.366 | DEBUG    | __main__:trials:29 - Trial = 5371/30000 | Total reward = 23.29
2022-01-26 14:16:50.370 | DEBUG    | __main__:trials:24 - Trial = 5372/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.372 | DEBUG    | __main__:trials:29 - Trial = 5372/30000 | Total reward = 44.20
2022-01-26 14:16:50.375 | DEBUG    | __main__:trials:24 - Trial = 5373/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.376 | DEBUG    | __main__:trials:29 - Trial = 5373/30000 | Total reward = 30.70
2022-01-26 14:16:50.380 | DEBUG    | __main__:trials:24 - Trial = 5374/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.382 | DEBUG    | __main__:trials:29 - Trial = 5374/30000 | Total reward = 47.58
2022-01-26 14:16:50.385 | DEBUG    | __main__:trials:24 - Trial = 5375/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.387 | DEBUG    | __main__:trials:29 - Trial = 5375/30000 | Total reward = 47.74
2022-01-26 14:16:50.390 | DEBUG    | __main__:trials:24 - Trial = 5376/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.391 | DEBUG    | __main__:trials:29 - Trial = 5376/30000 | Total reward = 48.58
2022-01-26 14:16:50.395 | DEBUG    | __main__:trials:24 - Trial = 5377/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.397 | DEBUG    | __main__:trials:29 - Trial = 5377/30000 | Total reward = 53.51
2022-01-26 14:16:50.400 | DEBUG    | __main__:trials:24 - Trial = 5378/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.402 | DEBUG    | __main__:trials:29 - Trial = 5378/30000 | Total reward = 35.22
2022-01-26 14:16:50.405 | DEBUG    | __main__:trials:24 - Trial = 5379/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.406 | DEBUG    | __main__:trials:29 - Trial = 5379/30000 | Total reward = 48.63
2022-01-26 14:16:50.410 | DEBUG    | __main__:trials:24 - Trial = 5380/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.412 | DEBUG    | __main__:trials:29 - Trial = 5380/30000 | Total reward = 26.80
2022-01-26 14:16:50.415 | DEBUG    | __main__:trials:24 - Trial = 5381/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.417 | DEBUG    | __main__:trials:29 - Trial = 5381/30000 | Total reward = 48.25
2022-01-26 14:16:50.421 | DEBUG    | __main__:trials:24 - Trial = 5382/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.422 | DEBUG    | __main__:trials:29 - Trial = 5382/30000 | Total reward = 31.76
2022-01-26 14:16:50.425 | DEBUG    | __main__:trials:24 - Trial = 5383/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.426 | DEBUG    | __main__:trials:29 - Trial = 5383/30000 | Total reward = 34.09
2022-01-26 14:16:50.429 | DEBUG    | __main__:trials:24 - Trial = 5384/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.430 | DEBUG    | __main__:trials:29 - Trial = 5384/30000 | Total reward = 52.60
2022-01-26 14:16:50.433 | DEBUG    | __main__:trials:24 - Trial = 5385/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.434 | DEBUG    | __main__:trials:29 - Trial = 5385/30000 | Total reward = 49.56
2022-01-26 14:16:50.437 | DEBUG    | __main__:trials:26 - Trial = 5386/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.439 | DEBUG    | __main__:trials:29 - Trial = 5386/30000 | Total reward = 29.30
2022-01-26 14:16:50.442 | DEBUG    | __main__:trials:24 - Trial = 5387/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.444 | DEBUG    | __main__:trials:29 - Trial = 5387/30000 | Total reward = 47.54
2022-01-26 14:16:50.447 | DEBUG    | __main__:trials:24 - Trial = 5388/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.449 | DEBUG    | __main__:trials:29 - Trial = 5388/30000 | Total reward = 48.07
2022-01-26 14:16:50.452 | DEBUG    | __main__:trials:24 - Trial = 5389/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.454 | DEBUG    | __main__:trials:29 - Trial = 5389/30000 | Total reward = 47.99
2022-01-26 14:16:50.458 | DEBUG    | __main__:trials:24 - Trial = 5390/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.459 | DEBUG    | __main__:trials:29 - Trial = 5390/30000 | Total reward = 45.00
2022-01-26 14:16:50.463 | DEBUG    | __main__:trials:24 - Trial = 5391/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.464 | DEBUG    | __main__:trials:29 - Trial = 5391/30000 | Total reward = 34.26
2022-01-26 14:16:50.468 | DEBUG    | __main__:trials:24 - Trial = 5392/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.469 | DEBUG    | __main__:trials:29 - Trial = 5392/30000 | Total reward = 47.59
2022-01-26 14:16:50.473 | DEBUG    | __main__:trials:24 - Trial = 5393/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.474 | DEBUG    | __main__:trials:29 - Trial = 5393/30000 | Total reward = 50.56
2022-01-26 14:16:50.478 | DEBUG    | __main__:trials:24 - Trial = 5394/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.480 | DEBUG    | __main__:trials:29 - Trial = 5394/30000 | Total reward = 35.82
2022-01-26 14:16:50.484 | DEBUG    | __main__:trials:24 - Trial = 5395/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.485 | DEBUG    | __main__:trials:29 - Trial = 5395/30000 | Total reward = 54.68
2022-01-26 14:16:50.489 | DEBUG    | __main__:trials:24 - Trial = 5396/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.490 | DEBUG    | __main__:trials:29 - Trial = 5396/30000 | Total reward = 59.50
2022-01-26 14:16:50.494 | DEBUG    | __main__:trials:24 - Trial = 5397/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.494 | DEBUG    | __main__:trials:29 - Trial = 5397/30000 | Total reward = 28.35
2022-01-26 14:16:50.499 | DEBUG    | __main__:trials:24 - Trial = 5398/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.501 | DEBUG    | __main__:trials:29 - Trial = 5398/30000 | Total reward = 49.07
2022-01-26 14:16:50.504 | DEBUG    | __main__:trials:26 - Trial = 5399/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.505 | DEBUG    | __main__:trials:29 - Trial = 5399/30000 | Total reward = 22.03
2022-01-26 14:16:50.509 | DEBUG    | __main__:trials:24 - Trial = 5400/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.511 | DEBUG    | __main__:trials:29 - Trial = 5400/30000 | Total reward = 49.73
2022-01-26 14:16:50.515 | DEBUG    | __main__:trials:24 - Trial = 5401/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.516 | DEBUG    | __main__:trials:29 - Trial = 5401/30000 | Total reward = 47.74
2022-01-26 14:16:50.520 | DEBUG    | __main__:trials:24 - Trial = 5402/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.521 | DEBUG    | __main__:trials:29 - Trial = 5402/30000 | Total reward = 48.27
2022-01-26 14:16:50.526 | DEBUG    | __main__:trials:24 - Trial = 5403/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.527 | DEBUG    | __main__:trials:29 - Trial = 5403/30000 | Total reward = 47.21
2022-01-26 14:16:50.530 | DEBUG    | __main__:trials:24 - Trial = 5404/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.532 | DEBUG    | __main__:trials:29 - Trial = 5404/30000 | Total reward = 42.39
2022-01-26 14:16:50.535 | DEBUG    | __main__:trials:24 - Trial = 5405/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.537 | DEBUG    | __main__:trials:29 - Trial = 5405/30000 | Total reward = 61.16
2022-01-26 14:16:50.540 | DEBUG    | __main__:trials:24 - Trial = 5406/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.541 | DEBUG    | __main__:trials:29 - Trial = 5406/30000 | Total reward = 47.71
2022-01-26 14:16:50.544 | DEBUG    | __main__:trials:24 - Trial = 5407/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.546 | DEBUG    | __main__:trials:29 - Trial = 5407/30000 | Total reward = 46.70
2022-01-26 14:16:50.549 | DEBUG    | __main__:trials:24 - Trial = 5408/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.549 | DEBUG    | __main__:trials:29 - Trial = 5408/30000 | Total reward = 49.69
2022-01-26 14:16:50.554 | DEBUG    | __main__:trials:24 - Trial = 5409/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.555 | DEBUG    | __main__:trials:29 - Trial = 5409/30000 | Total reward = 49.63
2022-01-26 14:16:50.559 | DEBUG    | __main__:trials:24 - Trial = 5410/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.559 | DEBUG    | __main__:trials:29 - Trial = 5410/30000 | Total reward = 56.18
2022-01-26 14:16:50.564 | DEBUG    | __main__:trials:24 - Trial = 5411/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.565 | DEBUG    | __main__:trials:29 - Trial = 5411/30000 | Total reward = 45.84
2022-01-26 14:16:50.568 | DEBUG    | __main__:trials:24 - Trial = 5412/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.570 | DEBUG    | __main__:trials:29 - Trial = 5412/30000 | Total reward = 46.44
2022-01-26 14:16:50.573 | DEBUG    | __main__:trials:24 - Trial = 5413/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.574 | DEBUG    | __main__:trials:29 - Trial = 5413/30000 | Total reward = 50.18
2022-01-26 14:16:50.578 | DEBUG    | __main__:trials:24 - Trial = 5414/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.579 | DEBUG    | __main__:trials:29 - Trial = 5414/30000 | Total reward = 50.71
2022-01-26 14:16:50.582 | DEBUG    | __main__:trials:24 - Trial = 5415/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.584 | DEBUG    | __main__:trials:29 - Trial = 5415/30000 | Total reward = 45.19
2022-01-26 14:16:50.588 | DEBUG    | __main__:trials:24 - Trial = 5416/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.589 | DEBUG    | __main__:trials:29 - Trial = 5416/30000 | Total reward = 50.99
2022-01-26 14:16:50.593 | DEBUG    | __main__:trials:24 - Trial = 5417/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.594 | DEBUG    | __main__:trials:29 - Trial = 5417/30000 | Total reward = 48.07
2022-01-26 14:16:50.598 | DEBUG    | __main__:trials:24 - Trial = 5418/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.600 | DEBUG    | __main__:trials:29 - Trial = 5418/30000 | Total reward = 46.37
2022-01-26 14:16:50.602 | DEBUG    | __main__:trials:24 - Trial = 5419/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.604 | DEBUG    | __main__:trials:29 - Trial = 5419/30000 | Total reward = 43.43
2022-01-26 14:16:50.607 | DEBUG    | __main__:trials:24 - Trial = 5420/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.609 | DEBUG    | __main__:trials:29 - Trial = 5420/30000 | Total reward = 37.29
2022-01-26 14:16:50.612 | DEBUG    | __main__:trials:24 - Trial = 5421/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.614 | DEBUG    | __main__:trials:29 - Trial = 5421/30000 | Total reward = 51.72
2022-01-26 14:16:50.617 | DEBUG    | __main__:trials:26 - Trial = 5422/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.618 | DEBUG    | __main__:trials:29 - Trial = 5422/30000 | Total reward = 23.75
2022-01-26 14:16:50.622 | DEBUG    | __main__:trials:26 - Trial = 5423/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.623 | DEBUG    | __main__:trials:29 - Trial = 5423/30000 | Total reward = 27.44
2022-01-26 14:16:50.627 | DEBUG    | __main__:trials:24 - Trial = 5424/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.628 | DEBUG    | __main__:trials:29 - Trial = 5424/30000 | Total reward = 47.21
2022-01-26 14:16:50.631 | DEBUG    | __main__:trials:24 - Trial = 5425/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.633 | DEBUG    | __main__:trials:29 - Trial = 5425/30000 | Total reward = 45.46
2022-01-26 14:16:50.637 | DEBUG    | __main__:trials:24 - Trial = 5426/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.638 | DEBUG    | __main__:trials:29 - Trial = 5426/30000 | Total reward = 33.48
2022-01-26 14:16:50.642 | DEBUG    | __main__:trials:24 - Trial = 5427/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.642 | DEBUG    | __main__:trials:29 - Trial = 5427/30000 | Total reward = 45.25
2022-01-26 14:16:50.647 | DEBUG    | __main__:trials:24 - Trial = 5428/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.649 | DEBUG    | __main__:trials:29 - Trial = 5428/30000 | Total reward = 49.26
2022-01-26 14:16:50.652 | DEBUG    | __main__:trials:24 - Trial = 5429/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.653 | DEBUG    | __main__:trials:29 - Trial = 5429/30000 | Total reward = 56.99
2022-01-26 14:16:50.656 | DEBUG    | __main__:trials:24 - Trial = 5430/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.658 | DEBUG    | __main__:trials:29 - Trial = 5430/30000 | Total reward = 45.28
2022-01-26 14:16:50.661 | DEBUG    | __main__:trials:24 - Trial = 5431/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.662 | DEBUG    | __main__:trials:29 - Trial = 5431/30000 | Total reward = 47.38
2022-01-26 14:16:50.665 | DEBUG    | __main__:trials:24 - Trial = 5432/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.667 | DEBUG    | __main__:trials:29 - Trial = 5432/30000 | Total reward = 46.70
2022-01-26 14:16:50.670 | DEBUG    | __main__:trials:24 - Trial = 5433/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.671 | DEBUG    | __main__:trials:29 - Trial = 5433/30000 | Total reward = 48.07
2022-01-26 14:16:50.674 | DEBUG    | __main__:trials:24 - Trial = 5434/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.675 | DEBUG    | __main__:trials:29 - Trial = 5434/30000 | Total reward = 22.75
2022-01-26 14:16:50.678 | DEBUG    | __main__:trials:24 - Trial = 5435/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.680 | DEBUG    | __main__:trials:29 - Trial = 5435/30000 | Total reward = 46.45
2022-01-26 14:16:50.683 | DEBUG    | __main__:trials:24 - Trial = 5436/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.685 | DEBUG    | __main__:trials:29 - Trial = 5436/30000 | Total reward = 33.14
2022-01-26 14:16:50.688 | DEBUG    | __main__:trials:24 - Trial = 5437/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.690 | DEBUG    | __main__:trials:29 - Trial = 5437/30000 | Total reward = 33.75
2022-01-26 14:16:50.694 | DEBUG    | __main__:trials:24 - Trial = 5438/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.694 | DEBUG    | __main__:trials:29 - Trial = 5438/30000 | Total reward = 64.34
2022-01-26 14:16:50.698 | DEBUG    | __main__:trials:24 - Trial = 5439/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.700 | DEBUG    | __main__:trials:29 - Trial = 5439/30000 | Total reward = 35.13
2022-01-26 14:16:50.703 | DEBUG    | __main__:trials:24 - Trial = 5440/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.705 | DEBUG    | __main__:trials:29 - Trial = 5440/30000 | Total reward = 43.06
2022-01-26 14:16:50.709 | DEBUG    | __main__:trials:24 - Trial = 5441/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.709 | DEBUG    | __main__:trials:29 - Trial = 5441/30000 | Total reward = 43.80
2022-01-26 14:16:50.713 | DEBUG    | __main__:trials:24 - Trial = 5442/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.713 | DEBUG    | __main__:trials:29 - Trial = 5442/30000 | Total reward = 47.54
2022-01-26 14:16:50.717 | DEBUG    | __main__:trials:24 - Trial = 5443/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.718 | DEBUG    | __main__:trials:29 - Trial = 5443/30000 | Total reward = 46.58
2022-01-26 14:16:50.722 | DEBUG    | __main__:trials:24 - Trial = 5444/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.724 | DEBUG    | __main__:trials:29 - Trial = 5444/30000 | Total reward = 57.44
2022-01-26 14:16:50.727 | DEBUG    | __main__:trials:24 - Trial = 5445/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.729 | DEBUG    | __main__:trials:29 - Trial = 5445/30000 | Total reward = 45.24
2022-01-26 14:16:50.733 | DEBUG    | __main__:trials:24 - Trial = 5446/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.733 | DEBUG    | __main__:trials:29 - Trial = 5446/30000 | Total reward = 46.19
2022-01-26 14:16:50.737 | DEBUG    | __main__:trials:24 - Trial = 5447/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.737 | DEBUG    | __main__:trials:29 - Trial = 5447/30000 | Total reward = 43.06
2022-01-26 14:16:50.741 | DEBUG    | __main__:trials:24 - Trial = 5448/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.742 | DEBUG    | __main__:trials:29 - Trial = 5448/30000 | Total reward = 33.80
2022-01-26 14:16:50.746 | DEBUG    | __main__:trials:24 - Trial = 5449/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.748 | DEBUG    | __main__:trials:29 - Trial = 5449/30000 | Total reward = 43.96
2022-01-26 14:16:50.751 | DEBUG    | __main__:trials:24 - Trial = 5450/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.753 | DEBUG    | __main__:trials:29 - Trial = 5450/30000 | Total reward = 50.26
2022-01-26 14:16:50.756 | DEBUG    | __main__:trials:24 - Trial = 5451/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.758 | DEBUG    | __main__:trials:29 - Trial = 5451/30000 | Total reward = 57.18
2022-01-26 14:16:50.762 | DEBUG    | __main__:trials:24 - Trial = 5452/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.763 | DEBUG    | __main__:trials:29 - Trial = 5452/30000 | Total reward = 30.76
2022-01-26 14:16:50.767 | DEBUG    | __main__:trials:24 - Trial = 5453/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.768 | DEBUG    | __main__:trials:29 - Trial = 5453/30000 | Total reward = 46.29
2022-01-26 14:16:50.772 | DEBUG    | __main__:trials:24 - Trial = 5454/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.773 | DEBUG    | __main__:trials:29 - Trial = 5454/30000 | Total reward = 44.06
2022-01-26 14:16:50.776 | DEBUG    | __main__:trials:24 - Trial = 5455/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.778 | DEBUG    | __main__:trials:29 - Trial = 5455/30000 | Total reward = 40.81
2022-01-26 14:16:50.782 | DEBUG    | __main__:trials:24 - Trial = 5456/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.783 | DEBUG    | __main__:trials:29 - Trial = 5456/30000 | Total reward = 48.06
2022-01-26 14:16:50.787 | DEBUG    | __main__:trials:24 - Trial = 5457/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.787 | DEBUG    | __main__:trials:29 - Trial = 5457/30000 | Total reward = 56.73
2022-01-26 14:16:50.792 | DEBUG    | __main__:trials:24 - Trial = 5458/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.794 | DEBUG    | __main__:trials:29 - Trial = 5458/30000 | Total reward = 40.75
2022-01-26 14:16:50.797 | DEBUG    | __main__:trials:24 - Trial = 5459/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.798 | DEBUG    | __main__:trials:29 - Trial = 5459/30000 | Total reward = 44.84
2022-01-26 14:16:50.802 | DEBUG    | __main__:trials:24 - Trial = 5460/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.804 | DEBUG    | __main__:trials:29 - Trial = 5460/30000 | Total reward = 29.45
2022-01-26 14:16:50.807 | DEBUG    | __main__:trials:24 - Trial = 5461/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.808 | DEBUG    | __main__:trials:29 - Trial = 5461/30000 | Total reward = 45.32
2022-01-26 14:16:50.812 | DEBUG    | __main__:trials:24 - Trial = 5462/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.814 | DEBUG    | __main__:trials:29 - Trial = 5462/30000 | Total reward = 43.89
2022-01-26 14:16:50.817 | DEBUG    | __main__:trials:24 - Trial = 5463/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.818 | DEBUG    | __main__:trials:29 - Trial = 5463/30000 | Total reward = 55.97
2022-01-26 14:16:50.822 | DEBUG    | __main__:trials:24 - Trial = 5464/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.824 | DEBUG    | __main__:trials:29 - Trial = 5464/30000 | Total reward = 55.32
2022-01-26 14:16:50.827 | DEBUG    | __main__:trials:24 - Trial = 5465/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.828 | DEBUG    | __main__:trials:29 - Trial = 5465/30000 | Total reward = 43.70
2022-01-26 14:16:50.832 | DEBUG    | __main__:trials:24 - Trial = 5466/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.834 | DEBUG    | __main__:trials:29 - Trial = 5466/30000 | Total reward = 56.72
2022-01-26 14:16:50.837 | DEBUG    | __main__:trials:24 - Trial = 5467/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.839 | DEBUG    | __main__:trials:29 - Trial = 5467/30000 | Total reward = 51.29
2022-01-26 14:16:50.843 | DEBUG    | __main__:trials:24 - Trial = 5468/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.844 | DEBUG    | __main__:trials:29 - Trial = 5468/30000 | Total reward = 57.30
2022-01-26 14:16:50.848 | DEBUG    | __main__:trials:24 - Trial = 5469/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.850 | DEBUG    | __main__:trials:29 - Trial = 5469/30000 | Total reward = 48.01
2022-01-26 14:16:50.853 | DEBUG    | __main__:trials:24 - Trial = 5470/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.855 | DEBUG    | __main__:trials:29 - Trial = 5470/30000 | Total reward = 58.27
2022-01-26 14:16:50.859 | DEBUG    | __main__:trials:24 - Trial = 5471/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.860 | DEBUG    | __main__:trials:29 - Trial = 5471/30000 | Total reward = 41.09
2022-01-26 14:16:50.864 | DEBUG    | __main__:trials:24 - Trial = 5472/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.865 | DEBUG    | __main__:trials:29 - Trial = 5472/30000 | Total reward = 27.96
2022-01-26 14:16:50.869 | DEBUG    | __main__:trials:24 - Trial = 5473/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.870 | DEBUG    | __main__:trials:29 - Trial = 5473/30000 | Total reward = 49.96
2022-01-26 14:16:50.874 | DEBUG    | __main__:trials:24 - Trial = 5474/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.876 | DEBUG    | __main__:trials:29 - Trial = 5474/30000 | Total reward = 43.53
2022-01-26 14:16:50.878 | DEBUG    | __main__:trials:24 - Trial = 5475/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.880 | DEBUG    | __main__:trials:29 - Trial = 5475/30000 | Total reward = 50.14
2022-01-26 14:16:50.883 | DEBUG    | __main__:trials:24 - Trial = 5476/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.885 | DEBUG    | __main__:trials:29 - Trial = 5476/30000 | Total reward = 46.52
2022-01-26 14:16:50.888 | DEBUG    | __main__:trials:24 - Trial = 5477/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.890 | DEBUG    | __main__:trials:29 - Trial = 5477/30000 | Total reward = 48.99
2022-01-26 14:16:50.894 | DEBUG    | __main__:trials:24 - Trial = 5478/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.894 | DEBUG    | __main__:trials:29 - Trial = 5478/30000 | Total reward = 48.68
2022-01-26 14:16:50.898 | DEBUG    | __main__:trials:26 - Trial = 5479/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.899 | DEBUG    | __main__:trials:29 - Trial = 5479/30000 | Total reward = 22.45
2022-01-26 14:16:50.902 | DEBUG    | __main__:trials:24 - Trial = 5480/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.904 | DEBUG    | __main__:trials:29 - Trial = 5480/30000 | Total reward = 47.15
2022-01-26 14:16:50.908 | DEBUG    | __main__:trials:24 - Trial = 5481/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.910 | DEBUG    | __main__:trials:29 - Trial = 5481/30000 | Total reward = 42.86
2022-01-26 14:16:50.913 | DEBUG    | __main__:trials:24 - Trial = 5482/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.915 | DEBUG    | __main__:trials:29 - Trial = 5482/30000 | Total reward = 51.35
2022-01-26 14:16:50.919 | DEBUG    | __main__:trials:24 - Trial = 5483/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.919 | DEBUG    | __main__:trials:29 - Trial = 5483/30000 | Total reward = 43.64
2022-01-26 14:16:50.924 | DEBUG    | __main__:trials:24 - Trial = 5484/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.925 | DEBUG    | __main__:trials:29 - Trial = 5484/30000 | Total reward = 44.16
2022-01-26 14:16:50.929 | DEBUG    | __main__:trials:24 - Trial = 5485/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.931 | DEBUG    | __main__:trials:29 - Trial = 5485/30000 | Total reward = 46.10
2022-01-26 14:16:50.935 | DEBUG    | __main__:trials:24 - Trial = 5486/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.936 | DEBUG    | __main__:trials:29 - Trial = 5486/30000 | Total reward = 26.12
2022-01-26 14:16:50.940 | DEBUG    | __main__:trials:26 - Trial = 5487/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:50.941 | DEBUG    | __main__:trials:29 - Trial = 5487/30000 | Total reward = 36.55
2022-01-26 14:16:50.945 | DEBUG    | __main__:trials:24 - Trial = 5488/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.946 | DEBUG    | __main__:trials:29 - Trial = 5488/30000 | Total reward = 46.52
2022-01-26 14:16:50.951 | DEBUG    | __main__:trials:24 - Trial = 5489/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.952 | DEBUG    | __main__:trials:29 - Trial = 5489/30000 | Total reward = 38.52
2022-01-26 14:16:50.956 | DEBUG    | __main__:trials:24 - Trial = 5490/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.958 | DEBUG    | __main__:trials:29 - Trial = 5490/30000 | Total reward = 46.02
2022-01-26 14:16:50.962 | DEBUG    | __main__:trials:24 - Trial = 5491/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.963 | DEBUG    | __main__:trials:29 - Trial = 5491/30000 | Total reward = 45.61
2022-01-26 14:16:50.967 | DEBUG    | __main__:trials:24 - Trial = 5492/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.968 | DEBUG    | __main__:trials:29 - Trial = 5492/30000 | Total reward = 30.55
2022-01-26 14:16:50.971 | DEBUG    | __main__:trials:24 - Trial = 5493/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.972 | DEBUG    | __main__:trials:29 - Trial = 5493/30000 | Total reward = 28.28
2022-01-26 14:16:50.976 | DEBUG    | __main__:trials:24 - Trial = 5494/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.977 | DEBUG    | __main__:trials:29 - Trial = 5494/30000 | Total reward = 41.70
2022-01-26 14:16:50.980 | DEBUG    | __main__:trials:24 - Trial = 5495/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.982 | DEBUG    | __main__:trials:29 - Trial = 5495/30000 | Total reward = 49.07
2022-01-26 14:16:50.986 | DEBUG    | __main__:trials:24 - Trial = 5496/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.987 | DEBUG    | __main__:trials:29 - Trial = 5496/30000 | Total reward = 50.29
2022-01-26 14:16:50.991 | DEBUG    | __main__:trials:24 - Trial = 5497/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.991 | DEBUG    | __main__:trials:29 - Trial = 5497/30000 | Total reward = 45.93
2022-01-26 14:16:50.996 | DEBUG    | __main__:trials:24 - Trial = 5498/30000 | Max number of steps (20) reached
2022-01-26 14:16:50.996 | DEBUG    | __main__:trials:29 - Trial = 5498/30000 | Total reward = 43.15
2022-01-26 14:16:51.001 | DEBUG    | __main__:trials:24 - Trial = 5499/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.002 | DEBUG    | __main__:trials:29 - Trial = 5499/30000 | Total reward = 46.52
2022-01-26 14:16:51.006 | DEBUG    | __main__:trials:24 - Trial = 5500/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.008 | DEBUG    | __main__:trials:29 - Trial = 5500/30000 | Total reward = 44.08
2022-01-26 14:16:51.011 | DEBUG    | __main__:trials:24 - Trial = 5501/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.012 | DEBUG    | __main__:trials:29 - Trial = 5501/30000 | Total reward = 38.17
2022-01-26 14:16:51.015 | DEBUG    | __main__:trials:24 - Trial = 5502/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.018 | DEBUG    | __main__:trials:29 - Trial = 5502/30000 | Total reward = 31.27
2022-01-26 14:16:51.022 | DEBUG    | __main__:trials:24 - Trial = 5503/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.023 | DEBUG    | __main__:trials:29 - Trial = 5503/30000 | Total reward = 36.02
2022-01-26 14:16:51.027 | DEBUG    | __main__:trials:24 - Trial = 5504/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.029 | DEBUG    | __main__:trials:29 - Trial = 5504/30000 | Total reward = 17.01
2022-01-26 14:16:51.032 | DEBUG    | __main__:trials:24 - Trial = 5505/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.033 | DEBUG    | __main__:trials:29 - Trial = 5505/30000 | Total reward = 41.62
2022-01-26 14:16:51.037 | DEBUG    | __main__:trials:24 - Trial = 5506/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.038 | DEBUG    | __main__:trials:29 - Trial = 5506/30000 | Total reward = 43.32
2022-01-26 14:16:51.042 | DEBUG    | __main__:trials:24 - Trial = 5507/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.043 | DEBUG    | __main__:trials:29 - Trial = 5507/30000 | Total reward = 39.94
2022-01-26 14:16:51.047 | DEBUG    | __main__:trials:24 - Trial = 5508/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.049 | DEBUG    | __main__:trials:29 - Trial = 5508/30000 | Total reward = 51.37
2022-01-26 14:16:51.052 | DEBUG    | __main__:trials:24 - Trial = 5509/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.053 | DEBUG    | __main__:trials:29 - Trial = 5509/30000 | Total reward = 42.38
2022-01-26 14:16:51.058 | DEBUG    | __main__:trials:24 - Trial = 5510/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.058 | DEBUG    | __main__:trials:29 - Trial = 5510/30000 | Total reward = 48.17
2022-01-26 14:16:51.063 | DEBUG    | __main__:trials:24 - Trial = 5511/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.064 | DEBUG    | __main__:trials:29 - Trial = 5511/30000 | Total reward = 22.12
2022-01-26 14:16:51.068 | DEBUG    | __main__:trials:24 - Trial = 5512/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.068 | DEBUG    | __main__:trials:29 - Trial = 5512/30000 | Total reward = 32.22
2022-01-26 14:16:51.072 | DEBUG    | __main__:trials:24 - Trial = 5513/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.074 | DEBUG    | __main__:trials:29 - Trial = 5513/30000 | Total reward = 45.90
2022-01-26 14:16:51.077 | DEBUG    | __main__:trials:24 - Trial = 5514/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.079 | DEBUG    | __main__:trials:29 - Trial = 5514/30000 | Total reward = 41.53
2022-01-26 14:16:51.083 | DEBUG    | __main__:trials:26 - Trial = 5515/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.083 | DEBUG    | __main__:trials:29 - Trial = 5515/30000 | Total reward = 20.50
2022-01-26 14:16:51.087 | DEBUG    | __main__:trials:24 - Trial = 5516/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.089 | DEBUG    | __main__:trials:29 - Trial = 5516/30000 | Total reward = 42.45
2022-01-26 14:16:51.093 | DEBUG    | __main__:trials:24 - Trial = 5517/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.093 | DEBUG    | __main__:trials:29 - Trial = 5517/30000 | Total reward = 49.86
2022-01-26 14:16:51.097 | DEBUG    | __main__:trials:24 - Trial = 5518/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.099 | DEBUG    | __main__:trials:29 - Trial = 5518/30000 | Total reward = 48.09
2022-01-26 14:16:51.102 | DEBUG    | __main__:trials:24 - Trial = 5519/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.104 | DEBUG    | __main__:trials:29 - Trial = 5519/30000 | Total reward = 34.09
2022-01-26 14:16:51.107 | DEBUG    | __main__:trials:24 - Trial = 5520/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.109 | DEBUG    | __main__:trials:29 - Trial = 5520/30000 | Total reward = 44.82
2022-01-26 14:16:51.112 | DEBUG    | __main__:trials:24 - Trial = 5521/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.113 | DEBUG    | __main__:trials:29 - Trial = 5521/30000 | Total reward = 62.83
2022-01-26 14:16:51.117 | DEBUG    | __main__:trials:24 - Trial = 5522/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.118 | DEBUG    | __main__:trials:29 - Trial = 5522/30000 | Total reward = 50.75
2022-01-26 14:16:51.121 | DEBUG    | __main__:trials:24 - Trial = 5523/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.122 | DEBUG    | __main__:trials:29 - Trial = 5523/30000 | Total reward = 51.10
2022-01-26 14:16:51.126 | DEBUG    | __main__:trials:24 - Trial = 5524/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.126 | DEBUG    | __main__:trials:29 - Trial = 5524/30000 | Total reward = 46.96
2022-01-26 14:16:51.131 | DEBUG    | __main__:trials:24 - Trial = 5525/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.133 | DEBUG    | __main__:trials:29 - Trial = 5525/30000 | Total reward = 59.08
2022-01-26 14:16:51.136 | DEBUG    | __main__:trials:24 - Trial = 5526/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.138 | DEBUG    | __main__:trials:29 - Trial = 5526/30000 | Total reward = 42.70
2022-01-26 14:16:51.142 | DEBUG    | __main__:trials:24 - Trial = 5527/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.143 | DEBUG    | __main__:trials:29 - Trial = 5527/30000 | Total reward = 43.03
2022-01-26 14:16:51.147 | DEBUG    | __main__:trials:24 - Trial = 5528/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.148 | DEBUG    | __main__:trials:29 - Trial = 5528/30000 | Total reward = 46.01
2022-01-26 14:16:51.152 | DEBUG    | __main__:trials:24 - Trial = 5529/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.153 | DEBUG    | __main__:trials:29 - Trial = 5529/30000 | Total reward = 45.81
2022-01-26 14:16:51.157 | DEBUG    | __main__:trials:24 - Trial = 5530/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.157 | DEBUG    | __main__:trials:29 - Trial = 5530/30000 | Total reward = 44.85
2022-01-26 14:16:51.162 | DEBUG    | __main__:trials:24 - Trial = 5531/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.164 | DEBUG    | __main__:trials:29 - Trial = 5531/30000 | Total reward = 50.97
2022-01-26 14:16:51.167 | DEBUG    | __main__:trials:24 - Trial = 5532/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.168 | DEBUG    | __main__:trials:29 - Trial = 5532/30000 | Total reward = 44.02
2022-01-26 14:16:51.171 | DEBUG    | __main__:trials:26 - Trial = 5533/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.173 | DEBUG    | __main__:trials:29 - Trial = 5533/30000 | Total reward = 6.70
2022-01-26 14:16:51.175 | DEBUG    | __main__:trials:26 - Trial = 5534/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.177 | DEBUG    | __main__:trials:29 - Trial = 5534/30000 | Total reward = 21.53
2022-01-26 14:16:51.180 | DEBUG    | __main__:trials:26 - Trial = 5535/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.182 | DEBUG    | __main__:trials:29 - Trial = 5535/30000 | Total reward = 16.07
2022-01-26 14:16:51.186 | DEBUG    | __main__:trials:24 - Trial = 5536/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.186 | DEBUG    | __main__:trials:29 - Trial = 5536/30000 | Total reward = 51.95
2022-01-26 14:16:51.190 | DEBUG    | __main__:trials:24 - Trial = 5537/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.192 | DEBUG    | __main__:trials:29 - Trial = 5537/30000 | Total reward = 47.72
2022-01-26 14:16:51.196 | DEBUG    | __main__:trials:24 - Trial = 5538/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.198 | DEBUG    | __main__:trials:29 - Trial = 5538/30000 | Total reward = 42.83
2022-01-26 14:16:51.201 | DEBUG    | __main__:trials:24 - Trial = 5539/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.203 | DEBUG    | __main__:trials:29 - Trial = 5539/30000 | Total reward = 46.00
2022-01-26 14:16:51.206 | DEBUG    | __main__:trials:24 - Trial = 5540/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.208 | DEBUG    | __main__:trials:29 - Trial = 5540/30000 | Total reward = 14.01
2022-01-26 14:16:51.211 | DEBUG    | __main__:trials:24 - Trial = 5541/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.212 | DEBUG    | __main__:trials:29 - Trial = 5541/30000 | Total reward = 44.06
2022-01-26 14:16:51.216 | DEBUG    | __main__:trials:24 - Trial = 5542/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.218 | DEBUG    | __main__:trials:29 - Trial = 5542/30000 | Total reward = 45.34
2022-01-26 14:16:51.221 | DEBUG    | __main__:trials:24 - Trial = 5543/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.223 | DEBUG    | __main__:trials:29 - Trial = 5543/30000 | Total reward = 35.80
2022-01-26 14:16:51.226 | DEBUG    | __main__:trials:24 - Trial = 5544/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.228 | DEBUG    | __main__:trials:29 - Trial = 5544/30000 | Total reward = 42.67
2022-01-26 14:16:51.231 | DEBUG    | __main__:trials:24 - Trial = 5545/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.233 | DEBUG    | __main__:trials:29 - Trial = 5545/30000 | Total reward = 50.86
2022-01-26 14:16:51.236 | DEBUG    | __main__:trials:24 - Trial = 5546/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.237 | DEBUG    | __main__:trials:29 - Trial = 5546/30000 | Total reward = 44.65
2022-01-26 14:16:51.241 | DEBUG    | __main__:trials:24 - Trial = 5547/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.241 | DEBUG    | __main__:trials:29 - Trial = 5547/30000 | Total reward = 44.37
2022-01-26 14:16:51.244 | DEBUG    | __main__:trials:26 - Trial = 5548/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.245 | DEBUG    | __main__:trials:29 - Trial = 5548/30000 | Total reward = 23.62
2022-01-26 14:16:51.249 | DEBUG    | __main__:trials:24 - Trial = 5549/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.250 | DEBUG    | __main__:trials:29 - Trial = 5549/30000 | Total reward = 41.60
2022-01-26 14:16:51.397 | DEBUG    | __main__:trials:24 - Trial = 5550/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.398 | DEBUG    | __main__:trials:29 - Trial = 5550/30000 | Total reward = 47.70
2022-01-26 14:16:51.402 | DEBUG    | __main__:trials:24 - Trial = 5551/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.404 | DEBUG    | __main__:trials:29 - Trial = 5551/30000 | Total reward = 48.25
2022-01-26 14:16:51.408 | DEBUG    | __main__:trials:24 - Trial = 5552/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.409 | DEBUG    | __main__:trials:29 - Trial = 5552/30000 | Total reward = 42.93
2022-01-26 14:16:51.412 | DEBUG    | __main__:trials:24 - Trial = 5553/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.414 | DEBUG    | __main__:trials:29 - Trial = 5553/30000 | Total reward = 46.20
2022-01-26 14:16:51.417 | DEBUG    | __main__:trials:24 - Trial = 5554/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.419 | DEBUG    | __main__:trials:29 - Trial = 5554/30000 | Total reward = 47.54
2022-01-26 14:16:51.421 | DEBUG    | __main__:trials:24 - Trial = 5555/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.423 | DEBUG    | __main__:trials:29 - Trial = 5555/30000 | Total reward = 42.76
2022-01-26 14:16:51.427 | DEBUG    | __main__:trials:26 - Trial = 5556/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.428 | DEBUG    | __main__:trials:29 - Trial = 5556/30000 | Total reward = 37.53
2022-01-26 14:16:51.432 | DEBUG    | __main__:trials:24 - Trial = 5557/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.433 | DEBUG    | __main__:trials:29 - Trial = 5557/30000 | Total reward = 41.35
2022-01-26 14:16:51.437 | DEBUG    | __main__:trials:24 - Trial = 5558/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.438 | DEBUG    | __main__:trials:29 - Trial = 5558/30000 | Total reward = 45.05
2022-01-26 14:16:51.441 | DEBUG    | __main__:trials:24 - Trial = 5559/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.442 | DEBUG    | __main__:trials:29 - Trial = 5559/30000 | Total reward = 38.52
2022-01-26 14:16:51.445 | DEBUG    | __main__:trials:24 - Trial = 5560/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.447 | DEBUG    | __main__:trials:29 - Trial = 5560/30000 | Total reward = 54.91
2022-01-26 14:16:51.450 | DEBUG    | __main__:trials:24 - Trial = 5561/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.452 | DEBUG    | __main__:trials:29 - Trial = 5561/30000 | Total reward = 32.31
2022-01-26 14:16:51.455 | DEBUG    | __main__:trials:24 - Trial = 5562/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.457 | DEBUG    | __main__:trials:29 - Trial = 5562/30000 | Total reward = 46.70
2022-01-26 14:16:51.460 | DEBUG    | __main__:trials:24 - Trial = 5563/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.461 | DEBUG    | __main__:trials:29 - Trial = 5563/30000 | Total reward = 47.11
2022-01-26 14:16:51.465 | DEBUG    | __main__:trials:24 - Trial = 5564/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.466 | DEBUG    | __main__:trials:29 - Trial = 5564/30000 | Total reward = 53.74
2022-01-26 14:16:51.469 | DEBUG    | __main__:trials:24 - Trial = 5565/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.471 | DEBUG    | __main__:trials:29 - Trial = 5565/30000 | Total reward = 51.91
2022-01-26 14:16:51.475 | DEBUG    | __main__:trials:24 - Trial = 5566/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.476 | DEBUG    | __main__:trials:29 - Trial = 5566/30000 | Total reward = 39.30
2022-01-26 14:16:51.479 | DEBUG    | __main__:trials:24 - Trial = 5567/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.481 | DEBUG    | __main__:trials:29 - Trial = 5567/30000 | Total reward = 46.12
2022-01-26 14:16:51.484 | DEBUG    | __main__:trials:24 - Trial = 5568/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.486 | DEBUG    | __main__:trials:29 - Trial = 5568/30000 | Total reward = 44.64
2022-01-26 14:16:51.489 | DEBUG    | __main__:trials:24 - Trial = 5569/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.490 | DEBUG    | __main__:trials:29 - Trial = 5569/30000 | Total reward = 52.87
2022-01-26 14:16:51.493 | DEBUG    | __main__:trials:24 - Trial = 5570/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.495 | DEBUG    | __main__:trials:29 - Trial = 5570/30000 | Total reward = 33.63
2022-01-26 14:16:51.497 | DEBUG    | __main__:trials:24 - Trial = 5571/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.499 | DEBUG    | __main__:trials:29 - Trial = 5571/30000 | Total reward = 14.09
2022-01-26 14:16:51.502 | DEBUG    | __main__:trials:24 - Trial = 5572/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.504 | DEBUG    | __main__:trials:29 - Trial = 5572/30000 | Total reward = 36.31
2022-01-26 14:16:51.507 | DEBUG    | __main__:trials:24 - Trial = 5573/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.508 | DEBUG    | __main__:trials:29 - Trial = 5573/30000 | Total reward = 46.52
2022-01-26 14:16:51.512 | DEBUG    | __main__:trials:24 - Trial = 5574/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.514 | DEBUG    | __main__:trials:29 - Trial = 5574/30000 | Total reward = 47.51
2022-01-26 14:16:51.518 | DEBUG    | __main__:trials:24 - Trial = 5575/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.519 | DEBUG    | __main__:trials:29 - Trial = 5575/30000 | Total reward = 54.45
2022-01-26 14:16:51.523 | DEBUG    | __main__:trials:24 - Trial = 5576/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.524 | DEBUG    | __main__:trials:29 - Trial = 5576/30000 | Total reward = 43.88
2022-01-26 14:16:51.528 | DEBUG    | __main__:trials:24 - Trial = 5577/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.530 | DEBUG    | __main__:trials:29 - Trial = 5577/30000 | Total reward = 52.01
2022-01-26 14:16:51.533 | DEBUG    | __main__:trials:24 - Trial = 5578/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.534 | DEBUG    | __main__:trials:29 - Trial = 5578/30000 | Total reward = 43.88
2022-01-26 14:16:51.539 | DEBUG    | __main__:trials:24 - Trial = 5579/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.539 | DEBUG    | __main__:trials:29 - Trial = 5579/30000 | Total reward = 44.61
2022-01-26 14:16:51.544 | DEBUG    | __main__:trials:24 - Trial = 5580/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.545 | DEBUG    | __main__:trials:29 - Trial = 5580/30000 | Total reward = 49.00
2022-01-26 14:16:51.548 | DEBUG    | __main__:trials:24 - Trial = 5581/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.550 | DEBUG    | __main__:trials:29 - Trial = 5581/30000 | Total reward = 42.82
2022-01-26 14:16:51.553 | DEBUG    | __main__:trials:24 - Trial = 5582/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.554 | DEBUG    | __main__:trials:29 - Trial = 5582/30000 | Total reward = 42.65
2022-01-26 14:16:51.558 | DEBUG    | __main__:trials:24 - Trial = 5583/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.559 | DEBUG    | __main__:trials:29 - Trial = 5583/30000 | Total reward = 42.81
2022-01-26 14:16:51.563 | DEBUG    | __main__:trials:24 - Trial = 5584/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.564 | DEBUG    | __main__:trials:29 - Trial = 5584/30000 | Total reward = 46.85
2022-01-26 14:16:51.568 | DEBUG    | __main__:trials:24 - Trial = 5585/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.569 | DEBUG    | __main__:trials:29 - Trial = 5585/30000 | Total reward = 44.77
2022-01-26 14:16:51.572 | DEBUG    | __main__:trials:24 - Trial = 5586/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.574 | DEBUG    | __main__:trials:29 - Trial = 5586/30000 | Total reward = 36.62
2022-01-26 14:16:51.578 | DEBUG    | __main__:trials:24 - Trial = 5587/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.578 | DEBUG    | __main__:trials:29 - Trial = 5587/30000 | Total reward = 46.01
2022-01-26 14:16:51.582 | DEBUG    | __main__:trials:24 - Trial = 5588/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.583 | DEBUG    | __main__:trials:29 - Trial = 5588/30000 | Total reward = 57.56
2022-01-26 14:16:51.587 | DEBUG    | __main__:trials:24 - Trial = 5589/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.588 | DEBUG    | __main__:trials:29 - Trial = 5589/30000 | Total reward = 46.29
2022-01-26 14:16:51.592 | DEBUG    | __main__:trials:24 - Trial = 5590/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.593 | DEBUG    | __main__:trials:29 - Trial = 5590/30000 | Total reward = 46.98
2022-01-26 14:16:51.596 | DEBUG    | __main__:trials:24 - Trial = 5591/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.597 | DEBUG    | __main__:trials:29 - Trial = 5591/30000 | Total reward = 45.02
2022-01-26 14:16:51.600 | DEBUG    | __main__:trials:24 - Trial = 5592/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.602 | DEBUG    | __main__:trials:29 - Trial = 5592/30000 | Total reward = 43.98
2022-01-26 14:16:51.606 | DEBUG    | __main__:trials:24 - Trial = 5593/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.606 | DEBUG    | __main__:trials:29 - Trial = 5593/30000 | Total reward = 53.00
2022-01-26 14:16:51.611 | DEBUG    | __main__:trials:24 - Trial = 5594/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.612 | DEBUG    | __main__:trials:29 - Trial = 5594/30000 | Total reward = 47.53
2022-01-26 14:16:51.616 | DEBUG    | __main__:trials:24 - Trial = 5595/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.616 | DEBUG    | __main__:trials:29 - Trial = 5595/30000 | Total reward = 41.29
2022-01-26 14:16:51.620 | DEBUG    | __main__:trials:24 - Trial = 5596/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.622 | DEBUG    | __main__:trials:29 - Trial = 5596/30000 | Total reward = 46.51
2022-01-26 14:16:51.626 | DEBUG    | __main__:trials:24 - Trial = 5597/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.626 | DEBUG    | __main__:trials:29 - Trial = 5597/30000 | Total reward = 50.16
2022-01-26 14:16:51.631 | DEBUG    | __main__:trials:24 - Trial = 5598/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.631 | DEBUG    | __main__:trials:29 - Trial = 5598/30000 | Total reward = 56.36
2022-01-26 14:16:51.636 | DEBUG    | __main__:trials:24 - Trial = 5599/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.637 | DEBUG    | __main__:trials:29 - Trial = 5599/30000 | Total reward = 53.98
2022-01-26 14:16:51.641 | DEBUG    | __main__:trials:24 - Trial = 5600/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.643 | DEBUG    | __main__:trials:29 - Trial = 5600/30000 | Total reward = 30.70
2022-01-26 14:16:51.646 | DEBUG    | __main__:trials:24 - Trial = 5601/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.647 | DEBUG    | __main__:trials:29 - Trial = 5601/30000 | Total reward = 42.58
2022-01-26 14:16:51.651 | DEBUG    | __main__:trials:24 - Trial = 5602/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.652 | DEBUG    | __main__:trials:29 - Trial = 5602/30000 | Total reward = 46.50
2022-01-26 14:16:51.655 | DEBUG    | __main__:trials:24 - Trial = 5603/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.657 | DEBUG    | __main__:trials:29 - Trial = 5603/30000 | Total reward = 40.08
2022-01-26 14:16:51.661 | DEBUG    | __main__:trials:24 - Trial = 5604/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.662 | DEBUG    | __main__:trials:29 - Trial = 5604/30000 | Total reward = 49.24
2022-01-26 14:16:51.665 | DEBUG    | __main__:trials:24 - Trial = 5605/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.666 | DEBUG    | __main__:trials:29 - Trial = 5605/30000 | Total reward = 49.79
2022-01-26 14:16:51.669 | DEBUG    | __main__:trials:24 - Trial = 5606/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.670 | DEBUG    | __main__:trials:29 - Trial = 5606/30000 | Total reward = 49.48
2022-01-26 14:16:51.674 | DEBUG    | __main__:trials:24 - Trial = 5607/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.674 | DEBUG    | __main__:trials:29 - Trial = 5607/30000 | Total reward = 43.59
2022-01-26 14:16:51.678 | DEBUG    | __main__:trials:24 - Trial = 5608/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.680 | DEBUG    | __main__:trials:29 - Trial = 5608/30000 | Total reward = 49.39
2022-01-26 14:16:51.683 | DEBUG    | __main__:trials:24 - Trial = 5609/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.684 | DEBUG    | __main__:trials:29 - Trial = 5609/30000 | Total reward = 50.73
2022-01-26 14:16:51.688 | DEBUG    | __main__:trials:24 - Trial = 5610/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.689 | DEBUG    | __main__:trials:29 - Trial = 5610/30000 | Total reward = 57.83
2022-01-26 14:16:51.693 | DEBUG    | __main__:trials:24 - Trial = 5611/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.694 | DEBUG    | __main__:trials:29 - Trial = 5611/30000 | Total reward = 46.34
2022-01-26 14:16:51.698 | DEBUG    | __main__:trials:24 - Trial = 5612/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.699 | DEBUG    | __main__:trials:29 - Trial = 5612/30000 | Total reward = 29.03
2022-01-26 14:16:51.703 | DEBUG    | __main__:trials:24 - Trial = 5613/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.704 | DEBUG    | __main__:trials:29 - Trial = 5613/30000 | Total reward = 49.52
2022-01-26 14:16:51.708 | DEBUG    | __main__:trials:24 - Trial = 5614/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.708 | DEBUG    | __main__:trials:29 - Trial = 5614/30000 | Total reward = 46.28
2022-01-26 14:16:51.712 | DEBUG    | __main__:trials:24 - Trial = 5615/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.714 | DEBUG    | __main__:trials:29 - Trial = 5615/30000 | Total reward = 25.75
2022-01-26 14:16:51.717 | DEBUG    | __main__:trials:24 - Trial = 5616/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.718 | DEBUG    | __main__:trials:29 - Trial = 5616/30000 | Total reward = 49.22
2022-01-26 14:16:51.721 | DEBUG    | __main__:trials:24 - Trial = 5617/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.722 | DEBUG    | __main__:trials:29 - Trial = 5617/30000 | Total reward = 40.42
2022-01-26 14:16:51.726 | DEBUG    | __main__:trials:24 - Trial = 5618/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.727 | DEBUG    | __main__:trials:29 - Trial = 5618/30000 | Total reward = 49.07
2022-01-26 14:16:51.731 | DEBUG    | __main__:trials:24 - Trial = 5619/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.732 | DEBUG    | __main__:trials:29 - Trial = 5619/30000 | Total reward = 49.47
2022-01-26 14:16:51.735 | DEBUG    | __main__:trials:24 - Trial = 5620/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.736 | DEBUG    | __main__:trials:29 - Trial = 5620/30000 | Total reward = 48.90
2022-01-26 14:16:51.740 | DEBUG    | __main__:trials:24 - Trial = 5621/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.740 | DEBUG    | __main__:trials:29 - Trial = 5621/30000 | Total reward = 53.42
2022-01-26 14:16:51.744 | DEBUG    | __main__:trials:24 - Trial = 5622/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.744 | DEBUG    | __main__:trials:29 - Trial = 5622/30000 | Total reward = 51.13
2022-01-26 14:16:51.748 | DEBUG    | __main__:trials:24 - Trial = 5623/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.750 | DEBUG    | __main__:trials:29 - Trial = 5623/30000 | Total reward = 51.74
2022-01-26 14:16:51.753 | DEBUG    | __main__:trials:24 - Trial = 5624/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.754 | DEBUG    | __main__:trials:29 - Trial = 5624/30000 | Total reward = 47.70
2022-01-26 14:16:51.758 | DEBUG    | __main__:trials:24 - Trial = 5625/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.759 | DEBUG    | __main__:trials:29 - Trial = 5625/30000 | Total reward = 49.42
2022-01-26 14:16:51.762 | DEBUG    | __main__:trials:26 - Trial = 5626/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.763 | DEBUG    | __main__:trials:29 - Trial = 5626/30000 | Total reward = 20.45
2022-01-26 14:16:51.767 | DEBUG    | __main__:trials:24 - Trial = 5627/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.768 | DEBUG    | __main__:trials:29 - Trial = 5627/30000 | Total reward = 49.93
2022-01-26 14:16:51.772 | DEBUG    | __main__:trials:24 - Trial = 5628/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.772 | DEBUG    | __main__:trials:29 - Trial = 5628/30000 | Total reward = 51.73
2022-01-26 14:16:51.776 | DEBUG    | __main__:trials:24 - Trial = 5629/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.777 | DEBUG    | __main__:trials:29 - Trial = 5629/30000 | Total reward = 40.57
2022-01-26 14:16:51.780 | DEBUG    | __main__:trials:24 - Trial = 5630/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.782 | DEBUG    | __main__:trials:29 - Trial = 5630/30000 | Total reward = 49.96
2022-01-26 14:16:51.785 | DEBUG    | __main__:trials:24 - Trial = 5631/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.785 | DEBUG    | __main__:trials:29 - Trial = 5631/30000 | Total reward = 48.53
2022-01-26 14:16:51.789 | DEBUG    | __main__:trials:24 - Trial = 5632/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.790 | DEBUG    | __main__:trials:29 - Trial = 5632/30000 | Total reward = 50.86
2022-01-26 14:16:51.794 | DEBUG    | __main__:trials:24 - Trial = 5633/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.795 | DEBUG    | __main__:trials:29 - Trial = 5633/30000 | Total reward = 52.22
2022-01-26 14:16:51.798 | DEBUG    | __main__:trials:24 - Trial = 5634/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.800 | DEBUG    | __main__:trials:29 - Trial = 5634/30000 | Total reward = 48.27
2022-01-26 14:16:51.804 | DEBUG    | __main__:trials:24 - Trial = 5635/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.805 | DEBUG    | __main__:trials:29 - Trial = 5635/30000 | Total reward = 17.92
2022-01-26 14:16:51.809 | DEBUG    | __main__:trials:24 - Trial = 5636/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.810 | DEBUG    | __main__:trials:29 - Trial = 5636/30000 | Total reward = 37.02
2022-01-26 14:16:51.814 | DEBUG    | __main__:trials:24 - Trial = 5637/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.814 | DEBUG    | __main__:trials:29 - Trial = 5637/30000 | Total reward = 19.55
2022-01-26 14:16:51.819 | DEBUG    | __main__:trials:24 - Trial = 5638/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.820 | DEBUG    | __main__:trials:29 - Trial = 5638/30000 | Total reward = 48.56
2022-01-26 14:16:51.823 | DEBUG    | __main__:trials:24 - Trial = 5639/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.825 | DEBUG    | __main__:trials:29 - Trial = 5639/30000 | Total reward = 43.70
2022-01-26 14:16:51.829 | DEBUG    | __main__:trials:24 - Trial = 5640/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.829 | DEBUG    | __main__:trials:29 - Trial = 5640/30000 | Total reward = 51.32
2022-01-26 14:16:51.833 | DEBUG    | __main__:trials:24 - Trial = 5641/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.834 | DEBUG    | __main__:trials:29 - Trial = 5641/30000 | Total reward = 46.40
2022-01-26 14:16:51.838 | DEBUG    | __main__:trials:24 - Trial = 5642/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.840 | DEBUG    | __main__:trials:29 - Trial = 5642/30000 | Total reward = 49.52
2022-01-26 14:16:51.843 | DEBUG    | __main__:trials:24 - Trial = 5643/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.845 | DEBUG    | __main__:trials:29 - Trial = 5643/30000 | Total reward = 55.23
2022-01-26 14:16:51.848 | DEBUG    | __main__:trials:24 - Trial = 5644/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.850 | DEBUG    | __main__:trials:29 - Trial = 5644/30000 | Total reward = 51.53
2022-01-26 14:16:51.853 | DEBUG    | __main__:trials:24 - Trial = 5645/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.854 | DEBUG    | __main__:trials:29 - Trial = 5645/30000 | Total reward = 49.49
2022-01-26 14:16:51.859 | DEBUG    | __main__:trials:24 - Trial = 5646/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.860 | DEBUG    | __main__:trials:29 - Trial = 5646/30000 | Total reward = 53.20
2022-01-26 14:16:51.863 | DEBUG    | __main__:trials:24 - Trial = 5647/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.865 | DEBUG    | __main__:trials:29 - Trial = 5647/30000 | Total reward = 34.58
2022-01-26 14:16:51.868 | DEBUG    | __main__:trials:24 - Trial = 5648/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.870 | DEBUG    | __main__:trials:29 - Trial = 5648/30000 | Total reward = 48.77
2022-01-26 14:16:51.873 | DEBUG    | __main__:trials:24 - Trial = 5649/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.875 | DEBUG    | __main__:trials:29 - Trial = 5649/30000 | Total reward = 48.02
2022-01-26 14:16:51.879 | DEBUG    | __main__:trials:24 - Trial = 5650/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.879 | DEBUG    | __main__:trials:29 - Trial = 5650/30000 | Total reward = 29.20
2022-01-26 14:16:51.884 | DEBUG    | __main__:trials:24 - Trial = 5651/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.884 | DEBUG    | __main__:trials:29 - Trial = 5651/30000 | Total reward = 47.22
2022-01-26 14:16:51.888 | DEBUG    | __main__:trials:24 - Trial = 5652/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.890 | DEBUG    | __main__:trials:29 - Trial = 5652/30000 | Total reward = 28.15
2022-01-26 14:16:51.894 | DEBUG    | __main__:trials:24 - Trial = 5653/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.894 | DEBUG    | __main__:trials:29 - Trial = 5653/30000 | Total reward = 51.32
2022-01-26 14:16:51.899 | DEBUG    | __main__:trials:24 - Trial = 5654/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.900 | DEBUG    | __main__:trials:29 - Trial = 5654/30000 | Total reward = 35.03
2022-01-26 14:16:51.904 | DEBUG    | __main__:trials:24 - Trial = 5655/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.906 | DEBUG    | __main__:trials:29 - Trial = 5655/30000 | Total reward = 47.65
2022-01-26 14:16:51.909 | DEBUG    | __main__:trials:24 - Trial = 5656/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.911 | DEBUG    | __main__:trials:29 - Trial = 5656/30000 | Total reward = 23.50
2022-01-26 14:16:51.914 | DEBUG    | __main__:trials:24 - Trial = 5657/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.916 | DEBUG    | __main__:trials:29 - Trial = 5657/30000 | Total reward = 45.30
2022-01-26 14:16:51.919 | DEBUG    | __main__:trials:24 - Trial = 5658/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.921 | DEBUG    | __main__:trials:29 - Trial = 5658/30000 | Total reward = 32.04
2022-01-26 14:16:51.925 | DEBUG    | __main__:trials:24 - Trial = 5659/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.926 | DEBUG    | __main__:trials:29 - Trial = 5659/30000 | Total reward = 50.47
2022-01-26 14:16:51.930 | DEBUG    | __main__:trials:26 - Trial = 5660/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.931 | DEBUG    | __main__:trials:29 - Trial = 5660/30000 | Total reward = 27.90
2022-01-26 14:16:51.934 | DEBUG    | __main__:trials:24 - Trial = 5661/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.936 | DEBUG    | __main__:trials:29 - Trial = 5661/30000 | Total reward = 55.06
2022-01-26 14:16:51.938 | DEBUG    | __main__:trials:26 - Trial = 5662/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.939 | DEBUG    | __main__:trials:29 - Trial = 5662/30000 | Total reward = 21.47
2022-01-26 14:16:51.943 | DEBUG    | __main__:trials:24 - Trial = 5663/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.945 | DEBUG    | __main__:trials:29 - Trial = 5663/30000 | Total reward = 42.49
2022-01-26 14:16:51.948 | DEBUG    | __main__:trials:24 - Trial = 5664/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.950 | DEBUG    | __main__:trials:29 - Trial = 5664/30000 | Total reward = 55.57
2022-01-26 14:16:51.953 | DEBUG    | __main__:trials:24 - Trial = 5665/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.954 | DEBUG    | __main__:trials:29 - Trial = 5665/30000 | Total reward = 51.54
2022-01-26 14:16:51.959 | DEBUG    | __main__:trials:24 - Trial = 5666/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.960 | DEBUG    | __main__:trials:29 - Trial = 5666/30000 | Total reward = 55.92
2022-01-26 14:16:51.964 | DEBUG    | __main__:trials:24 - Trial = 5667/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.965 | DEBUG    | __main__:trials:29 - Trial = 5667/30000 | Total reward = 47.36
2022-01-26 14:16:51.968 | DEBUG    | __main__:trials:24 - Trial = 5668/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.970 | DEBUG    | __main__:trials:29 - Trial = 5668/30000 | Total reward = 46.44
2022-01-26 14:16:51.973 | DEBUG    | __main__:trials:24 - Trial = 5669/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.975 | DEBUG    | __main__:trials:29 - Trial = 5669/30000 | Total reward = 52.78
2022-01-26 14:16:51.977 | DEBUG    | __main__:trials:26 - Trial = 5670/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:51.979 | DEBUG    | __main__:trials:29 - Trial = 5670/30000 | Total reward = 17.48
2022-01-26 14:16:51.983 | DEBUG    | __main__:trials:24 - Trial = 5671/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.984 | DEBUG    | __main__:trials:29 - Trial = 5671/30000 | Total reward = 39.60
2022-01-26 14:16:51.988 | DEBUG    | __main__:trials:24 - Trial = 5672/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.989 | DEBUG    | __main__:trials:29 - Trial = 5672/30000 | Total reward = 43.78
2022-01-26 14:16:51.993 | DEBUG    | __main__:trials:24 - Trial = 5673/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.993 | DEBUG    | __main__:trials:29 - Trial = 5673/30000 | Total reward = 52.88
2022-01-26 14:16:51.998 | DEBUG    | __main__:trials:24 - Trial = 5674/30000 | Max number of steps (20) reached
2022-01-26 14:16:51.999 | DEBUG    | __main__:trials:29 - Trial = 5674/30000 | Total reward = 62.64
2022-01-26 14:16:52.003 | DEBUG    | __main__:trials:24 - Trial = 5675/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.004 | DEBUG    | __main__:trials:29 - Trial = 5675/30000 | Total reward = 50.58
2022-01-26 14:16:52.008 | DEBUG    | __main__:trials:24 - Trial = 5676/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.009 | DEBUG    | __main__:trials:29 - Trial = 5676/30000 | Total reward = 50.89
2022-01-26 14:16:52.013 | DEBUG    | __main__:trials:24 - Trial = 5677/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.015 | DEBUG    | __main__:trials:29 - Trial = 5677/30000 | Total reward = 45.37
2022-01-26 14:16:52.018 | DEBUG    | __main__:trials:24 - Trial = 5678/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.019 | DEBUG    | __main__:trials:29 - Trial = 5678/30000 | Total reward = 49.27
2022-01-26 14:16:52.023 | DEBUG    | __main__:trials:24 - Trial = 5679/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.025 | DEBUG    | __main__:trials:29 - Trial = 5679/30000 | Total reward = 48.43
2022-01-26 14:16:52.028 | DEBUG    | __main__:trials:24 - Trial = 5680/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.030 | DEBUG    | __main__:trials:29 - Trial = 5680/30000 | Total reward = 48.09
2022-01-26 14:16:52.033 | DEBUG    | __main__:trials:24 - Trial = 5681/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.034 | DEBUG    | __main__:trials:29 - Trial = 5681/30000 | Total reward = 50.57
2022-01-26 14:16:52.038 | DEBUG    | __main__:trials:24 - Trial = 5682/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.039 | DEBUG    | __main__:trials:29 - Trial = 5682/30000 | Total reward = 51.70
2022-01-26 14:16:52.044 | DEBUG    | __main__:trials:24 - Trial = 5683/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.045 | DEBUG    | __main__:trials:29 - Trial = 5683/30000 | Total reward = 51.32
2022-01-26 14:16:52.049 | DEBUG    | __main__:trials:24 - Trial = 5684/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.051 | DEBUG    | __main__:trials:29 - Trial = 5684/30000 | Total reward = 59.17
2022-01-26 14:16:52.055 | DEBUG    | __main__:trials:24 - Trial = 5685/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.056 | DEBUG    | __main__:trials:29 - Trial = 5685/30000 | Total reward = 51.73
2022-01-26 14:16:52.060 | DEBUG    | __main__:trials:24 - Trial = 5686/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.061 | DEBUG    | __main__:trials:29 - Trial = 5686/30000 | Total reward = 49.64
2022-01-26 14:16:52.065 | DEBUG    | __main__:trials:24 - Trial = 5687/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.066 | DEBUG    | __main__:trials:29 - Trial = 5687/30000 | Total reward = 51.29
2022-01-26 14:16:52.070 | DEBUG    | __main__:trials:24 - Trial = 5688/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.070 | DEBUG    | __main__:trials:29 - Trial = 5688/30000 | Total reward = 48.87
2022-01-26 14:16:52.074 | DEBUG    | __main__:trials:24 - Trial = 5689/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.076 | DEBUG    | __main__:trials:29 - Trial = 5689/30000 | Total reward = 54.12
2022-01-26 14:16:52.079 | DEBUG    | __main__:trials:24 - Trial = 5690/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.080 | DEBUG    | __main__:trials:29 - Trial = 5690/30000 | Total reward = 52.89
2022-01-26 14:16:52.084 | DEBUG    | __main__:trials:24 - Trial = 5691/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.085 | DEBUG    | __main__:trials:29 - Trial = 5691/30000 | Total reward = 51.19
2022-01-26 14:16:52.088 | DEBUG    | __main__:trials:24 - Trial = 5692/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.090 | DEBUG    | __main__:trials:29 - Trial = 5692/30000 | Total reward = 49.93
2022-01-26 14:16:52.093 | DEBUG    | __main__:trials:24 - Trial = 5693/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.095 | DEBUG    | __main__:trials:29 - Trial = 5693/30000 | Total reward = 49.64
2022-01-26 14:16:52.098 | DEBUG    | __main__:trials:24 - Trial = 5694/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.100 | DEBUG    | __main__:trials:29 - Trial = 5694/30000 | Total reward = 51.14
2022-01-26 14:16:52.103 | DEBUG    | __main__:trials:24 - Trial = 5695/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.105 | DEBUG    | __main__:trials:29 - Trial = 5695/30000 | Total reward = 49.26
2022-01-26 14:16:52.108 | DEBUG    | __main__:trials:24 - Trial = 5696/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.110 | DEBUG    | __main__:trials:29 - Trial = 5696/30000 | Total reward = 48.43
2022-01-26 14:16:52.113 | DEBUG    | __main__:trials:24 - Trial = 5697/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.115 | DEBUG    | __main__:trials:29 - Trial = 5697/30000 | Total reward = 59.03
2022-01-26 14:16:52.119 | DEBUG    | __main__:trials:24 - Trial = 5698/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.120 | DEBUG    | __main__:trials:29 - Trial = 5698/30000 | Total reward = 42.55
2022-01-26 14:16:52.124 | DEBUG    | __main__:trials:24 - Trial = 5699/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.125 | DEBUG    | __main__:trials:29 - Trial = 5699/30000 | Total reward = 51.73
2022-01-26 14:16:52.128 | DEBUG    | __main__:trials:24 - Trial = 5700/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.130 | DEBUG    | __main__:trials:29 - Trial = 5700/30000 | Total reward = 48.53
2022-01-26 14:16:52.134 | DEBUG    | __main__:trials:24 - Trial = 5701/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.135 | DEBUG    | __main__:trials:29 - Trial = 5701/30000 | Total reward = 40.59
2022-01-26 14:16:52.139 | DEBUG    | __main__:trials:24 - Trial = 5702/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.139 | DEBUG    | __main__:trials:29 - Trial = 5702/30000 | Total reward = 51.79
2022-01-26 14:16:52.144 | DEBUG    | __main__:trials:24 - Trial = 5703/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.145 | DEBUG    | __main__:trials:29 - Trial = 5703/30000 | Total reward = 45.06
2022-01-26 14:16:52.148 | DEBUG    | __main__:trials:24 - Trial = 5704/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.150 | DEBUG    | __main__:trials:29 - Trial = 5704/30000 | Total reward = 58.29
2022-01-26 14:16:52.154 | DEBUG    | __main__:trials:24 - Trial = 5705/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.155 | DEBUG    | __main__:trials:29 - Trial = 5705/30000 | Total reward = 53.47
2022-01-26 14:16:52.159 | DEBUG    | __main__:trials:24 - Trial = 5706/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.159 | DEBUG    | __main__:trials:29 - Trial = 5706/30000 | Total reward = 51.78
2022-01-26 14:16:52.164 | DEBUG    | __main__:trials:24 - Trial = 5707/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.164 | DEBUG    | __main__:trials:29 - Trial = 5707/30000 | Total reward = 50.58
2022-01-26 14:16:52.168 | DEBUG    | __main__:trials:24 - Trial = 5708/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.169 | DEBUG    | __main__:trials:29 - Trial = 5708/30000 | Total reward = 48.29
2022-01-26 14:16:52.172 | DEBUG    | __main__:trials:24 - Trial = 5709/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.174 | DEBUG    | __main__:trials:29 - Trial = 5709/30000 | Total reward = 48.84
2022-01-26 14:16:52.177 | DEBUG    | __main__:trials:24 - Trial = 5710/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.178 | DEBUG    | __main__:trials:29 - Trial = 5710/30000 | Total reward = 51.79
2022-01-26 14:16:52.181 | DEBUG    | __main__:trials:24 - Trial = 5711/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.183 | DEBUG    | __main__:trials:29 - Trial = 5711/30000 | Total reward = 39.50
2022-01-26 14:16:52.186 | DEBUG    | __main__:trials:24 - Trial = 5712/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.188 | DEBUG    | __main__:trials:29 - Trial = 5712/30000 | Total reward = 50.07
2022-01-26 14:16:52.190 | DEBUG    | __main__:trials:24 - Trial = 5713/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.192 | DEBUG    | __main__:trials:29 - Trial = 5713/30000 | Total reward = 44.54
2022-01-26 14:16:52.195 | DEBUG    | __main__:trials:24 - Trial = 5714/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.196 | DEBUG    | __main__:trials:29 - Trial = 5714/30000 | Total reward = 50.08
2022-01-26 14:16:52.199 | DEBUG    | __main__:trials:24 - Trial = 5715/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.200 | DEBUG    | __main__:trials:29 - Trial = 5715/30000 | Total reward = 51.78
2022-01-26 14:16:52.204 | DEBUG    | __main__:trials:26 - Trial = 5716/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.205 | DEBUG    | __main__:trials:29 - Trial = 5716/30000 | Total reward = 30.24
2022-01-26 14:16:52.208 | DEBUG    | __main__:trials:24 - Trial = 5717/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.208 | DEBUG    | __main__:trials:29 - Trial = 5717/30000 | Total reward = 52.83
2022-01-26 14:16:52.212 | DEBUG    | __main__:trials:24 - Trial = 5718/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.213 | DEBUG    | __main__:trials:29 - Trial = 5718/30000 | Total reward = 49.40
2022-01-26 14:16:52.216 | DEBUG    | __main__:trials:24 - Trial = 5719/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.218 | DEBUG    | __main__:trials:29 - Trial = 5719/30000 | Total reward = 44.36
2022-01-26 14:16:52.220 | DEBUG    | __main__:trials:24 - Trial = 5720/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.222 | DEBUG    | __main__:trials:29 - Trial = 5720/30000 | Total reward = 49.16
2022-01-26 14:16:52.225 | DEBUG    | __main__:trials:24 - Trial = 5721/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.227 | DEBUG    | __main__:trials:29 - Trial = 5721/30000 | Total reward = 50.34
2022-01-26 14:16:52.230 | DEBUG    | __main__:trials:24 - Trial = 5722/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.232 | DEBUG    | __main__:trials:29 - Trial = 5722/30000 | Total reward = 47.37
2022-01-26 14:16:52.235 | DEBUG    | __main__:trials:24 - Trial = 5723/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.235 | DEBUG    | __main__:trials:29 - Trial = 5723/30000 | Total reward = 50.67
2022-01-26 14:16:52.239 | DEBUG    | __main__:trials:24 - Trial = 5724/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.240 | DEBUG    | __main__:trials:29 - Trial = 5724/30000 | Total reward = 47.10
2022-01-26 14:16:52.243 | DEBUG    | __main__:trials:24 - Trial = 5725/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.245 | DEBUG    | __main__:trials:29 - Trial = 5725/30000 | Total reward = 45.75
2022-01-26 14:16:52.246 | DEBUG    | __main__:trials:26 - Trial = 5726/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.248 | DEBUG    | __main__:trials:29 - Trial = 5726/30000 | Total reward = 7.23
2022-01-26 14:16:52.251 | DEBUG    | __main__:trials:24 - Trial = 5727/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.251 | DEBUG    | __main__:trials:29 - Trial = 5727/30000 | Total reward = 48.47
2022-01-26 14:16:52.255 | DEBUG    | __main__:trials:24 - Trial = 5728/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.256 | DEBUG    | __main__:trials:29 - Trial = 5728/30000 | Total reward = 53.05
2022-01-26 14:16:52.259 | DEBUG    | __main__:trials:24 - Trial = 5729/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.261 | DEBUG    | __main__:trials:29 - Trial = 5729/30000 | Total reward = 45.90
2022-01-26 14:16:52.264 | DEBUG    | __main__:trials:24 - Trial = 5730/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.264 | DEBUG    | __main__:trials:29 - Trial = 5730/30000 | Total reward = 47.65
2022-01-26 14:16:52.268 | DEBUG    | __main__:trials:24 - Trial = 5731/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.269 | DEBUG    | __main__:trials:29 - Trial = 5731/30000 | Total reward = 32.11
2022-01-26 14:16:52.272 | DEBUG    | __main__:trials:24 - Trial = 5732/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.273 | DEBUG    | __main__:trials:29 - Trial = 5732/30000 | Total reward = 48.84
2022-01-26 14:16:52.276 | DEBUG    | __main__:trials:24 - Trial = 5733/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.277 | DEBUG    | __main__:trials:29 - Trial = 5733/30000 | Total reward = 40.08
2022-01-26 14:16:52.281 | DEBUG    | __main__:trials:24 - Trial = 5734/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.282 | DEBUG    | __main__:trials:29 - Trial = 5734/30000 | Total reward = 40.59
2022-01-26 14:16:52.285 | DEBUG    | __main__:trials:24 - Trial = 5735/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.286 | DEBUG    | __main__:trials:29 - Trial = 5735/30000 | Total reward = 46.06
2022-01-26 14:16:52.289 | DEBUG    | __main__:trials:24 - Trial = 5736/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.290 | DEBUG    | __main__:trials:29 - Trial = 5736/30000 | Total reward = 47.55
2022-01-26 14:16:52.293 | DEBUG    | __main__:trials:24 - Trial = 5737/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.295 | DEBUG    | __main__:trials:29 - Trial = 5737/30000 | Total reward = 55.79
2022-01-26 14:16:52.298 | DEBUG    | __main__:trials:24 - Trial = 5738/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.299 | DEBUG    | __main__:trials:29 - Trial = 5738/30000 | Total reward = 55.75
2022-01-26 14:16:52.303 | DEBUG    | __main__:trials:24 - Trial = 5739/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.304 | DEBUG    | __main__:trials:29 - Trial = 5739/30000 | Total reward = 47.31
2022-01-26 14:16:52.307 | DEBUG    | __main__:trials:24 - Trial = 5740/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.309 | DEBUG    | __main__:trials:29 - Trial = 5740/30000 | Total reward = 35.88
2022-01-26 14:16:52.312 | DEBUG    | __main__:trials:24 - Trial = 5741/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.314 | DEBUG    | __main__:trials:29 - Trial = 5741/30000 | Total reward = 46.91
2022-01-26 14:16:52.317 | DEBUG    | __main__:trials:24 - Trial = 5742/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.319 | DEBUG    | __main__:trials:29 - Trial = 5742/30000 | Total reward = 49.93
2022-01-26 14:16:52.322 | DEBUG    | __main__:trials:24 - Trial = 5743/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.323 | DEBUG    | __main__:trials:29 - Trial = 5743/30000 | Total reward = 52.29
2022-01-26 14:16:52.326 | DEBUG    | __main__:trials:24 - Trial = 5744/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.328 | DEBUG    | __main__:trials:29 - Trial = 5744/30000 | Total reward = 40.21
2022-01-26 14:16:52.330 | DEBUG    | __main__:trials:26 - Trial = 5745/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.332 | DEBUG    | __main__:trials:29 - Trial = 5745/30000 | Total reward = 11.78
2022-01-26 14:16:52.335 | DEBUG    | __main__:trials:24 - Trial = 5746/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.337 | DEBUG    | __main__:trials:29 - Trial = 5746/30000 | Total reward = 51.73
2022-01-26 14:16:52.340 | DEBUG    | __main__:trials:24 - Trial = 5747/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.342 | DEBUG    | __main__:trials:29 - Trial = 5747/30000 | Total reward = 52.60
2022-01-26 14:16:52.344 | DEBUG    | __main__:trials:24 - Trial = 5748/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.346 | DEBUG    | __main__:trials:29 - Trial = 5748/30000 | Total reward = 48.92
2022-01-26 14:16:52.349 | DEBUG    | __main__:trials:24 - Trial = 5749/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.351 | DEBUG    | __main__:trials:29 - Trial = 5749/30000 | Total reward = 47.17
2022-01-26 14:16:52.354 | DEBUG    | __main__:trials:24 - Trial = 5750/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.356 | DEBUG    | __main__:trials:29 - Trial = 5750/30000 | Total reward = 57.10
2022-01-26 14:16:52.359 | DEBUG    | __main__:trials:24 - Trial = 5751/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.360 | DEBUG    | __main__:trials:29 - Trial = 5751/30000 | Total reward = 21.12
2022-01-26 14:16:52.363 | DEBUG    | __main__:trials:24 - Trial = 5752/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.364 | DEBUG    | __main__:trials:29 - Trial = 5752/30000 | Total reward = 49.70
2022-01-26 14:16:52.367 | DEBUG    | __main__:trials:24 - Trial = 5753/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.369 | DEBUG    | __main__:trials:29 - Trial = 5753/30000 | Total reward = 48.46
2022-01-26 14:16:52.372 | DEBUG    | __main__:trials:24 - Trial = 5754/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.374 | DEBUG    | __main__:trials:29 - Trial = 5754/30000 | Total reward = 44.17
2022-01-26 14:16:52.376 | DEBUG    | __main__:trials:24 - Trial = 5755/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.378 | DEBUG    | __main__:trials:29 - Trial = 5755/30000 | Total reward = 50.85
2022-01-26 14:16:52.382 | DEBUG    | __main__:trials:24 - Trial = 5756/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.383 | DEBUG    | __main__:trials:29 - Trial = 5756/30000 | Total reward = 48.40
2022-01-26 14:16:52.386 | DEBUG    | __main__:trials:24 - Trial = 5757/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.388 | DEBUG    | __main__:trials:29 - Trial = 5757/30000 | Total reward = 51.16
2022-01-26 14:16:52.390 | DEBUG    | __main__:trials:24 - Trial = 5758/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.392 | DEBUG    | __main__:trials:29 - Trial = 5758/30000 | Total reward = 47.80
2022-01-26 14:16:52.395 | DEBUG    | __main__:trials:24 - Trial = 5759/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.396 | DEBUG    | __main__:trials:29 - Trial = 5759/30000 | Total reward = 48.55
2022-01-26 14:16:52.399 | DEBUG    | __main__:trials:24 - Trial = 5760/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.400 | DEBUG    | __main__:trials:29 - Trial = 5760/30000 | Total reward = 51.64
2022-01-26 14:16:52.403 | DEBUG    | __main__:trials:24 - Trial = 5761/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.404 | DEBUG    | __main__:trials:29 - Trial = 5761/30000 | Total reward = 46.44
2022-01-26 14:16:52.407 | DEBUG    | __main__:trials:24 - Trial = 5762/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.409 | DEBUG    | __main__:trials:29 - Trial = 5762/30000 | Total reward = 44.92
2022-01-26 14:16:52.413 | DEBUG    | __main__:trials:24 - Trial = 5763/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.414 | DEBUG    | __main__:trials:29 - Trial = 5763/30000 | Total reward = 48.69
2022-01-26 14:16:52.418 | DEBUG    | __main__:trials:24 - Trial = 5764/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.419 | DEBUG    | __main__:trials:29 - Trial = 5764/30000 | Total reward = 46.52
2022-01-26 14:16:52.422 | DEBUG    | __main__:trials:24 - Trial = 5765/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.424 | DEBUG    | __main__:trials:29 - Trial = 5765/30000 | Total reward = 45.48
2022-01-26 14:16:52.426 | DEBUG    | __main__:trials:26 - Trial = 5766/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.428 | DEBUG    | __main__:trials:29 - Trial = 5766/30000 | Total reward = 11.51
2022-01-26 14:16:52.431 | DEBUG    | __main__:trials:26 - Trial = 5767/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.432 | DEBUG    | __main__:trials:29 - Trial = 5767/30000 | Total reward = 8.65
2022-01-26 14:16:52.436 | DEBUG    | __main__:trials:26 - Trial = 5768/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.438 | DEBUG    | __main__:trials:29 - Trial = 5768/30000 | Total reward = 36.38
2022-01-26 14:16:52.441 | DEBUG    | __main__:trials:24 - Trial = 5769/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.443 | DEBUG    | __main__:trials:29 - Trial = 5769/30000 | Total reward = 35.05
2022-01-26 14:16:52.446 | DEBUG    | __main__:trials:24 - Trial = 5770/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.447 | DEBUG    | __main__:trials:29 - Trial = 5770/30000 | Total reward = 45.28
2022-01-26 14:16:52.451 | DEBUG    | __main__:trials:24 - Trial = 5771/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.452 | DEBUG    | __main__:trials:29 - Trial = 5771/30000 | Total reward = 47.11
2022-01-26 14:16:52.456 | DEBUG    | __main__:trials:24 - Trial = 5772/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.457 | DEBUG    | __main__:trials:29 - Trial = 5772/30000 | Total reward = 42.37
2022-01-26 14:16:52.460 | DEBUG    | __main__:trials:24 - Trial = 5773/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.462 | DEBUG    | __main__:trials:29 - Trial = 5773/30000 | Total reward = 47.12
2022-01-26 14:16:52.466 | DEBUG    | __main__:trials:24 - Trial = 5774/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.467 | DEBUG    | __main__:trials:29 - Trial = 5774/30000 | Total reward = 44.34
2022-01-26 14:16:52.471 | DEBUG    | __main__:trials:24 - Trial = 5775/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.473 | DEBUG    | __main__:trials:29 - Trial = 5775/30000 | Total reward = 48.95
2022-01-26 14:16:52.476 | DEBUG    | __main__:trials:24 - Trial = 5776/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.478 | DEBUG    | __main__:trials:29 - Trial = 5776/30000 | Total reward = 49.11
2022-01-26 14:16:52.481 | DEBUG    | __main__:trials:24 - Trial = 5777/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.483 | DEBUG    | __main__:trials:29 - Trial = 5777/30000 | Total reward = 44.28
2022-01-26 14:16:52.486 | DEBUG    | __main__:trials:24 - Trial = 5778/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.488 | DEBUG    | __main__:trials:29 - Trial = 5778/30000 | Total reward = 47.51
2022-01-26 14:16:52.491 | DEBUG    | __main__:trials:24 - Trial = 5779/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.493 | DEBUG    | __main__:trials:29 - Trial = 5779/30000 | Total reward = 24.67
2022-01-26 14:16:52.496 | DEBUG    | __main__:trials:24 - Trial = 5780/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.498 | DEBUG    | __main__:trials:29 - Trial = 5780/30000 | Total reward = 44.36
2022-01-26 14:16:52.501 | DEBUG    | __main__:trials:26 - Trial = 5781/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.502 | DEBUG    | __main__:trials:29 - Trial = 5781/30000 | Total reward = 21.45
2022-01-26 14:16:52.505 | DEBUG    | __main__:trials:24 - Trial = 5782/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.507 | DEBUG    | __main__:trials:29 - Trial = 5782/30000 | Total reward = 49.16
2022-01-26 14:16:52.510 | DEBUG    | __main__:trials:24 - Trial = 5783/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.511 | DEBUG    | __main__:trials:29 - Trial = 5783/30000 | Total reward = 35.01
2022-01-26 14:16:52.515 | DEBUG    | __main__:trials:24 - Trial = 5784/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.515 | DEBUG    | __main__:trials:29 - Trial = 5784/30000 | Total reward = 41.50
2022-01-26 14:16:52.519 | DEBUG    | __main__:trials:24 - Trial = 5785/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.520 | DEBUG    | __main__:trials:29 - Trial = 5785/30000 | Total reward = 44.16
2022-01-26 14:16:52.524 | DEBUG    | __main__:trials:24 - Trial = 5786/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.525 | DEBUG    | __main__:trials:29 - Trial = 5786/30000 | Total reward = 41.10
2022-01-26 14:16:52.529 | DEBUG    | __main__:trials:24 - Trial = 5787/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.531 | DEBUG    | __main__:trials:29 - Trial = 5787/30000 | Total reward = 39.83
2022-01-26 14:16:52.534 | DEBUG    | __main__:trials:24 - Trial = 5788/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.536 | DEBUG    | __main__:trials:29 - Trial = 5788/30000 | Total reward = 48.35
2022-01-26 14:16:52.540 | DEBUG    | __main__:trials:24 - Trial = 5789/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.541 | DEBUG    | __main__:trials:29 - Trial = 5789/30000 | Total reward = 56.35
2022-01-26 14:16:52.545 | DEBUG    | __main__:trials:24 - Trial = 5790/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.546 | DEBUG    | __main__:trials:29 - Trial = 5790/30000 | Total reward = 51.96
2022-01-26 14:16:52.549 | DEBUG    | __main__:trials:26 - Trial = 5791/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.550 | DEBUG    | __main__:trials:29 - Trial = 5791/30000 | Total reward = 14.35
2022-01-26 14:16:52.554 | DEBUG    | __main__:trials:24 - Trial = 5792/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.556 | DEBUG    | __main__:trials:29 - Trial = 5792/30000 | Total reward = 52.01
2022-01-26 14:16:52.559 | DEBUG    | __main__:trials:24 - Trial = 5793/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.560 | DEBUG    | __main__:trials:29 - Trial = 5793/30000 | Total reward = 50.05
2022-01-26 14:16:52.564 | DEBUG    | __main__:trials:24 - Trial = 5794/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.565 | DEBUG    | __main__:trials:29 - Trial = 5794/30000 | Total reward = 44.02
2022-01-26 14:16:52.568 | DEBUG    | __main__:trials:24 - Trial = 5795/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.570 | DEBUG    | __main__:trials:29 - Trial = 5795/30000 | Total reward = 51.73
2022-01-26 14:16:52.574 | DEBUG    | __main__:trials:24 - Trial = 5796/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.575 | DEBUG    | __main__:trials:29 - Trial = 5796/30000 | Total reward = 47.35
2022-01-26 14:16:52.578 | DEBUG    | __main__:trials:24 - Trial = 5797/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.580 | DEBUG    | __main__:trials:29 - Trial = 5797/30000 | Total reward = 46.44
2022-01-26 14:16:52.583 | DEBUG    | __main__:trials:24 - Trial = 5798/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.584 | DEBUG    | __main__:trials:29 - Trial = 5798/30000 | Total reward = 51.58
2022-01-26 14:16:52.587 | DEBUG    | __main__:trials:24 - Trial = 5799/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.589 | DEBUG    | __main__:trials:29 - Trial = 5799/30000 | Total reward = 51.81
2022-01-26 14:16:52.592 | DEBUG    | __main__:trials:24 - Trial = 5800/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.593 | DEBUG    | __main__:trials:29 - Trial = 5800/30000 | Total reward = 49.50
2022-01-26 14:16:52.596 | DEBUG    | __main__:trials:24 - Trial = 5801/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.598 | DEBUG    | __main__:trials:29 - Trial = 5801/30000 | Total reward = 57.11
2022-01-26 14:16:52.601 | DEBUG    | __main__:trials:26 - Trial = 5802/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.602 | DEBUG    | __main__:trials:29 - Trial = 5802/30000 | Total reward = 11.79
2022-01-26 14:16:52.605 | DEBUG    | __main__:trials:24 - Trial = 5803/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.607 | DEBUG    | __main__:trials:29 - Trial = 5803/30000 | Total reward = 45.91
2022-01-26 14:16:52.610 | DEBUG    | __main__:trials:24 - Trial = 5804/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.612 | DEBUG    | __main__:trials:29 - Trial = 5804/30000 | Total reward = 42.13
2022-01-26 14:16:52.615 | DEBUG    | __main__:trials:24 - Trial = 5805/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.617 | DEBUG    | __main__:trials:29 - Trial = 5805/30000 | Total reward = 49.26
2022-01-26 14:16:52.621 | DEBUG    | __main__:trials:24 - Trial = 5806/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.621 | DEBUG    | __main__:trials:29 - Trial = 5806/30000 | Total reward = 45.30
2022-01-26 14:16:52.626 | DEBUG    | __main__:trials:24 - Trial = 5807/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.626 | DEBUG    | __main__:trials:29 - Trial = 5807/30000 | Total reward = 46.91
2022-01-26 14:16:52.631 | DEBUG    | __main__:trials:24 - Trial = 5808/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.632 | DEBUG    | __main__:trials:29 - Trial = 5808/30000 | Total reward = 50.63
2022-01-26 14:16:52.636 | DEBUG    | __main__:trials:24 - Trial = 5809/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.636 | DEBUG    | __main__:trials:29 - Trial = 5809/30000 | Total reward = 51.73
2022-01-26 14:16:52.641 | DEBUG    | __main__:trials:24 - Trial = 5810/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.641 | DEBUG    | __main__:trials:29 - Trial = 5810/30000 | Total reward = 50.07
2022-01-26 14:16:52.645 | DEBUG    | __main__:trials:24 - Trial = 5811/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.646 | DEBUG    | __main__:trials:29 - Trial = 5811/30000 | Total reward = 55.10
2022-01-26 14:16:52.650 | DEBUG    | __main__:trials:24 - Trial = 5812/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.650 | DEBUG    | __main__:trials:29 - Trial = 5812/30000 | Total reward = 49.84
2022-01-26 14:16:52.654 | DEBUG    | __main__:trials:24 - Trial = 5813/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.656 | DEBUG    | __main__:trials:29 - Trial = 5813/30000 | Total reward = 52.19
2022-01-26 14:16:52.659 | DEBUG    | __main__:trials:24 - Trial = 5814/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.661 | DEBUG    | __main__:trials:29 - Trial = 5814/30000 | Total reward = 51.32
2022-01-26 14:16:52.664 | DEBUG    | __main__:trials:24 - Trial = 5815/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.665 | DEBUG    | __main__:trials:29 - Trial = 5815/30000 | Total reward = 49.38
2022-01-26 14:16:52.668 | DEBUG    | __main__:trials:24 - Trial = 5816/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.670 | DEBUG    | __main__:trials:29 - Trial = 5816/30000 | Total reward = 52.34
2022-01-26 14:16:52.674 | DEBUG    | __main__:trials:24 - Trial = 5817/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.675 | DEBUG    | __main__:trials:29 - Trial = 5817/30000 | Total reward = 50.60
2022-01-26 14:16:52.679 | DEBUG    | __main__:trials:24 - Trial = 5818/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.680 | DEBUG    | __main__:trials:29 - Trial = 5818/30000 | Total reward = 48.35
2022-01-26 14:16:52.684 | DEBUG    | __main__:trials:24 - Trial = 5819/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.685 | DEBUG    | __main__:trials:29 - Trial = 5819/30000 | Total reward = 52.39
2022-01-26 14:16:52.689 | DEBUG    | __main__:trials:24 - Trial = 5820/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.691 | DEBUG    | __main__:trials:29 - Trial = 5820/30000 | Total reward = 43.90
2022-01-26 14:16:52.694 | DEBUG    | __main__:trials:26 - Trial = 5821/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.696 | DEBUG    | __main__:trials:29 - Trial = 5821/30000 | Total reward = 19.46
2022-01-26 14:16:52.699 | DEBUG    | __main__:trials:24 - Trial = 5822/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.701 | DEBUG    | __main__:trials:29 - Trial = 5822/30000 | Total reward = 51.79
2022-01-26 14:16:52.704 | DEBUG    | __main__:trials:24 - Trial = 5823/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.706 | DEBUG    | __main__:trials:29 - Trial = 5823/30000 | Total reward = 52.43
2022-01-26 14:16:52.709 | DEBUG    | __main__:trials:24 - Trial = 5824/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.709 | DEBUG    | __main__:trials:29 - Trial = 5824/30000 | Total reward = 54.73
2022-01-26 14:16:52.714 | DEBUG    | __main__:trials:24 - Trial = 5825/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.715 | DEBUG    | __main__:trials:29 - Trial = 5825/30000 | Total reward = 58.32
2022-01-26 14:16:52.719 | DEBUG    | __main__:trials:24 - Trial = 5826/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.719 | DEBUG    | __main__:trials:29 - Trial = 5826/30000 | Total reward = 61.19
2022-01-26 14:16:52.723 | DEBUG    | __main__:trials:24 - Trial = 5827/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.725 | DEBUG    | __main__:trials:29 - Trial = 5827/30000 | Total reward = 47.70
2022-01-26 14:16:52.728 | DEBUG    | __main__:trials:24 - Trial = 5828/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.730 | DEBUG    | __main__:trials:29 - Trial = 5828/30000 | Total reward = 51.73
2022-01-26 14:16:52.734 | DEBUG    | __main__:trials:24 - Trial = 5829/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.734 | DEBUG    | __main__:trials:29 - Trial = 5829/30000 | Total reward = 44.29
2022-01-26 14:16:52.739 | DEBUG    | __main__:trials:24 - Trial = 5830/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.740 | DEBUG    | __main__:trials:29 - Trial = 5830/30000 | Total reward = 56.22
2022-01-26 14:16:52.744 | DEBUG    | __main__:trials:24 - Trial = 5831/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.745 | DEBUG    | __main__:trials:29 - Trial = 5831/30000 | Total reward = 50.69
2022-01-26 14:16:52.749 | DEBUG    | __main__:trials:24 - Trial = 5832/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.751 | DEBUG    | __main__:trials:29 - Trial = 5832/30000 | Total reward = 56.08
2022-01-26 14:16:52.754 | DEBUG    | __main__:trials:24 - Trial = 5833/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.755 | DEBUG    | __main__:trials:29 - Trial = 5833/30000 | Total reward = 47.65
2022-01-26 14:16:52.759 | DEBUG    | __main__:trials:24 - Trial = 5834/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.760 | DEBUG    | __main__:trials:29 - Trial = 5834/30000 | Total reward = 35.75
2022-01-26 14:16:52.763 | DEBUG    | __main__:trials:24 - Trial = 5835/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.765 | DEBUG    | __main__:trials:29 - Trial = 5835/30000 | Total reward = 51.36
2022-01-26 14:16:52.768 | DEBUG    | __main__:trials:24 - Trial = 5836/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.770 | DEBUG    | __main__:trials:29 - Trial = 5836/30000 | Total reward = 40.08
2022-01-26 14:16:52.774 | DEBUG    | __main__:trials:24 - Trial = 5837/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.775 | DEBUG    | __main__:trials:29 - Trial = 5837/30000 | Total reward = 51.73
2022-01-26 14:16:52.779 | DEBUG    | __main__:trials:24 - Trial = 5838/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.780 | DEBUG    | __main__:trials:29 - Trial = 5838/30000 | Total reward = 48.95
2022-01-26 14:16:52.783 | DEBUG    | __main__:trials:24 - Trial = 5839/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.785 | DEBUG    | __main__:trials:29 - Trial = 5839/30000 | Total reward = 48.35
2022-01-26 14:16:52.789 | DEBUG    | __main__:trials:24 - Trial = 5840/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.790 | DEBUG    | __main__:trials:29 - Trial = 5840/30000 | Total reward = 42.10
2022-01-26 14:16:52.793 | DEBUG    | __main__:trials:24 - Trial = 5841/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.794 | DEBUG    | __main__:trials:29 - Trial = 5841/30000 | Total reward = 49.07
2022-01-26 14:16:52.798 | DEBUG    | __main__:trials:24 - Trial = 5842/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.799 | DEBUG    | __main__:trials:29 - Trial = 5842/30000 | Total reward = 41.91
2022-01-26 14:16:52.803 | DEBUG    | __main__:trials:24 - Trial = 5843/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.805 | DEBUG    | __main__:trials:29 - Trial = 5843/30000 | Total reward = 53.66
2022-01-26 14:16:52.807 | DEBUG    | __main__:trials:24 - Trial = 5844/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.809 | DEBUG    | __main__:trials:29 - Trial = 5844/30000 | Total reward = 40.95
2022-01-26 14:16:52.812 | DEBUG    | __main__:trials:24 - Trial = 5845/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.814 | DEBUG    | __main__:trials:29 - Trial = 5845/30000 | Total reward = 48.78
2022-01-26 14:16:52.817 | DEBUG    | __main__:trials:24 - Trial = 5846/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.819 | DEBUG    | __main__:trials:29 - Trial = 5846/30000 | Total reward = 43.14
2022-01-26 14:16:52.823 | DEBUG    | __main__:trials:24 - Trial = 5847/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.823 | DEBUG    | __main__:trials:29 - Trial = 5847/30000 | Total reward = 50.56
2022-01-26 14:16:52.828 | DEBUG    | __main__:trials:24 - Trial = 5848/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.829 | DEBUG    | __main__:trials:29 - Trial = 5848/30000 | Total reward = 46.12
2022-01-26 14:16:52.832 | DEBUG    | __main__:trials:24 - Trial = 5849/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.834 | DEBUG    | __main__:trials:29 - Trial = 5849/30000 | Total reward = 51.24
2022-01-26 14:16:52.838 | DEBUG    | __main__:trials:24 - Trial = 5850/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.839 | DEBUG    | __main__:trials:29 - Trial = 5850/30000 | Total reward = 43.77
2022-01-26 14:16:52.843 | DEBUG    | __main__:trials:24 - Trial = 5851/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.844 | DEBUG    | __main__:trials:29 - Trial = 5851/30000 | Total reward = 47.87
2022-01-26 14:16:52.847 | DEBUG    | __main__:trials:24 - Trial = 5852/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.849 | DEBUG    | __main__:trials:29 - Trial = 5852/30000 | Total reward = 48.78
2022-01-26 14:16:52.852 | DEBUG    | __main__:trials:24 - Trial = 5853/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.854 | DEBUG    | __main__:trials:29 - Trial = 5853/30000 | Total reward = 52.33
2022-01-26 14:16:52.857 | DEBUG    | __main__:trials:24 - Trial = 5854/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.859 | DEBUG    | __main__:trials:29 - Trial = 5854/30000 | Total reward = 45.71
2022-01-26 14:16:52.862 | DEBUG    | __main__:trials:24 - Trial = 5855/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.864 | DEBUG    | __main__:trials:29 - Trial = 5855/30000 | Total reward = 48.27
2022-01-26 14:16:52.866 | DEBUG    | __main__:trials:24 - Trial = 5856/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.868 | DEBUG    | __main__:trials:29 - Trial = 5856/30000 | Total reward = 46.30
2022-01-26 14:16:52.872 | DEBUG    | __main__:trials:24 - Trial = 5857/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.873 | DEBUG    | __main__:trials:29 - Trial = 5857/30000 | Total reward = 49.57
2022-01-26 14:16:52.876 | DEBUG    | __main__:trials:24 - Trial = 5858/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.878 | DEBUG    | __main__:trials:29 - Trial = 5858/30000 | Total reward = 53.20
2022-01-26 14:16:52.882 | DEBUG    | __main__:trials:24 - Trial = 5859/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.883 | DEBUG    | __main__:trials:29 - Trial = 5859/30000 | Total reward = 51.47
2022-01-26 14:16:52.887 | DEBUG    | __main__:trials:24 - Trial = 5860/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.888 | DEBUG    | __main__:trials:29 - Trial = 5860/30000 | Total reward = 45.76
2022-01-26 14:16:52.892 | DEBUG    | __main__:trials:24 - Trial = 5861/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.894 | DEBUG    | __main__:trials:29 - Trial = 5861/30000 | Total reward = 47.81
2022-01-26 14:16:52.902 | DEBUG    | __main__:trials:24 - Trial = 5862/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.903 | DEBUG    | __main__:trials:29 - Trial = 5862/30000 | Total reward = 47.42
2022-01-26 14:16:52.907 | DEBUG    | __main__:trials:24 - Trial = 5863/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.909 | DEBUG    | __main__:trials:29 - Trial = 5863/30000 | Total reward = 46.04
2022-01-26 14:16:52.912 | DEBUG    | __main__:trials:24 - Trial = 5864/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.914 | DEBUG    | __main__:trials:29 - Trial = 5864/30000 | Total reward = 49.94
2022-01-26 14:16:52.917 | DEBUG    | __main__:trials:24 - Trial = 5865/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.918 | DEBUG    | __main__:trials:29 - Trial = 5865/30000 | Total reward = 46.03
2022-01-26 14:16:52.921 | DEBUG    | __main__:trials:26 - Trial = 5866/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.922 | DEBUG    | __main__:trials:29 - Trial = 5866/30000 | Total reward = 11.51
2022-01-26 14:16:52.925 | DEBUG    | __main__:trials:26 - Trial = 5867/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:52.927 | DEBUG    | __main__:trials:29 - Trial = 5867/30000 | Total reward = 23.73
2022-01-26 14:16:52.930 | DEBUG    | __main__:trials:24 - Trial = 5868/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.931 | DEBUG    | __main__:trials:29 - Trial = 5868/30000 | Total reward = 46.85
2022-01-26 14:16:52.935 | DEBUG    | __main__:trials:24 - Trial = 5869/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.936 | DEBUG    | __main__:trials:29 - Trial = 5869/30000 | Total reward = 41.31
2022-01-26 14:16:52.939 | DEBUG    | __main__:trials:24 - Trial = 5870/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.941 | DEBUG    | __main__:trials:29 - Trial = 5870/30000 | Total reward = 48.78
2022-01-26 14:16:52.945 | DEBUG    | __main__:trials:24 - Trial = 5871/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.945 | DEBUG    | __main__:trials:29 - Trial = 5871/30000 | Total reward = 44.69
2022-01-26 14:16:52.948 | DEBUG    | __main__:trials:24 - Trial = 5872/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.949 | DEBUG    | __main__:trials:29 - Trial = 5872/30000 | Total reward = 45.87
2022-01-26 14:16:52.952 | DEBUG    | __main__:trials:24 - Trial = 5873/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.954 | DEBUG    | __main__:trials:29 - Trial = 5873/30000 | Total reward = 47.77
2022-01-26 14:16:52.957 | DEBUG    | __main__:trials:24 - Trial = 5874/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.958 | DEBUG    | __main__:trials:29 - Trial = 5874/30000 | Total reward = 44.35
2022-01-26 14:16:52.962 | DEBUG    | __main__:trials:24 - Trial = 5875/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.963 | DEBUG    | __main__:trials:29 - Trial = 5875/30000 | Total reward = 37.01
2022-01-26 14:16:52.966 | DEBUG    | __main__:trials:24 - Trial = 5876/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.968 | DEBUG    | __main__:trials:29 - Trial = 5876/30000 | Total reward = 50.30
2022-01-26 14:16:52.971 | DEBUG    | __main__:trials:24 - Trial = 5877/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.972 | DEBUG    | __main__:trials:29 - Trial = 5877/30000 | Total reward = 46.78
2022-01-26 14:16:52.976 | DEBUG    | __main__:trials:24 - Trial = 5878/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.978 | DEBUG    | __main__:trials:29 - Trial = 5878/30000 | Total reward = 39.33
2022-01-26 14:16:52.981 | DEBUG    | __main__:trials:24 - Trial = 5879/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.983 | DEBUG    | __main__:trials:29 - Trial = 5879/30000 | Total reward = 49.10
2022-01-26 14:16:52.986 | DEBUG    | __main__:trials:24 - Trial = 5880/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.987 | DEBUG    | __main__:trials:29 - Trial = 5880/30000 | Total reward = 45.94
2022-01-26 14:16:52.990 | DEBUG    | __main__:trials:24 - Trial = 5881/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.992 | DEBUG    | __main__:trials:29 - Trial = 5881/30000 | Total reward = 43.50
2022-01-26 14:16:52.996 | DEBUG    | __main__:trials:24 - Trial = 5882/30000 | Max number of steps (20) reached
2022-01-26 14:16:52.997 | DEBUG    | __main__:trials:29 - Trial = 5882/30000 | Total reward = 42.67
2022-01-26 14:16:53.000 | DEBUG    | __main__:trials:24 - Trial = 5883/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.002 | DEBUG    | __main__:trials:29 - Trial = 5883/30000 | Total reward = 46.52
2022-01-26 14:16:53.005 | DEBUG    | __main__:trials:26 - Trial = 5884/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.006 | DEBUG    | __main__:trials:29 - Trial = 5884/30000 | Total reward = 18.45
2022-01-26 14:16:53.010 | DEBUG    | __main__:trials:24 - Trial = 5885/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.011 | DEBUG    | __main__:trials:29 - Trial = 5885/30000 | Total reward = 43.60
2022-01-26 14:16:53.014 | DEBUG    | __main__:trials:24 - Trial = 5886/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.016 | DEBUG    | __main__:trials:29 - Trial = 5886/30000 | Total reward = 41.61
2022-01-26 14:16:53.020 | DEBUG    | __main__:trials:24 - Trial = 5887/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.020 | DEBUG    | __main__:trials:29 - Trial = 5887/30000 | Total reward = 48.15
2022-01-26 14:16:53.025 | DEBUG    | __main__:trials:24 - Trial = 5888/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.026 | DEBUG    | __main__:trials:29 - Trial = 5888/30000 | Total reward = 46.21
2022-01-26 14:16:53.029 | DEBUG    | __main__:trials:24 - Trial = 5889/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.030 | DEBUG    | __main__:trials:29 - Trial = 5889/30000 | Total reward = 46.92
2022-01-26 14:16:53.033 | DEBUG    | __main__:trials:24 - Trial = 5890/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.034 | DEBUG    | __main__:trials:29 - Trial = 5890/30000 | Total reward = 45.51
2022-01-26 14:16:53.037 | DEBUG    | __main__:trials:24 - Trial = 5891/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.039 | DEBUG    | __main__:trials:29 - Trial = 5891/30000 | Total reward = 40.91
2022-01-26 14:16:53.042 | DEBUG    | __main__:trials:24 - Trial = 5892/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.043 | DEBUG    | __main__:trials:29 - Trial = 5892/30000 | Total reward = 43.20
2022-01-26 14:16:53.047 | DEBUG    | __main__:trials:24 - Trial = 5893/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.049 | DEBUG    | __main__:trials:29 - Trial = 5893/30000 | Total reward = 46.52
2022-01-26 14:16:53.052 | DEBUG    | __main__:trials:24 - Trial = 5894/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.053 | DEBUG    | __main__:trials:29 - Trial = 5894/30000 | Total reward = 43.91
2022-01-26 14:16:53.056 | DEBUG    | __main__:trials:24 - Trial = 5895/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.058 | DEBUG    | __main__:trials:29 - Trial = 5895/30000 | Total reward = 46.48
2022-01-26 14:16:53.062 | DEBUG    | __main__:trials:24 - Trial = 5896/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.063 | DEBUG    | __main__:trials:29 - Trial = 5896/30000 | Total reward = 53.58
2022-01-26 14:16:53.066 | DEBUG    | __main__:trials:24 - Trial = 5897/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.067 | DEBUG    | __main__:trials:29 - Trial = 5897/30000 | Total reward = 48.23
2022-01-26 14:16:53.070 | DEBUG    | __main__:trials:24 - Trial = 5898/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.072 | DEBUG    | __main__:trials:29 - Trial = 5898/30000 | Total reward = 40.39
2022-01-26 14:16:53.076 | DEBUG    | __main__:trials:24 - Trial = 5899/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.076 | DEBUG    | __main__:trials:29 - Trial = 5899/30000 | Total reward = 46.44
2022-01-26 14:16:53.080 | DEBUG    | __main__:trials:24 - Trial = 5900/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.081 | DEBUG    | __main__:trials:29 - Trial = 5900/30000 | Total reward = 53.21
2022-01-26 14:16:53.085 | DEBUG    | __main__:trials:24 - Trial = 5901/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.085 | DEBUG    | __main__:trials:29 - Trial = 5901/30000 | Total reward = 48.40
2022-01-26 14:16:53.088 | DEBUG    | __main__:trials:24 - Trial = 5902/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.089 | DEBUG    | __main__:trials:29 - Trial = 5902/30000 | Total reward = 46.95
2022-01-26 14:16:53.093 | DEBUG    | __main__:trials:24 - Trial = 5903/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.094 | DEBUG    | __main__:trials:29 - Trial = 5903/30000 | Total reward = 47.29
2022-01-26 14:16:53.098 | DEBUG    | __main__:trials:24 - Trial = 5904/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.098 | DEBUG    | __main__:trials:29 - Trial = 5904/30000 | Total reward = 48.28
2022-01-26 14:16:53.103 | DEBUG    | __main__:trials:24 - Trial = 5905/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.103 | DEBUG    | __main__:trials:29 - Trial = 5905/30000 | Total reward = 30.89
2022-01-26 14:16:53.108 | DEBUG    | __main__:trials:24 - Trial = 5906/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.108 | DEBUG    | __main__:trials:29 - Trial = 5906/30000 | Total reward = 35.77
2022-01-26 14:16:53.113 | DEBUG    | __main__:trials:24 - Trial = 5907/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.113 | DEBUG    | __main__:trials:29 - Trial = 5907/30000 | Total reward = 47.17
2022-01-26 14:16:53.117 | DEBUG    | __main__:trials:24 - Trial = 5908/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.118 | DEBUG    | __main__:trials:29 - Trial = 5908/30000 | Total reward = 46.57
2022-01-26 14:16:53.122 | DEBUG    | __main__:trials:24 - Trial = 5909/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.123 | DEBUG    | __main__:trials:29 - Trial = 5909/30000 | Total reward = 49.64
2022-01-26 14:16:53.127 | DEBUG    | __main__:trials:24 - Trial = 5910/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.128 | DEBUG    | __main__:trials:29 - Trial = 5910/30000 | Total reward = 30.25
2022-01-26 14:16:53.132 | DEBUG    | __main__:trials:24 - Trial = 5911/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.134 | DEBUG    | __main__:trials:29 - Trial = 5911/30000 | Total reward = 55.29
2022-01-26 14:16:53.138 | DEBUG    | __main__:trials:24 - Trial = 5912/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.139 | DEBUG    | __main__:trials:29 - Trial = 5912/30000 | Total reward = 46.70
2022-01-26 14:16:53.143 | DEBUG    | __main__:trials:24 - Trial = 5913/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.144 | DEBUG    | __main__:trials:29 - Trial = 5913/30000 | Total reward = 48.31
2022-01-26 14:16:53.147 | DEBUG    | __main__:trials:26 - Trial = 5914/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.148 | DEBUG    | __main__:trials:29 - Trial = 5914/30000 | Total reward = 20.45
2022-01-26 14:16:53.152 | DEBUG    | __main__:trials:24 - Trial = 5915/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.153 | DEBUG    | __main__:trials:29 - Trial = 5915/30000 | Total reward = 44.78
2022-01-26 14:16:53.157 | DEBUG    | __main__:trials:24 - Trial = 5916/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.158 | DEBUG    | __main__:trials:29 - Trial = 5916/30000 | Total reward = 44.61
2022-01-26 14:16:53.161 | DEBUG    | __main__:trials:24 - Trial = 5917/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.163 | DEBUG    | __main__:trials:29 - Trial = 5917/30000 | Total reward = 54.23
2022-01-26 14:16:53.167 | DEBUG    | __main__:trials:24 - Trial = 5918/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.167 | DEBUG    | __main__:trials:29 - Trial = 5918/30000 | Total reward = 45.01
2022-01-26 14:16:53.172 | DEBUG    | __main__:trials:26 - Trial = 5919/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.172 | DEBUG    | __main__:trials:29 - Trial = 5919/30000 | Total reward = 36.83
2022-01-26 14:16:53.176 | DEBUG    | __main__:trials:24 - Trial = 5920/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.177 | DEBUG    | __main__:trials:29 - Trial = 5920/30000 | Total reward = 35.37
2022-01-26 14:16:53.180 | DEBUG    | __main__:trials:24 - Trial = 5921/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.182 | DEBUG    | __main__:trials:29 - Trial = 5921/30000 | Total reward = 43.48
2022-01-26 14:16:53.185 | DEBUG    | __main__:trials:24 - Trial = 5922/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.186 | DEBUG    | __main__:trials:29 - Trial = 5922/30000 | Total reward = 56.31
2022-01-26 14:16:53.189 | DEBUG    | __main__:trials:24 - Trial = 5923/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.191 | DEBUG    | __main__:trials:29 - Trial = 5923/30000 | Total reward = 44.83
2022-01-26 14:16:53.194 | DEBUG    | __main__:trials:24 - Trial = 5924/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.196 | DEBUG    | __main__:trials:29 - Trial = 5924/30000 | Total reward = 50.27
2022-01-26 14:16:53.199 | DEBUG    | __main__:trials:24 - Trial = 5925/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.201 | DEBUG    | __main__:trials:29 - Trial = 5925/30000 | Total reward = 44.64
2022-01-26 14:16:53.204 | DEBUG    | __main__:trials:24 - Trial = 5926/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.205 | DEBUG    | __main__:trials:29 - Trial = 5926/30000 | Total reward = 44.64
2022-01-26 14:16:53.208 | DEBUG    | __main__:trials:24 - Trial = 5927/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.210 | DEBUG    | __main__:trials:29 - Trial = 5927/30000 | Total reward = 44.70
2022-01-26 14:16:53.214 | DEBUG    | __main__:trials:24 - Trial = 5928/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.214 | DEBUG    | __main__:trials:29 - Trial = 5928/30000 | Total reward = 34.70
2022-01-26 14:16:53.219 | DEBUG    | __main__:trials:24 - Trial = 5929/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.220 | DEBUG    | __main__:trials:29 - Trial = 5929/30000 | Total reward = 45.85
2022-01-26 14:16:53.224 | DEBUG    | __main__:trials:24 - Trial = 5930/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.225 | DEBUG    | __main__:trials:29 - Trial = 5930/30000 | Total reward = 38.51
2022-01-26 14:16:53.229 | DEBUG    | __main__:trials:24 - Trial = 5931/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.230 | DEBUG    | __main__:trials:29 - Trial = 5931/30000 | Total reward = 34.77
2022-01-26 14:16:53.234 | DEBUG    | __main__:trials:24 - Trial = 5932/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.236 | DEBUG    | __main__:trials:29 - Trial = 5932/30000 | Total reward = 49.14
2022-01-26 14:16:53.239 | DEBUG    | __main__:trials:24 - Trial = 5933/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.240 | DEBUG    | __main__:trials:29 - Trial = 5933/30000 | Total reward = 46.52
2022-01-26 14:16:53.244 | DEBUG    | __main__:trials:24 - Trial = 5934/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.246 | DEBUG    | __main__:trials:29 - Trial = 5934/30000 | Total reward = 48.78
2022-01-26 14:16:53.250 | DEBUG    | __main__:trials:24 - Trial = 5935/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.250 | DEBUG    | __main__:trials:29 - Trial = 5935/30000 | Total reward = 36.18
2022-01-26 14:16:53.254 | DEBUG    | __main__:trials:24 - Trial = 5936/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.255 | DEBUG    | __main__:trials:29 - Trial = 5936/30000 | Total reward = 45.32
2022-01-26 14:16:53.260 | DEBUG    | __main__:trials:24 - Trial = 5937/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.261 | DEBUG    | __main__:trials:29 - Trial = 5937/30000 | Total reward = 45.90
2022-01-26 14:16:53.265 | DEBUG    | __main__:trials:24 - Trial = 5938/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.266 | DEBUG    | __main__:trials:29 - Trial = 5938/30000 | Total reward = 45.48
2022-01-26 14:16:53.270 | DEBUG    | __main__:trials:24 - Trial = 5939/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.271 | DEBUG    | __main__:trials:29 - Trial = 5939/30000 | Total reward = 45.01
2022-01-26 14:16:53.275 | DEBUG    | __main__:trials:24 - Trial = 5940/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.276 | DEBUG    | __main__:trials:29 - Trial = 5940/30000 | Total reward = 46.70
2022-01-26 14:16:53.280 | DEBUG    | __main__:trials:24 - Trial = 5941/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.282 | DEBUG    | __main__:trials:29 - Trial = 5941/30000 | Total reward = 48.07
2022-01-26 14:16:53.285 | DEBUG    | __main__:trials:24 - Trial = 5942/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.287 | DEBUG    | __main__:trials:29 - Trial = 5942/30000 | Total reward = 40.07
2022-01-26 14:16:53.291 | DEBUG    | __main__:trials:24 - Trial = 5943/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.291 | DEBUG    | __main__:trials:29 - Trial = 5943/30000 | Total reward = 49.22
2022-01-26 14:16:53.295 | DEBUG    | __main__:trials:24 - Trial = 5944/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.297 | DEBUG    | __main__:trials:29 - Trial = 5944/30000 | Total reward = 29.37
2022-01-26 14:16:53.299 | DEBUG    | __main__:trials:24 - Trial = 5945/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.301 | DEBUG    | __main__:trials:29 - Trial = 5945/30000 | Total reward = 38.75
2022-01-26 14:16:53.304 | DEBUG    | __main__:trials:26 - Trial = 5946/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.306 | DEBUG    | __main__:trials:29 - Trial = 5946/30000 | Total reward = 36.22
2022-01-26 14:16:53.309 | DEBUG    | __main__:trials:24 - Trial = 5947/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.311 | DEBUG    | __main__:trials:29 - Trial = 5947/30000 | Total reward = 11.83
2022-01-26 14:16:53.314 | DEBUG    | __main__:trials:24 - Trial = 5948/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.316 | DEBUG    | __main__:trials:29 - Trial = 5948/30000 | Total reward = 51.04
2022-01-26 14:16:53.319 | DEBUG    | __main__:trials:24 - Trial = 5949/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.320 | DEBUG    | __main__:trials:29 - Trial = 5949/30000 | Total reward = 44.70
2022-01-26 14:16:53.324 | DEBUG    | __main__:trials:24 - Trial = 5950/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.325 | DEBUG    | __main__:trials:29 - Trial = 5950/30000 | Total reward = 45.87
2022-01-26 14:16:53.329 | DEBUG    | __main__:trials:24 - Trial = 5951/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.331 | DEBUG    | __main__:trials:29 - Trial = 5951/30000 | Total reward = 37.04
2022-01-26 14:16:53.333 | DEBUG    | __main__:trials:26 - Trial = 5952/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.334 | DEBUG    | __main__:trials:29 - Trial = 5952/30000 | Total reward = 25.46
2022-01-26 14:16:53.338 | DEBUG    | __main__:trials:24 - Trial = 5953/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.339 | DEBUG    | __main__:trials:29 - Trial = 5953/30000 | Total reward = 45.23
2022-01-26 14:16:53.343 | DEBUG    | __main__:trials:24 - Trial = 5954/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.343 | DEBUG    | __main__:trials:29 - Trial = 5954/30000 | Total reward = 48.71
2022-01-26 14:16:53.347 | DEBUG    | __main__:trials:24 - Trial = 5955/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.349 | DEBUG    | __main__:trials:29 - Trial = 5955/30000 | Total reward = 32.27
2022-01-26 14:16:53.351 | DEBUG    | __main__:trials:24 - Trial = 5956/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.353 | DEBUG    | __main__:trials:29 - Trial = 5956/30000 | Total reward = 46.02
2022-01-26 14:16:53.356 | DEBUG    | __main__:trials:24 - Trial = 5957/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.358 | DEBUG    | __main__:trials:29 - Trial = 5957/30000 | Total reward = 41.67
2022-01-26 14:16:53.362 | DEBUG    | __main__:trials:24 - Trial = 5958/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.363 | DEBUG    | __main__:trials:29 - Trial = 5958/30000 | Total reward = 30.92
2022-01-26 14:16:53.367 | DEBUG    | __main__:trials:24 - Trial = 5959/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.367 | DEBUG    | __main__:trials:29 - Trial = 5959/30000 | Total reward = 37.22
2022-01-26 14:16:53.371 | DEBUG    | __main__:trials:24 - Trial = 5960/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.372 | DEBUG    | __main__:trials:29 - Trial = 5960/30000 | Total reward = 42.93
2022-01-26 14:16:53.375 | DEBUG    | __main__:trials:24 - Trial = 5961/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.376 | DEBUG    | __main__:trials:29 - Trial = 5961/30000 | Total reward = 48.25
2022-01-26 14:16:53.380 | DEBUG    | __main__:trials:24 - Trial = 5962/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.381 | DEBUG    | __main__:trials:29 - Trial = 5962/30000 | Total reward = 36.62
2022-01-26 14:16:53.384 | DEBUG    | __main__:trials:24 - Trial = 5963/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.385 | DEBUG    | __main__:trials:29 - Trial = 5963/30000 | Total reward = 48.07
2022-01-26 14:16:53.388 | DEBUG    | __main__:trials:24 - Trial = 5964/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.390 | DEBUG    | __main__:trials:29 - Trial = 5964/30000 | Total reward = 47.54
2022-01-26 14:16:53.393 | DEBUG    | __main__:trials:24 - Trial = 5965/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.393 | DEBUG    | __main__:trials:29 - Trial = 5965/30000 | Total reward = 26.81
2022-01-26 14:16:53.397 | DEBUG    | __main__:trials:24 - Trial = 5966/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.398 | DEBUG    | __main__:trials:29 - Trial = 5966/30000 | Total reward = 50.49
2022-01-26 14:16:53.401 | DEBUG    | __main__:trials:24 - Trial = 5967/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.403 | DEBUG    | __main__:trials:29 - Trial = 5967/30000 | Total reward = 51.88
2022-01-26 14:16:53.406 | DEBUG    | __main__:trials:24 - Trial = 5968/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.407 | DEBUG    | __main__:trials:29 - Trial = 5968/30000 | Total reward = 44.07
2022-01-26 14:16:53.410 | DEBUG    | __main__:trials:24 - Trial = 5969/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.412 | DEBUG    | __main__:trials:29 - Trial = 5969/30000 | Total reward = 46.52
2022-01-26 14:16:53.416 | DEBUG    | __main__:trials:24 - Trial = 5970/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.417 | DEBUG    | __main__:trials:29 - Trial = 5970/30000 | Total reward = 43.18
2022-01-26 14:16:53.420 | DEBUG    | __main__:trials:24 - Trial = 5971/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.422 | DEBUG    | __main__:trials:29 - Trial = 5971/30000 | Total reward = 49.42
2022-01-26 14:16:53.425 | DEBUG    | __main__:trials:24 - Trial = 5972/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.426 | DEBUG    | __main__:trials:29 - Trial = 5972/30000 | Total reward = 54.10
2022-01-26 14:16:53.430 | DEBUG    | __main__:trials:24 - Trial = 5973/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.430 | DEBUG    | __main__:trials:29 - Trial = 5973/30000 | Total reward = 18.02
2022-01-26 14:16:53.434 | DEBUG    | __main__:trials:24 - Trial = 5974/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.436 | DEBUG    | __main__:trials:29 - Trial = 5974/30000 | Total reward = 40.53
2022-01-26 14:16:53.439 | DEBUG    | __main__:trials:24 - Trial = 5975/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.440 | DEBUG    | __main__:trials:29 - Trial = 5975/30000 | Total reward = 43.11
2022-01-26 14:16:53.444 | DEBUG    | __main__:trials:24 - Trial = 5976/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.446 | DEBUG    | __main__:trials:29 - Trial = 5976/30000 | Total reward = 44.53
2022-01-26 14:16:53.449 | DEBUG    | __main__:trials:24 - Trial = 5977/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.450 | DEBUG    | __main__:trials:29 - Trial = 5977/30000 | Total reward = 49.82
2022-01-26 14:16:53.454 | DEBUG    | __main__:trials:24 - Trial = 5978/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.455 | DEBUG    | __main__:trials:29 - Trial = 5978/30000 | Total reward = 46.70
2022-01-26 14:16:53.459 | DEBUG    | __main__:trials:24 - Trial = 5979/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.460 | DEBUG    | __main__:trials:29 - Trial = 5979/30000 | Total reward = 41.76
2022-01-26 14:16:53.463 | DEBUG    | __main__:trials:24 - Trial = 5980/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.465 | DEBUG    | __main__:trials:29 - Trial = 5980/30000 | Total reward = 38.24
2022-01-26 14:16:53.468 | DEBUG    | __main__:trials:24 - Trial = 5981/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.470 | DEBUG    | __main__:trials:29 - Trial = 5981/30000 | Total reward = 48.27
2022-01-26 14:16:53.473 | DEBUG    | __main__:trials:24 - Trial = 5982/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.475 | DEBUG    | __main__:trials:29 - Trial = 5982/30000 | Total reward = 46.80
2022-01-26 14:16:53.478 | DEBUG    | __main__:trials:24 - Trial = 5983/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.479 | DEBUG    | __main__:trials:29 - Trial = 5983/30000 | Total reward = 54.50
2022-01-26 14:16:53.482 | DEBUG    | __main__:trials:24 - Trial = 5984/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.484 | DEBUG    | __main__:trials:29 - Trial = 5984/30000 | Total reward = 44.64
2022-01-26 14:16:53.486 | DEBUG    | __main__:trials:24 - Trial = 5985/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.488 | DEBUG    | __main__:trials:29 - Trial = 5985/30000 | Total reward = 46.19
2022-01-26 14:16:53.491 | DEBUG    | __main__:trials:24 - Trial = 5986/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.493 | DEBUG    | __main__:trials:29 - Trial = 5986/30000 | Total reward = 49.24
2022-01-26 14:16:53.496 | DEBUG    | __main__:trials:24 - Trial = 5987/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.497 | DEBUG    | __main__:trials:29 - Trial = 5987/30000 | Total reward = 46.39
2022-01-26 14:16:53.500 | DEBUG    | __main__:trials:24 - Trial = 5988/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.502 | DEBUG    | __main__:trials:29 - Trial = 5988/30000 | Total reward = 38.98
2022-01-26 14:16:53.505 | DEBUG    | __main__:trials:24 - Trial = 5989/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.506 | DEBUG    | __main__:trials:29 - Trial = 5989/30000 | Total reward = 44.32
2022-01-26 14:16:53.510 | DEBUG    | __main__:trials:24 - Trial = 5990/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.512 | DEBUG    | __main__:trials:29 - Trial = 5990/30000 | Total reward = 47.51
2022-01-26 14:16:53.515 | DEBUG    | __main__:trials:24 - Trial = 5991/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.517 | DEBUG    | __main__:trials:29 - Trial = 5991/30000 | Total reward = 46.70
2022-01-26 14:16:53.520 | DEBUG    | __main__:trials:24 - Trial = 5992/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.522 | DEBUG    | __main__:trials:29 - Trial = 5992/30000 | Total reward = 46.42
2022-01-26 14:16:53.525 | DEBUG    | __main__:trials:24 - Trial = 5993/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.527 | DEBUG    | __main__:trials:29 - Trial = 5993/30000 | Total reward = 46.02
2022-01-26 14:16:53.530 | DEBUG    | __main__:trials:24 - Trial = 5994/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.532 | DEBUG    | __main__:trials:29 - Trial = 5994/30000 | Total reward = 40.81
2022-01-26 14:16:53.535 | DEBUG    | __main__:trials:24 - Trial = 5995/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.537 | DEBUG    | __main__:trials:29 - Trial = 5995/30000 | Total reward = 39.17
2022-01-26 14:16:53.539 | DEBUG    | __main__:trials:24 - Trial = 5996/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.541 | DEBUG    | __main__:trials:29 - Trial = 5996/30000 | Total reward = 46.19
2022-01-26 14:16:53.544 | DEBUG    | __main__:trials:24 - Trial = 5997/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.546 | DEBUG    | __main__:trials:29 - Trial = 5997/30000 | Total reward = 46.78
2022-01-26 14:16:53.550 | DEBUG    | __main__:trials:24 - Trial = 5998/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.551 | DEBUG    | __main__:trials:29 - Trial = 5998/30000 | Total reward = 49.24
2022-01-26 14:16:53.554 | DEBUG    | __main__:trials:24 - Trial = 5999/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.556 | DEBUG    | __main__:trials:29 - Trial = 5999/30000 | Total reward = 42.52
2022-01-26 14:16:53.559 | DEBUG    | __main__:trials:24 - Trial = 6000/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.561 | DEBUG    | __main__:trials:29 - Trial = 6000/30000 | Total reward = 37.02
2022-01-26 14:16:53.564 | DEBUG    | __main__:trials:24 - Trial = 6001/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.566 | DEBUG    | __main__:trials:29 - Trial = 6001/30000 | Total reward = 47.74
2022-01-26 14:16:53.568 | DEBUG    | __main__:trials:24 - Trial = 6002/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.570 | DEBUG    | __main__:trials:29 - Trial = 6002/30000 | Total reward = 42.90
2022-01-26 14:16:53.573 | DEBUG    | __main__:trials:24 - Trial = 6003/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.574 | DEBUG    | __main__:trials:29 - Trial = 6003/30000 | Total reward = 29.89
2022-01-26 14:16:53.579 | DEBUG    | __main__:trials:24 - Trial = 6004/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.581 | DEBUG    | __main__:trials:29 - Trial = 6004/30000 | Total reward = 46.57
2022-01-26 14:16:53.584 | DEBUG    | __main__:trials:26 - Trial = 6005/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.586 | DEBUG    | __main__:trials:29 - Trial = 6005/30000 | Total reward = 16.56
2022-01-26 14:16:53.589 | DEBUG    | __main__:trials:24 - Trial = 6006/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.590 | DEBUG    | __main__:trials:29 - Trial = 6006/30000 | Total reward = 45.50
2022-01-26 14:16:53.593 | DEBUG    | __main__:trials:24 - Trial = 6007/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.595 | DEBUG    | __main__:trials:29 - Trial = 6007/30000 | Total reward = 36.33
2022-01-26 14:16:53.598 | DEBUG    | __main__:trials:24 - Trial = 6008/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.600 | DEBUG    | __main__:trials:29 - Trial = 6008/30000 | Total reward = 56.43
2022-01-26 14:16:53.603 | DEBUG    | __main__:trials:24 - Trial = 6009/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.605 | DEBUG    | __main__:trials:29 - Trial = 6009/30000 | Total reward = 41.76
2022-01-26 14:16:53.608 | DEBUG    | __main__:trials:24 - Trial = 6010/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.610 | DEBUG    | __main__:trials:29 - Trial = 6010/30000 | Total reward = 35.14
2022-01-26 14:16:53.613 | DEBUG    | __main__:trials:24 - Trial = 6011/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.615 | DEBUG    | __main__:trials:29 - Trial = 6011/30000 | Total reward = 43.49
2022-01-26 14:16:53.618 | DEBUG    | __main__:trials:24 - Trial = 6012/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.620 | DEBUG    | __main__:trials:29 - Trial = 6012/30000 | Total reward = 44.90
2022-01-26 14:16:53.622 | DEBUG    | __main__:trials:24 - Trial = 6013/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.624 | DEBUG    | __main__:trials:29 - Trial = 6013/30000 | Total reward = 40.23
2022-01-26 14:16:53.628 | DEBUG    | __main__:trials:24 - Trial = 6014/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.629 | DEBUG    | __main__:trials:29 - Trial = 6014/30000 | Total reward = 46.70
2022-01-26 14:16:53.632 | DEBUG    | __main__:trials:24 - Trial = 6015/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.634 | DEBUG    | __main__:trials:29 - Trial = 6015/30000 | Total reward = 58.01
2022-01-26 14:16:53.638 | DEBUG    | __main__:trials:24 - Trial = 6016/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.639 | DEBUG    | __main__:trials:29 - Trial = 6016/30000 | Total reward = 45.90
2022-01-26 14:16:53.642 | DEBUG    | __main__:trials:24 - Trial = 6017/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.644 | DEBUG    | __main__:trials:29 - Trial = 6017/30000 | Total reward = 53.39
2022-01-26 14:16:53.648 | DEBUG    | __main__:trials:24 - Trial = 6018/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.650 | DEBUG    | __main__:trials:29 - Trial = 6018/30000 | Total reward = 54.52
2022-01-26 14:16:53.653 | DEBUG    | __main__:trials:24 - Trial = 6019/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.654 | DEBUG    | __main__:trials:29 - Trial = 6019/30000 | Total reward = 44.47
2022-01-26 14:16:53.658 | DEBUG    | __main__:trials:24 - Trial = 6020/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.660 | DEBUG    | __main__:trials:29 - Trial = 6020/30000 | Total reward = 41.46
2022-01-26 14:16:53.663 | DEBUG    | __main__:trials:24 - Trial = 6021/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.664 | DEBUG    | __main__:trials:29 - Trial = 6021/30000 | Total reward = 46.52
2022-01-26 14:16:53.668 | DEBUG    | __main__:trials:24 - Trial = 6022/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.669 | DEBUG    | __main__:trials:29 - Trial = 6022/30000 | Total reward = 45.73
2022-01-26 14:16:53.672 | DEBUG    | __main__:trials:24 - Trial = 6023/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.674 | DEBUG    | __main__:trials:29 - Trial = 6023/30000 | Total reward = 57.08
2022-01-26 14:16:53.678 | DEBUG    | __main__:trials:24 - Trial = 6024/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.679 | DEBUG    | __main__:trials:29 - Trial = 6024/30000 | Total reward = 51.42
2022-01-26 14:16:53.683 | DEBUG    | __main__:trials:24 - Trial = 6025/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.684 | DEBUG    | __main__:trials:29 - Trial = 6025/30000 | Total reward = 43.25
2022-01-26 14:16:53.688 | DEBUG    | __main__:trials:24 - Trial = 6026/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.689 | DEBUG    | __main__:trials:29 - Trial = 6026/30000 | Total reward = 60.26
2022-01-26 14:16:53.693 | DEBUG    | __main__:trials:24 - Trial = 6027/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.695 | DEBUG    | __main__:trials:29 - Trial = 6027/30000 | Total reward = 43.15
2022-01-26 14:16:53.698 | DEBUG    | __main__:trials:24 - Trial = 6028/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.700 | DEBUG    | __main__:trials:29 - Trial = 6028/30000 | Total reward = 57.65
2022-01-26 14:16:53.704 | DEBUG    | __main__:trials:24 - Trial = 6029/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.704 | DEBUG    | __main__:trials:29 - Trial = 6029/30000 | Total reward = 46.79
2022-01-26 14:16:53.708 | DEBUG    | __main__:trials:24 - Trial = 6030/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.710 | DEBUG    | __main__:trials:29 - Trial = 6030/30000 | Total reward = 44.02
2022-01-26 14:16:53.713 | DEBUG    | __main__:trials:24 - Trial = 6031/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.713 | DEBUG    | __main__:trials:29 - Trial = 6031/30000 | Total reward = 47.85
2022-01-26 14:16:53.718 | DEBUG    | __main__:trials:24 - Trial = 6032/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.719 | DEBUG    | __main__:trials:29 - Trial = 6032/30000 | Total reward = 45.99
2022-01-26 14:16:53.723 | DEBUG    | __main__:trials:24 - Trial = 6033/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.724 | DEBUG    | __main__:trials:29 - Trial = 6033/30000 | Total reward = 45.71
2022-01-26 14:16:53.727 | DEBUG    | __main__:trials:24 - Trial = 6034/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.729 | DEBUG    | __main__:trials:29 - Trial = 6034/30000 | Total reward = 33.78
2022-01-26 14:16:53.732 | DEBUG    | __main__:trials:24 - Trial = 6035/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.734 | DEBUG    | __main__:trials:29 - Trial = 6035/30000 | Total reward = 45.06
2022-01-26 14:16:53.737 | DEBUG    | __main__:trials:24 - Trial = 6036/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.738 | DEBUG    | __main__:trials:29 - Trial = 6036/30000 | Total reward = 45.50
2022-01-26 14:16:53.742 | DEBUG    | __main__:trials:24 - Trial = 6037/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.743 | DEBUG    | __main__:trials:29 - Trial = 6037/30000 | Total reward = 45.05
2022-01-26 14:16:53.748 | DEBUG    | __main__:trials:24 - Trial = 6038/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.749 | DEBUG    | __main__:trials:29 - Trial = 6038/30000 | Total reward = 22.87
2022-01-26 14:16:53.752 | DEBUG    | __main__:trials:24 - Trial = 6039/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.754 | DEBUG    | __main__:trials:29 - Trial = 6039/30000 | Total reward = 46.52
2022-01-26 14:16:53.757 | DEBUG    | __main__:trials:24 - Trial = 6040/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.759 | DEBUG    | __main__:trials:29 - Trial = 6040/30000 | Total reward = 44.72
2022-01-26 14:16:53.762 | DEBUG    | __main__:trials:24 - Trial = 6041/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.763 | DEBUG    | __main__:trials:29 - Trial = 6041/30000 | Total reward = 48.88
2022-01-26 14:16:53.767 | DEBUG    | __main__:trials:24 - Trial = 6042/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.768 | DEBUG    | __main__:trials:29 - Trial = 6042/30000 | Total reward = 41.52
2022-01-26 14:16:53.772 | DEBUG    | __main__:trials:24 - Trial = 6043/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.773 | DEBUG    | __main__:trials:29 - Trial = 6043/30000 | Total reward = 45.99
2022-01-26 14:16:53.776 | DEBUG    | __main__:trials:24 - Trial = 6044/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.777 | DEBUG    | __main__:trials:29 - Trial = 6044/30000 | Total reward = 46.10
2022-01-26 14:16:53.780 | DEBUG    | __main__:trials:24 - Trial = 6045/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.782 | DEBUG    | __main__:trials:29 - Trial = 6045/30000 | Total reward = 52.22
2022-01-26 14:16:53.785 | DEBUG    | __main__:trials:24 - Trial = 6046/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.787 | DEBUG    | __main__:trials:29 - Trial = 6046/30000 | Total reward = 46.52
2022-01-26 14:16:53.790 | DEBUG    | __main__:trials:24 - Trial = 6047/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.791 | DEBUG    | __main__:trials:29 - Trial = 6047/30000 | Total reward = 47.63
2022-01-26 14:16:53.795 | DEBUG    | __main__:trials:24 - Trial = 6048/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.796 | DEBUG    | __main__:trials:29 - Trial = 6048/30000 | Total reward = 38.12
2022-01-26 14:16:53.800 | DEBUG    | __main__:trials:24 - Trial = 6049/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.801 | DEBUG    | __main__:trials:29 - Trial = 6049/30000 | Total reward = 47.29
2022-01-26 14:16:53.805 | DEBUG    | __main__:trials:24 - Trial = 6050/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.806 | DEBUG    | __main__:trials:29 - Trial = 6050/30000 | Total reward = 49.27
2022-01-26 14:16:53.810 | DEBUG    | __main__:trials:24 - Trial = 6051/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.811 | DEBUG    | __main__:trials:29 - Trial = 6051/30000 | Total reward = 26.85
2022-01-26 14:16:53.815 | DEBUG    | __main__:trials:24 - Trial = 6052/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.817 | DEBUG    | __main__:trials:29 - Trial = 6052/30000 | Total reward = 43.59
2022-01-26 14:16:53.820 | DEBUG    | __main__:trials:24 - Trial = 6053/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.821 | DEBUG    | __main__:trials:29 - Trial = 6053/30000 | Total reward = 53.16
2022-01-26 14:16:53.824 | DEBUG    | __main__:trials:24 - Trial = 6054/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.826 | DEBUG    | __main__:trials:29 - Trial = 6054/30000 | Total reward = 43.12
2022-01-26 14:16:53.829 | DEBUG    | __main__:trials:24 - Trial = 6055/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.829 | DEBUG    | __main__:trials:29 - Trial = 6055/30000 | Total reward = 47.53
2022-01-26 14:16:53.834 | DEBUG    | __main__:trials:24 - Trial = 6056/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.835 | DEBUG    | __main__:trials:29 - Trial = 6056/30000 | Total reward = 50.08
2022-01-26 14:16:53.839 | DEBUG    | __main__:trials:24 - Trial = 6057/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.840 | DEBUG    | __main__:trials:29 - Trial = 6057/30000 | Total reward = 35.39
2022-01-26 14:16:53.844 | DEBUG    | __main__:trials:24 - Trial = 6058/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.845 | DEBUG    | __main__:trials:29 - Trial = 6058/30000 | Total reward = 39.86
2022-01-26 14:16:53.849 | DEBUG    | __main__:trials:24 - Trial = 6059/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.849 | DEBUG    | __main__:trials:29 - Trial = 6059/30000 | Total reward = 54.90
2022-01-26 14:16:53.852 | DEBUG    | __main__:trials:26 - Trial = 6060/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.853 | DEBUG    | __main__:trials:29 - Trial = 6060/30000 | Total reward = 12.90
2022-01-26 14:16:53.857 | DEBUG    | __main__:trials:24 - Trial = 6061/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.858 | DEBUG    | __main__:trials:29 - Trial = 6061/30000 | Total reward = 50.65
2022-01-26 14:16:53.861 | DEBUG    | __main__:trials:24 - Trial = 6062/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.862 | DEBUG    | __main__:trials:29 - Trial = 6062/30000 | Total reward = 46.52
2022-01-26 14:16:53.866 | DEBUG    | __main__:trials:24 - Trial = 6063/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.867 | DEBUG    | __main__:trials:29 - Trial = 6063/30000 | Total reward = 44.66
2022-01-26 14:16:53.870 | DEBUG    | __main__:trials:24 - Trial = 6064/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.872 | DEBUG    | __main__:trials:29 - Trial = 6064/30000 | Total reward = 34.88
2022-01-26 14:16:53.875 | DEBUG    | __main__:trials:24 - Trial = 6065/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.876 | DEBUG    | __main__:trials:29 - Trial = 6065/30000 | Total reward = 42.53
2022-01-26 14:16:53.879 | DEBUG    | __main__:trials:24 - Trial = 6066/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.881 | DEBUG    | __main__:trials:29 - Trial = 6066/30000 | Total reward = 45.13
2022-01-26 14:16:53.885 | DEBUG    | __main__:trials:24 - Trial = 6067/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.886 | DEBUG    | __main__:trials:29 - Trial = 6067/30000 | Total reward = 27.78
2022-01-26 14:16:53.890 | DEBUG    | __main__:trials:24 - Trial = 6068/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.891 | DEBUG    | __main__:trials:29 - Trial = 6068/30000 | Total reward = 42.82
2022-01-26 14:16:53.895 | DEBUG    | __main__:trials:24 - Trial = 6069/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.896 | DEBUG    | __main__:trials:29 - Trial = 6069/30000 | Total reward = 39.89
2022-01-26 14:16:53.900 | DEBUG    | __main__:trials:24 - Trial = 6070/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.902 | DEBUG    | __main__:trials:29 - Trial = 6070/30000 | Total reward = 27.91
2022-01-26 14:16:53.905 | DEBUG    | __main__:trials:26 - Trial = 6071/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.906 | DEBUG    | __main__:trials:29 - Trial = 6071/30000 | Total reward = 25.69
2022-01-26 14:16:53.910 | DEBUG    | __main__:trials:24 - Trial = 6072/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.912 | DEBUG    | __main__:trials:29 - Trial = 6072/30000 | Total reward = 65.11
2022-01-26 14:16:53.914 | DEBUG    | __main__:trials:24 - Trial = 6073/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.916 | DEBUG    | __main__:trials:29 - Trial = 6073/30000 | Total reward = 64.83
2022-01-26 14:16:53.920 | DEBUG    | __main__:trials:26 - Trial = 6074/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:53.921 | DEBUG    | __main__:trials:29 - Trial = 6074/30000 | Total reward = 15.72
2022-01-26 14:16:53.925 | DEBUG    | __main__:trials:24 - Trial = 6075/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.925 | DEBUG    | __main__:trials:29 - Trial = 6075/30000 | Total reward = 56.71
2022-01-26 14:16:53.930 | DEBUG    | __main__:trials:24 - Trial = 6076/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.931 | DEBUG    | __main__:trials:29 - Trial = 6076/30000 | Total reward = 50.44
2022-01-26 14:16:53.934 | DEBUG    | __main__:trials:24 - Trial = 6077/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.936 | DEBUG    | __main__:trials:29 - Trial = 6077/30000 | Total reward = 30.13
2022-01-26 14:16:53.939 | DEBUG    | __main__:trials:24 - Trial = 6078/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.940 | DEBUG    | __main__:trials:29 - Trial = 6078/30000 | Total reward = 44.06
2022-01-26 14:16:53.943 | DEBUG    | __main__:trials:24 - Trial = 6079/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.945 | DEBUG    | __main__:trials:29 - Trial = 6079/30000 | Total reward = 47.99
2022-01-26 14:16:53.948 | DEBUG    | __main__:trials:24 - Trial = 6080/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.950 | DEBUG    | __main__:trials:29 - Trial = 6080/30000 | Total reward = 50.00
2022-01-26 14:16:53.953 | DEBUG    | __main__:trials:24 - Trial = 6081/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.955 | DEBUG    | __main__:trials:29 - Trial = 6081/30000 | Total reward = 47.11
2022-01-26 14:16:53.958 | DEBUG    | __main__:trials:24 - Trial = 6082/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.959 | DEBUG    | __main__:trials:29 - Trial = 6082/30000 | Total reward = 49.88
2022-01-26 14:16:53.963 | DEBUG    | __main__:trials:24 - Trial = 6083/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.965 | DEBUG    | __main__:trials:29 - Trial = 6083/30000 | Total reward = 43.67
2022-01-26 14:16:53.968 | DEBUG    | __main__:trials:24 - Trial = 6084/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.970 | DEBUG    | __main__:trials:29 - Trial = 6084/30000 | Total reward = 47.05
2022-01-26 14:16:53.974 | DEBUG    | __main__:trials:24 - Trial = 6085/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.975 | DEBUG    | __main__:trials:29 - Trial = 6085/30000 | Total reward = 34.25
2022-01-26 14:16:53.978 | DEBUG    | __main__:trials:24 - Trial = 6086/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.979 | DEBUG    | __main__:trials:29 - Trial = 6086/30000 | Total reward = 52.79
2022-01-26 14:16:53.983 | DEBUG    | __main__:trials:24 - Trial = 6087/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.985 | DEBUG    | __main__:trials:29 - Trial = 6087/30000 | Total reward = 47.14
2022-01-26 14:16:53.988 | DEBUG    | __main__:trials:24 - Trial = 6088/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.989 | DEBUG    | __main__:trials:29 - Trial = 6088/30000 | Total reward = 40.48
2022-01-26 14:16:53.992 | DEBUG    | __main__:trials:24 - Trial = 6089/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.993 | DEBUG    | __main__:trials:29 - Trial = 6089/30000 | Total reward = 47.53
2022-01-26 14:16:53.997 | DEBUG    | __main__:trials:24 - Trial = 6090/30000 | Max number of steps (20) reached
2022-01-26 14:16:53.997 | DEBUG    | __main__:trials:29 - Trial = 6090/30000 | Total reward = 61.69
2022-01-26 14:16:54.001 | DEBUG    | __main__:trials:24 - Trial = 6091/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.001 | DEBUG    | __main__:trials:29 - Trial = 6091/30000 | Total reward = 48.38
2022-01-26 14:16:54.004 | DEBUG    | __main__:trials:24 - Trial = 6092/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.006 | DEBUG    | __main__:trials:29 - Trial = 6092/30000 | Total reward = 49.23
2022-01-26 14:16:54.009 | DEBUG    | __main__:trials:24 - Trial = 6093/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.010 | DEBUG    | __main__:trials:29 - Trial = 6093/30000 | Total reward = 37.24
2022-01-26 14:16:54.014 | DEBUG    | __main__:trials:24 - Trial = 6094/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.016 | DEBUG    | __main__:trials:29 - Trial = 6094/30000 | Total reward = 47.11
2022-01-26 14:16:54.019 | DEBUG    | __main__:trials:24 - Trial = 6095/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.021 | DEBUG    | __main__:trials:29 - Trial = 6095/30000 | Total reward = 29.19
2022-01-26 14:16:54.024 | DEBUG    | __main__:trials:24 - Trial = 6096/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.026 | DEBUG    | __main__:trials:29 - Trial = 6096/30000 | Total reward = 38.38
2022-01-26 14:16:54.029 | DEBUG    | __main__:trials:24 - Trial = 6097/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.031 | DEBUG    | __main__:trials:29 - Trial = 6097/30000 | Total reward = 46.52
2022-01-26 14:16:54.035 | DEBUG    | __main__:trials:24 - Trial = 6098/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.035 | DEBUG    | __main__:trials:29 - Trial = 6098/30000 | Total reward = 49.42
2022-01-26 14:16:54.039 | DEBUG    | __main__:trials:24 - Trial = 6099/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.040 | DEBUG    | __main__:trials:29 - Trial = 6099/30000 | Total reward = 45.58
2022-01-26 14:16:54.044 | DEBUG    | __main__:trials:24 - Trial = 6100/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.045 | DEBUG    | __main__:trials:29 - Trial = 6100/30000 | Total reward = 43.48
2022-01-26 14:16:54.049 | DEBUG    | __main__:trials:24 - Trial = 6101/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.050 | DEBUG    | __main__:trials:29 - Trial = 6101/30000 | Total reward = 42.82
2022-01-26 14:16:54.054 | DEBUG    | __main__:trials:24 - Trial = 6102/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.055 | DEBUG    | __main__:trials:29 - Trial = 6102/30000 | Total reward = 49.59
2022-01-26 14:16:54.060 | DEBUG    | __main__:trials:24 - Trial = 6103/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.061 | DEBUG    | __main__:trials:29 - Trial = 6103/30000 | Total reward = 54.20
2022-01-26 14:16:54.064 | DEBUG    | __main__:trials:26 - Trial = 6104/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.066 | DEBUG    | __main__:trials:29 - Trial = 6104/30000 | Total reward = 33.68
2022-01-26 14:16:54.069 | DEBUG    | __main__:trials:24 - Trial = 6105/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.071 | DEBUG    | __main__:trials:29 - Trial = 6105/30000 | Total reward = 26.64
2022-01-26 14:16:54.074 | DEBUG    | __main__:trials:24 - Trial = 6106/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.075 | DEBUG    | __main__:trials:29 - Trial = 6106/30000 | Total reward = 52.96
2022-01-26 14:16:54.079 | DEBUG    | __main__:trials:24 - Trial = 6107/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.080 | DEBUG    | __main__:trials:29 - Trial = 6107/30000 | Total reward = 46.75
2022-01-26 14:16:54.083 | DEBUG    | __main__:trials:24 - Trial = 6108/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.085 | DEBUG    | __main__:trials:29 - Trial = 6108/30000 | Total reward = 44.03
2022-01-26 14:16:54.089 | DEBUG    | __main__:trials:24 - Trial = 6109/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.090 | DEBUG    | __main__:trials:29 - Trial = 6109/30000 | Total reward = 53.87
2022-01-26 14:16:54.093 | DEBUG    | __main__:trials:24 - Trial = 6110/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.094 | DEBUG    | __main__:trials:29 - Trial = 6110/30000 | Total reward = 49.06
2022-01-26 14:16:54.097 | DEBUG    | __main__:trials:24 - Trial = 6111/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.099 | DEBUG    | __main__:trials:29 - Trial = 6111/30000 | Total reward = 46.52
2022-01-26 14:16:54.102 | DEBUG    | __main__:trials:24 - Trial = 6112/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.103 | DEBUG    | __main__:trials:29 - Trial = 6112/30000 | Total reward = 21.48
2022-01-26 14:16:54.107 | DEBUG    | __main__:trials:24 - Trial = 6113/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.107 | DEBUG    | __main__:trials:29 - Trial = 6113/30000 | Total reward = 50.30
2022-01-26 14:16:54.111 | DEBUG    | __main__:trials:26 - Trial = 6114/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.112 | DEBUG    | __main__:trials:29 - Trial = 6114/30000 | Total reward = 20.73
2022-01-26 14:16:54.116 | DEBUG    | __main__:trials:24 - Trial = 6115/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.116 | DEBUG    | __main__:trials:29 - Trial = 6115/30000 | Total reward = 46.19
2022-01-26 14:16:54.121 | DEBUG    | __main__:trials:24 - Trial = 6116/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.122 | DEBUG    | __main__:trials:29 - Trial = 6116/30000 | Total reward = 44.87
2022-01-26 14:16:54.126 | DEBUG    | __main__:trials:24 - Trial = 6117/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.127 | DEBUG    | __main__:trials:29 - Trial = 6117/30000 | Total reward = 46.70
2022-01-26 14:16:54.130 | DEBUG    | __main__:trials:24 - Trial = 6118/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.132 | DEBUG    | __main__:trials:29 - Trial = 6118/30000 | Total reward = 46.19
2022-01-26 14:16:54.135 | DEBUG    | __main__:trials:24 - Trial = 6119/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.136 | DEBUG    | __main__:trials:29 - Trial = 6119/30000 | Total reward = 46.88
2022-01-26 14:16:54.140 | DEBUG    | __main__:trials:24 - Trial = 6120/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.142 | DEBUG    | __main__:trials:29 - Trial = 6120/30000 | Total reward = 51.08
2022-01-26 14:16:54.144 | DEBUG    | __main__:trials:26 - Trial = 6121/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.146 | DEBUG    | __main__:trials:29 - Trial = 6121/30000 | Total reward = 10.18
2022-01-26 14:16:54.149 | DEBUG    | __main__:trials:24 - Trial = 6122/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.151 | DEBUG    | __main__:trials:29 - Trial = 6122/30000 | Total reward = 44.54
2022-01-26 14:16:54.154 | DEBUG    | __main__:trials:24 - Trial = 6123/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.155 | DEBUG    | __main__:trials:29 - Trial = 6123/30000 | Total reward = 40.30
2022-01-26 14:16:54.158 | DEBUG    | __main__:trials:26 - Trial = 6124/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.159 | DEBUG    | __main__:trials:29 - Trial = 6124/30000 | Total reward = 21.18
2022-01-26 14:16:54.163 | DEBUG    | __main__:trials:24 - Trial = 6125/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.165 | DEBUG    | __main__:trials:29 - Trial = 6125/30000 | Total reward = 44.68
2022-01-26 14:16:54.168 | DEBUG    | __main__:trials:24 - Trial = 6126/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.169 | DEBUG    | __main__:trials:29 - Trial = 6126/30000 | Total reward = 49.33
2022-01-26 14:16:54.172 | DEBUG    | __main__:trials:24 - Trial = 6127/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.174 | DEBUG    | __main__:trials:29 - Trial = 6127/30000 | Total reward = 47.00
2022-01-26 14:16:54.177 | DEBUG    | __main__:trials:24 - Trial = 6128/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.178 | DEBUG    | __main__:trials:29 - Trial = 6128/30000 | Total reward = 49.94
2022-01-26 14:16:54.181 | DEBUG    | __main__:trials:24 - Trial = 6129/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.183 | DEBUG    | __main__:trials:29 - Trial = 6129/30000 | Total reward = 46.76
2022-01-26 14:16:54.186 | DEBUG    | __main__:trials:24 - Trial = 6130/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.188 | DEBUG    | __main__:trials:29 - Trial = 6130/30000 | Total reward = 48.55
2022-01-26 14:16:54.191 | DEBUG    | __main__:trials:24 - Trial = 6131/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.193 | DEBUG    | __main__:trials:29 - Trial = 6131/30000 | Total reward = 48.11
2022-01-26 14:16:54.196 | DEBUG    | __main__:trials:24 - Trial = 6132/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.197 | DEBUG    | __main__:trials:29 - Trial = 6132/30000 | Total reward = 46.01
2022-01-26 14:16:54.200 | DEBUG    | __main__:trials:24 - Trial = 6133/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.201 | DEBUG    | __main__:trials:29 - Trial = 6133/30000 | Total reward = 46.68
2022-01-26 14:16:54.204 | DEBUG    | __main__:trials:24 - Trial = 6134/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.206 | DEBUG    | __main__:trials:29 - Trial = 6134/30000 | Total reward = 45.26
2022-01-26 14:16:54.209 | DEBUG    | __main__:trials:24 - Trial = 6135/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.211 | DEBUG    | __main__:trials:29 - Trial = 6135/30000 | Total reward = 35.54
2022-01-26 14:16:54.214 | DEBUG    | __main__:trials:24 - Trial = 6136/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.215 | DEBUG    | __main__:trials:29 - Trial = 6136/30000 | Total reward = 44.54
2022-01-26 14:16:54.218 | DEBUG    | __main__:trials:24 - Trial = 6137/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.220 | DEBUG    | __main__:trials:29 - Trial = 6137/30000 | Total reward = 24.22
2022-01-26 14:16:54.224 | DEBUG    | __main__:trials:24 - Trial = 6138/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.224 | DEBUG    | __main__:trials:29 - Trial = 6138/30000 | Total reward = 35.14
2022-01-26 14:16:54.228 | DEBUG    | __main__:trials:24 - Trial = 6139/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.230 | DEBUG    | __main__:trials:29 - Trial = 6139/30000 | Total reward = 52.98
2022-01-26 14:16:54.233 | DEBUG    | __main__:trials:24 - Trial = 6140/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.235 | DEBUG    | __main__:trials:29 - Trial = 6140/30000 | Total reward = 47.79
2022-01-26 14:16:54.238 | DEBUG    | __main__:trials:24 - Trial = 6141/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.239 | DEBUG    | __main__:trials:29 - Trial = 6141/30000 | Total reward = 44.92
2022-01-26 14:16:54.243 | DEBUG    | __main__:trials:24 - Trial = 6142/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.245 | DEBUG    | __main__:trials:29 - Trial = 6142/30000 | Total reward = 45.69
2022-01-26 14:16:54.249 | DEBUG    | __main__:trials:24 - Trial = 6143/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.249 | DEBUG    | __main__:trials:29 - Trial = 6143/30000 | Total reward = 52.48
2022-01-26 14:16:54.254 | DEBUG    | __main__:trials:24 - Trial = 6144/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.254 | DEBUG    | __main__:trials:29 - Trial = 6144/30000 | Total reward = 25.75
2022-01-26 14:16:54.259 | DEBUG    | __main__:trials:24 - Trial = 6145/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.260 | DEBUG    | __main__:trials:29 - Trial = 6145/30000 | Total reward = 48.57
2022-01-26 14:16:54.263 | DEBUG    | __main__:trials:24 - Trial = 6146/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.265 | DEBUG    | __main__:trials:29 - Trial = 6146/30000 | Total reward = 44.02
2022-01-26 14:16:54.268 | DEBUG    | __main__:trials:24 - Trial = 6147/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.270 | DEBUG    | __main__:trials:29 - Trial = 6147/30000 | Total reward = 36.41
2022-01-26 14:16:54.273 | DEBUG    | __main__:trials:24 - Trial = 6148/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.273 | DEBUG    | __main__:trials:29 - Trial = 6148/30000 | Total reward = 45.20
2022-01-26 14:16:54.277 | DEBUG    | __main__:trials:24 - Trial = 6149/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.278 | DEBUG    | __main__:trials:29 - Trial = 6149/30000 | Total reward = 34.48
2022-01-26 14:16:54.281 | DEBUG    | __main__:trials:24 - Trial = 6150/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.282 | DEBUG    | __main__:trials:29 - Trial = 6150/30000 | Total reward = 49.26
2022-01-26 14:16:54.285 | DEBUG    | __main__:trials:26 - Trial = 6151/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.286 | DEBUG    | __main__:trials:29 - Trial = 6151/30000 | Total reward = 22.04
2022-01-26 14:16:54.290 | DEBUG    | __main__:trials:24 - Trial = 6152/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.292 | DEBUG    | __main__:trials:29 - Trial = 6152/30000 | Total reward = 34.44
2022-01-26 14:16:54.296 | DEBUG    | __main__:trials:24 - Trial = 6153/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.297 | DEBUG    | __main__:trials:29 - Trial = 6153/30000 | Total reward = 45.94
2022-01-26 14:16:54.301 | DEBUG    | __main__:trials:24 - Trial = 6154/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.302 | DEBUG    | __main__:trials:29 - Trial = 6154/30000 | Total reward = 46.52
2022-01-26 14:16:54.305 | DEBUG    | __main__:trials:26 - Trial = 6155/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.307 | DEBUG    | __main__:trials:29 - Trial = 6155/30000 | Total reward = 14.41
2022-01-26 14:16:54.310 | DEBUG    | __main__:trials:24 - Trial = 6156/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.311 | DEBUG    | __main__:trials:29 - Trial = 6156/30000 | Total reward = 43.70
2022-01-26 14:16:54.315 | DEBUG    | __main__:trials:24 - Trial = 6157/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.317 | DEBUG    | __main__:trials:29 - Trial = 6157/30000 | Total reward = 43.49
2022-01-26 14:16:54.320 | DEBUG    | __main__:trials:24 - Trial = 6158/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.321 | DEBUG    | __main__:trials:29 - Trial = 6158/30000 | Total reward = 44.91
2022-01-26 14:16:54.325 | DEBUG    | __main__:trials:24 - Trial = 6159/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.326 | DEBUG    | __main__:trials:29 - Trial = 6159/30000 | Total reward = 47.82
2022-01-26 14:16:54.330 | DEBUG    | __main__:trials:24 - Trial = 6160/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.332 | DEBUG    | __main__:trials:29 - Trial = 6160/30000 | Total reward = 53.36
2022-01-26 14:16:54.335 | DEBUG    | __main__:trials:24 - Trial = 6161/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.336 | DEBUG    | __main__:trials:29 - Trial = 6161/30000 | Total reward = 46.52
2022-01-26 14:16:54.341 | DEBUG    | __main__:trials:24 - Trial = 6162/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.342 | DEBUG    | __main__:trials:29 - Trial = 6162/30000 | Total reward = 49.26
2022-01-26 14:16:54.346 | DEBUG    | __main__:trials:24 - Trial = 6163/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.347 | DEBUG    | __main__:trials:29 - Trial = 6163/30000 | Total reward = 34.12
2022-01-26 14:16:54.351 | DEBUG    | __main__:trials:24 - Trial = 6164/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.352 | DEBUG    | __main__:trials:29 - Trial = 6164/30000 | Total reward = 42.88
2022-01-26 14:16:54.356 | DEBUG    | __main__:trials:24 - Trial = 6165/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.358 | DEBUG    | __main__:trials:29 - Trial = 6165/30000 | Total reward = 42.88
2022-01-26 14:16:54.361 | DEBUG    | __main__:trials:24 - Trial = 6166/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.363 | DEBUG    | __main__:trials:29 - Trial = 6166/30000 | Total reward = 43.48
2022-01-26 14:16:54.366 | DEBUG    | __main__:trials:24 - Trial = 6167/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.368 | DEBUG    | __main__:trials:29 - Trial = 6167/30000 | Total reward = 47.67
2022-01-26 14:16:54.372 | DEBUG    | __main__:trials:24 - Trial = 6168/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.373 | DEBUG    | __main__:trials:29 - Trial = 6168/30000 | Total reward = 34.05
2022-01-26 14:16:54.376 | DEBUG    | __main__:trials:24 - Trial = 6169/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.377 | DEBUG    | __main__:trials:29 - Trial = 6169/30000 | Total reward = 46.52
2022-01-26 14:16:54.380 | DEBUG    | __main__:trials:24 - Trial = 6170/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.382 | DEBUG    | __main__:trials:29 - Trial = 6170/30000 | Total reward = 56.49
2022-01-26 14:16:54.385 | DEBUG    | __main__:trials:24 - Trial = 6171/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.385 | DEBUG    | __main__:trials:29 - Trial = 6171/30000 | Total reward = 62.66
2022-01-26 14:16:54.390 | DEBUG    | __main__:trials:24 - Trial = 6172/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.391 | DEBUG    | __main__:trials:29 - Trial = 6172/30000 | Total reward = 46.77
2022-01-26 14:16:54.395 | DEBUG    | __main__:trials:24 - Trial = 6173/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.396 | DEBUG    | __main__:trials:29 - Trial = 6173/30000 | Total reward = 47.61
2022-01-26 14:16:54.399 | DEBUG    | __main__:trials:24 - Trial = 6174/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.401 | DEBUG    | __main__:trials:29 - Trial = 6174/30000 | Total reward = 44.63
2022-01-26 14:16:54.404 | DEBUG    | __main__:trials:24 - Trial = 6175/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.406 | DEBUG    | __main__:trials:29 - Trial = 6175/30000 | Total reward = 45.86
2022-01-26 14:16:54.409 | DEBUG    | __main__:trials:24 - Trial = 6176/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.411 | DEBUG    | __main__:trials:29 - Trial = 6176/30000 | Total reward = 49.61
2022-01-26 14:16:54.415 | DEBUG    | __main__:trials:24 - Trial = 6177/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.415 | DEBUG    | __main__:trials:29 - Trial = 6177/30000 | Total reward = 44.17
2022-01-26 14:16:54.420 | DEBUG    | __main__:trials:24 - Trial = 6178/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.421 | DEBUG    | __main__:trials:29 - Trial = 6178/30000 | Total reward = 48.74
2022-01-26 14:16:54.424 | DEBUG    | __main__:trials:26 - Trial = 6179/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.425 | DEBUG    | __main__:trials:29 - Trial = 6179/30000 | Total reward = 14.54
2022-01-26 14:16:54.429 | DEBUG    | __main__:trials:24 - Trial = 6180/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.431 | DEBUG    | __main__:trials:29 - Trial = 6180/30000 | Total reward = 44.31
2022-01-26 14:16:54.435 | DEBUG    | __main__:trials:24 - Trial = 6181/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.436 | DEBUG    | __main__:trials:29 - Trial = 6181/30000 | Total reward = 46.92
2022-01-26 14:16:54.440 | DEBUG    | __main__:trials:24 - Trial = 6182/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.441 | DEBUG    | __main__:trials:29 - Trial = 6182/30000 | Total reward = 47.29
2022-01-26 14:16:54.445 | DEBUG    | __main__:trials:24 - Trial = 6183/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.446 | DEBUG    | __main__:trials:29 - Trial = 6183/30000 | Total reward = 36.35
2022-01-26 14:16:54.450 | DEBUG    | __main__:trials:24 - Trial = 6184/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.451 | DEBUG    | __main__:trials:29 - Trial = 6184/30000 | Total reward = 48.25
2022-01-26 14:16:54.454 | DEBUG    | __main__:trials:24 - Trial = 6185/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.456 | DEBUG    | __main__:trials:29 - Trial = 6185/30000 | Total reward = 48.32
2022-01-26 14:16:54.459 | DEBUG    | __main__:trials:24 - Trial = 6186/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.461 | DEBUG    | __main__:trials:29 - Trial = 6186/30000 | Total reward = 48.40
2022-01-26 14:16:54.464 | DEBUG    | __main__:trials:24 - Trial = 6187/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.466 | DEBUG    | __main__:trials:29 - Trial = 6187/30000 | Total reward = 45.94
2022-01-26 14:16:54.469 | DEBUG    | __main__:trials:26 - Trial = 6188/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.470 | DEBUG    | __main__:trials:29 - Trial = 6188/30000 | Total reward = 26.67
2022-01-26 14:16:54.474 | DEBUG    | __main__:trials:24 - Trial = 6189/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.475 | DEBUG    | __main__:trials:29 - Trial = 6189/30000 | Total reward = 45.30
2022-01-26 14:16:54.480 | DEBUG    | __main__:trials:24 - Trial = 6190/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.481 | DEBUG    | __main__:trials:29 - Trial = 6190/30000 | Total reward = 29.85
2022-01-26 14:16:54.485 | DEBUG    | __main__:trials:24 - Trial = 6191/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.486 | DEBUG    | __main__:trials:29 - Trial = 6191/30000 | Total reward = 48.84
2022-01-26 14:16:54.489 | DEBUG    | __main__:trials:24 - Trial = 6192/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.491 | DEBUG    | __main__:trials:29 - Trial = 6192/30000 | Total reward = 42.37
2022-01-26 14:16:54.493 | DEBUG    | __main__:trials:24 - Trial = 6193/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.495 | DEBUG    | __main__:trials:29 - Trial = 6193/30000 | Total reward = 26.17
2022-01-26 14:16:54.499 | DEBUG    | __main__:trials:24 - Trial = 6194/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.500 | DEBUG    | __main__:trials:29 - Trial = 6194/30000 | Total reward = 42.56
2022-01-26 14:16:54.503 | DEBUG    | __main__:trials:24 - Trial = 6195/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.505 | DEBUG    | __main__:trials:29 - Trial = 6195/30000 | Total reward = 38.10
2022-01-26 14:16:54.508 | DEBUG    | __main__:trials:24 - Trial = 6196/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.509 | DEBUG    | __main__:trials:29 - Trial = 6196/30000 | Total reward = 50.12
2022-01-26 14:16:54.513 | DEBUG    | __main__:trials:24 - Trial = 6197/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.514 | DEBUG    | __main__:trials:29 - Trial = 6197/30000 | Total reward = 50.61
2022-01-26 14:16:54.518 | DEBUG    | __main__:trials:24 - Trial = 6198/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.519 | DEBUG    | __main__:trials:29 - Trial = 6198/30000 | Total reward = 48.26
2022-01-26 14:16:54.523 | DEBUG    | __main__:trials:24 - Trial = 6199/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.524 | DEBUG    | __main__:trials:29 - Trial = 6199/30000 | Total reward = 29.71
2022-01-26 14:16:54.527 | DEBUG    | __main__:trials:24 - Trial = 6200/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.529 | DEBUG    | __main__:trials:29 - Trial = 6200/30000 | Total reward = 48.38
2022-01-26 14:16:54.532 | DEBUG    | __main__:trials:24 - Trial = 6201/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.534 | DEBUG    | __main__:trials:29 - Trial = 6201/30000 | Total reward = 42.35
2022-01-26 14:16:54.537 | DEBUG    | __main__:trials:24 - Trial = 6202/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.539 | DEBUG    | __main__:trials:29 - Trial = 6202/30000 | Total reward = 49.50
2022-01-26 14:16:54.542 | DEBUG    | __main__:trials:24 - Trial = 6203/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.544 | DEBUG    | __main__:trials:29 - Trial = 6203/30000 | Total reward = 50.19
2022-01-26 14:16:54.547 | DEBUG    | __main__:trials:24 - Trial = 6204/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.548 | DEBUG    | __main__:trials:29 - Trial = 6204/30000 | Total reward = 49.45
2022-01-26 14:16:54.552 | DEBUG    | __main__:trials:24 - Trial = 6205/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.554 | DEBUG    | __main__:trials:29 - Trial = 6205/30000 | Total reward = 39.31
2022-01-26 14:16:54.557 | DEBUG    | __main__:trials:24 - Trial = 6206/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.558 | DEBUG    | __main__:trials:29 - Trial = 6206/30000 | Total reward = 48.60
2022-01-26 14:16:54.562 | DEBUG    | __main__:trials:24 - Trial = 6207/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.564 | DEBUG    | __main__:trials:29 - Trial = 6207/30000 | Total reward = 48.98
2022-01-26 14:16:54.567 | DEBUG    | __main__:trials:24 - Trial = 6208/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.569 | DEBUG    | __main__:trials:29 - Trial = 6208/30000 | Total reward = 48.61
2022-01-26 14:16:54.572 | DEBUG    | __main__:trials:24 - Trial = 6209/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.574 | DEBUG    | __main__:trials:29 - Trial = 6209/30000 | Total reward = 20.06
2022-01-26 14:16:54.577 | DEBUG    | __main__:trials:24 - Trial = 6210/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.578 | DEBUG    | __main__:trials:29 - Trial = 6210/30000 | Total reward = 49.97
2022-01-26 14:16:54.581 | DEBUG    | __main__:trials:24 - Trial = 6211/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.582 | DEBUG    | __main__:trials:29 - Trial = 6211/30000 | Total reward = 49.41
2022-01-26 14:16:54.586 | DEBUG    | __main__:trials:24 - Trial = 6212/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.588 | DEBUG    | __main__:trials:29 - Trial = 6212/30000 | Total reward = 49.38
2022-01-26 14:16:54.591 | DEBUG    | __main__:trials:24 - Trial = 6213/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.593 | DEBUG    | __main__:trials:29 - Trial = 6213/30000 | Total reward = 20.07
2022-01-26 14:16:54.596 | DEBUG    | __main__:trials:24 - Trial = 6214/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.597 | DEBUG    | __main__:trials:29 - Trial = 6214/30000 | Total reward = 19.67
2022-01-26 14:16:54.601 | DEBUG    | __main__:trials:24 - Trial = 6215/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.602 | DEBUG    | __main__:trials:29 - Trial = 6215/30000 | Total reward = 49.76
2022-01-26 14:16:54.606 | DEBUG    | __main__:trials:24 - Trial = 6216/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.607 | DEBUG    | __main__:trials:29 - Trial = 6216/30000 | Total reward = 48.26
2022-01-26 14:16:54.610 | DEBUG    | __main__:trials:24 - Trial = 6217/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.612 | DEBUG    | __main__:trials:29 - Trial = 6217/30000 | Total reward = 52.48
2022-01-26 14:16:54.616 | DEBUG    | __main__:trials:24 - Trial = 6218/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.616 | DEBUG    | __main__:trials:29 - Trial = 6218/30000 | Total reward = 47.13
2022-01-26 14:16:54.620 | DEBUG    | __main__:trials:24 - Trial = 6219/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.622 | DEBUG    | __main__:trials:29 - Trial = 6219/30000 | Total reward = 48.49
2022-01-26 14:16:54.625 | DEBUG    | __main__:trials:24 - Trial = 6220/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.627 | DEBUG    | __main__:trials:29 - Trial = 6220/30000 | Total reward = 41.67
2022-01-26 14:16:54.631 | DEBUG    | __main__:trials:24 - Trial = 6221/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.631 | DEBUG    | __main__:trials:29 - Trial = 6221/30000 | Total reward = 49.44
2022-01-26 14:16:54.636 | DEBUG    | __main__:trials:24 - Trial = 6222/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.636 | DEBUG    | __main__:trials:29 - Trial = 6222/30000 | Total reward = 56.17
2022-01-26 14:16:54.641 | DEBUG    | __main__:trials:24 - Trial = 6223/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.641 | DEBUG    | __main__:trials:29 - Trial = 6223/30000 | Total reward = 46.65
2022-01-26 14:16:54.644 | DEBUG    | __main__:trials:24 - Trial = 6224/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.646 | DEBUG    | __main__:trials:29 - Trial = 6224/30000 | Total reward = 48.43
2022-01-26 14:16:54.649 | DEBUG    | __main__:trials:24 - Trial = 6225/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.649 | DEBUG    | __main__:trials:29 - Trial = 6225/30000 | Total reward = 49.99
2022-01-26 14:16:54.653 | DEBUG    | __main__:trials:24 - Trial = 6226/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.654 | DEBUG    | __main__:trials:29 - Trial = 6226/30000 | Total reward = 46.33
2022-01-26 14:16:54.658 | DEBUG    | __main__:trials:24 - Trial = 6227/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.659 | DEBUG    | __main__:trials:29 - Trial = 6227/30000 | Total reward = 43.92
2022-01-26 14:16:54.662 | DEBUG    | __main__:trials:24 - Trial = 6228/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.664 | DEBUG    | __main__:trials:29 - Trial = 6228/30000 | Total reward = 49.37
2022-01-26 14:16:54.667 | DEBUG    | __main__:trials:24 - Trial = 6229/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.667 | DEBUG    | __main__:trials:29 - Trial = 6229/30000 | Total reward = 52.37
2022-01-26 14:16:54.671 | DEBUG    | __main__:trials:24 - Trial = 6230/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.671 | DEBUG    | __main__:trials:29 - Trial = 6230/30000 | Total reward = 49.56
2022-01-26 14:16:54.676 | DEBUG    | __main__:trials:24 - Trial = 6231/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.677 | DEBUG    | __main__:trials:29 - Trial = 6231/30000 | Total reward = 48.61
2022-01-26 14:16:54.681 | DEBUG    | __main__:trials:24 - Trial = 6232/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.682 | DEBUG    | __main__:trials:29 - Trial = 6232/30000 | Total reward = 45.33
2022-01-26 14:16:54.686 | DEBUG    | __main__:trials:24 - Trial = 6233/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.687 | DEBUG    | __main__:trials:29 - Trial = 6233/30000 | Total reward = 44.98
2022-01-26 14:16:54.691 | DEBUG    | __main__:trials:24 - Trial = 6234/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.692 | DEBUG    | __main__:trials:29 - Trial = 6234/30000 | Total reward = 39.82
2022-01-26 14:16:54.695 | DEBUG    | __main__:trials:24 - Trial = 6235/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.697 | DEBUG    | __main__:trials:29 - Trial = 6235/30000 | Total reward = 40.98
2022-01-26 14:16:54.700 | DEBUG    | __main__:trials:24 - Trial = 6236/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.701 | DEBUG    | __main__:trials:29 - Trial = 6236/30000 | Total reward = 45.79
2022-01-26 14:16:54.705 | DEBUG    | __main__:trials:24 - Trial = 6237/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.707 | DEBUG    | __main__:trials:29 - Trial = 6237/30000 | Total reward = 49.72
2022-01-26 14:16:54.709 | DEBUG    | __main__:trials:24 - Trial = 6238/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.711 | DEBUG    | __main__:trials:29 - Trial = 6238/30000 | Total reward = 47.11
2022-01-26 14:16:54.714 | DEBUG    | __main__:trials:24 - Trial = 6239/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.716 | DEBUG    | __main__:trials:29 - Trial = 6239/30000 | Total reward = 50.19
2022-01-26 14:16:54.717 | DEBUG    | __main__:trials:26 - Trial = 6240/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:54.719 | DEBUG    | __main__:trials:29 - Trial = 6240/30000 | Total reward = 11.37
2022-01-26 14:16:54.723 | DEBUG    | __main__:trials:24 - Trial = 6241/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.723 | DEBUG    | __main__:trials:29 - Trial = 6241/30000 | Total reward = 49.11
2022-01-26 14:16:54.728 | DEBUG    | __main__:trials:24 - Trial = 6242/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.728 | DEBUG    | __main__:trials:29 - Trial = 6242/30000 | Total reward = 34.37
2022-01-26 14:16:54.733 | DEBUG    | __main__:trials:24 - Trial = 6243/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.734 | DEBUG    | __main__:trials:29 - Trial = 6243/30000 | Total reward = 49.10
2022-01-26 14:16:54.738 | DEBUG    | __main__:trials:24 - Trial = 6244/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.740 | DEBUG    | __main__:trials:29 - Trial = 6244/30000 | Total reward = 51.82
2022-01-26 14:16:54.743 | DEBUG    | __main__:trials:24 - Trial = 6245/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.744 | DEBUG    | __main__:trials:29 - Trial = 6245/30000 | Total reward = 34.79
2022-01-26 14:16:54.748 | DEBUG    | __main__:trials:24 - Trial = 6246/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.749 | DEBUG    | __main__:trials:29 - Trial = 6246/30000 | Total reward = 49.40
2022-01-26 14:16:54.752 | DEBUG    | __main__:trials:24 - Trial = 6247/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.753 | DEBUG    | __main__:trials:29 - Trial = 6247/30000 | Total reward = 28.92
2022-01-26 14:16:54.756 | DEBUG    | __main__:trials:24 - Trial = 6248/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.758 | DEBUG    | __main__:trials:29 - Trial = 6248/30000 | Total reward = 43.89
2022-01-26 14:16:54.761 | DEBUG    | __main__:trials:24 - Trial = 6249/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.763 | DEBUG    | __main__:trials:29 - Trial = 6249/30000 | Total reward = 49.32
2022-01-26 14:16:54.766 | DEBUG    | __main__:trials:24 - Trial = 6250/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.767 | DEBUG    | __main__:trials:29 - Trial = 6250/30000 | Total reward = 47.13
2022-01-26 14:16:54.771 | DEBUG    | __main__:trials:24 - Trial = 6251/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.772 | DEBUG    | __main__:trials:29 - Trial = 6251/30000 | Total reward = 46.54
2022-01-26 14:16:54.776 | DEBUG    | __main__:trials:24 - Trial = 6252/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.777 | DEBUG    | __main__:trials:29 - Trial = 6252/30000 | Total reward = 37.73
2022-01-26 14:16:54.781 | DEBUG    | __main__:trials:24 - Trial = 6253/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.782 | DEBUG    | __main__:trials:29 - Trial = 6253/30000 | Total reward = 49.92
2022-01-26 14:16:54.786 | DEBUG    | __main__:trials:24 - Trial = 6254/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.787 | DEBUG    | __main__:trials:29 - Trial = 6254/30000 | Total reward = 47.29
2022-01-26 14:16:54.790 | DEBUG    | __main__:trials:24 - Trial = 6255/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.792 | DEBUG    | __main__:trials:29 - Trial = 6255/30000 | Total reward = 55.21
2022-01-26 14:16:54.795 | DEBUG    | __main__:trials:24 - Trial = 6256/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.796 | DEBUG    | __main__:trials:29 - Trial = 6256/30000 | Total reward = 42.08
2022-01-26 14:16:54.800 | DEBUG    | __main__:trials:24 - Trial = 6257/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.801 | DEBUG    | __main__:trials:29 - Trial = 6257/30000 | Total reward = 49.82
2022-01-26 14:16:54.804 | DEBUG    | __main__:trials:24 - Trial = 6258/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.805 | DEBUG    | __main__:trials:29 - Trial = 6258/30000 | Total reward = 49.97
2022-01-26 14:16:54.808 | DEBUG    | __main__:trials:24 - Trial = 6259/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.809 | DEBUG    | __main__:trials:29 - Trial = 6259/30000 | Total reward = 55.74
2022-01-26 14:16:54.812 | DEBUG    | __main__:trials:24 - Trial = 6260/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.814 | DEBUG    | __main__:trials:29 - Trial = 6260/30000 | Total reward = 44.52
2022-01-26 14:16:54.818 | DEBUG    | __main__:trials:24 - Trial = 6261/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.819 | DEBUG    | __main__:trials:29 - Trial = 6261/30000 | Total reward = 48.09
2022-01-26 14:16:54.822 | DEBUG    | __main__:trials:24 - Trial = 6262/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.824 | DEBUG    | __main__:trials:29 - Trial = 6262/30000 | Total reward = 50.08
2022-01-26 14:16:54.827 | DEBUG    | __main__:trials:24 - Trial = 6263/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.829 | DEBUG    | __main__:trials:29 - Trial = 6263/30000 | Total reward = 47.51
2022-01-26 14:16:54.832 | DEBUG    | __main__:trials:24 - Trial = 6264/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.833 | DEBUG    | __main__:trials:29 - Trial = 6264/30000 | Total reward = 53.78
2022-01-26 14:16:54.837 | DEBUG    | __main__:trials:24 - Trial = 6265/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.838 | DEBUG    | __main__:trials:29 - Trial = 6265/30000 | Total reward = 50.43
2022-01-26 14:16:54.842 | DEBUG    | __main__:trials:24 - Trial = 6266/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.843 | DEBUG    | __main__:trials:29 - Trial = 6266/30000 | Total reward = 39.87
2022-01-26 14:16:54.847 | DEBUG    | __main__:trials:24 - Trial = 6267/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.849 | DEBUG    | __main__:trials:29 - Trial = 6267/30000 | Total reward = 31.96
2022-01-26 14:16:54.852 | DEBUG    | __main__:trials:24 - Trial = 6268/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.854 | DEBUG    | __main__:trials:29 - Trial = 6268/30000 | Total reward = 51.90
2022-01-26 14:16:54.858 | DEBUG    | __main__:trials:24 - Trial = 6269/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.859 | DEBUG    | __main__:trials:29 - Trial = 6269/30000 | Total reward = 56.95
2022-01-26 14:16:54.863 | DEBUG    | __main__:trials:24 - Trial = 6270/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.864 | DEBUG    | __main__:trials:29 - Trial = 6270/30000 | Total reward = 47.80
2022-01-26 14:16:54.867 | DEBUG    | __main__:trials:24 - Trial = 6271/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.869 | DEBUG    | __main__:trials:29 - Trial = 6271/30000 | Total reward = 57.39
2022-01-26 14:16:54.872 | DEBUG    | __main__:trials:24 - Trial = 6272/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.874 | DEBUG    | __main__:trials:29 - Trial = 6272/30000 | Total reward = 44.21
2022-01-26 14:16:54.877 | DEBUG    | __main__:trials:24 - Trial = 6273/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.878 | DEBUG    | __main__:trials:29 - Trial = 6273/30000 | Total reward = 48.62
2022-01-26 14:16:54.881 | DEBUG    | __main__:trials:24 - Trial = 6274/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.883 | DEBUG    | __main__:trials:29 - Trial = 6274/30000 | Total reward = 49.55
2022-01-26 14:16:54.886 | DEBUG    | __main__:trials:24 - Trial = 6275/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.888 | DEBUG    | __main__:trials:29 - Trial = 6275/30000 | Total reward = 55.22
2022-01-26 14:16:54.891 | DEBUG    | __main__:trials:24 - Trial = 6276/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.893 | DEBUG    | __main__:trials:29 - Trial = 6276/30000 | Total reward = 42.63
2022-01-26 14:16:54.896 | DEBUG    | __main__:trials:24 - Trial = 6277/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.898 | DEBUG    | __main__:trials:29 - Trial = 6277/30000 | Total reward = 41.30
2022-01-26 14:16:54.901 | DEBUG    | __main__:trials:24 - Trial = 6278/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.903 | DEBUG    | __main__:trials:29 - Trial = 6278/30000 | Total reward = 65.08
2022-01-26 14:16:54.906 | DEBUG    | __main__:trials:24 - Trial = 6279/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.907 | DEBUG    | __main__:trials:29 - Trial = 6279/30000 | Total reward = 57.57
2022-01-26 14:16:54.911 | DEBUG    | __main__:trials:24 - Trial = 6280/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.913 | DEBUG    | __main__:trials:29 - Trial = 6280/30000 | Total reward = 45.05
2022-01-26 14:16:54.916 | DEBUG    | __main__:trials:24 - Trial = 6281/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.918 | DEBUG    | __main__:trials:29 - Trial = 6281/30000 | Total reward = 44.38
2022-01-26 14:16:54.922 | DEBUG    | __main__:trials:24 - Trial = 6282/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.923 | DEBUG    | __main__:trials:29 - Trial = 6282/30000 | Total reward = 45.76
2022-01-26 14:16:54.927 | DEBUG    | __main__:trials:24 - Trial = 6283/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.928 | DEBUG    | __main__:trials:29 - Trial = 6283/30000 | Total reward = 39.45
2022-01-26 14:16:54.932 | DEBUG    | __main__:trials:24 - Trial = 6284/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.933 | DEBUG    | __main__:trials:29 - Trial = 6284/30000 | Total reward = 55.79
2022-01-26 14:16:54.937 | DEBUG    | __main__:trials:24 - Trial = 6285/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.938 | DEBUG    | __main__:trials:29 - Trial = 6285/30000 | Total reward = 56.62
2022-01-26 14:16:54.942 | DEBUG    | __main__:trials:24 - Trial = 6286/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.944 | DEBUG    | __main__:trials:29 - Trial = 6286/30000 | Total reward = 28.78
2022-01-26 14:16:54.947 | DEBUG    | __main__:trials:24 - Trial = 6287/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.949 | DEBUG    | __main__:trials:29 - Trial = 6287/30000 | Total reward = 44.68
2022-01-26 14:16:54.952 | DEBUG    | __main__:trials:24 - Trial = 6288/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.954 | DEBUG    | __main__:trials:29 - Trial = 6288/30000 | Total reward = 31.59
2022-01-26 14:16:54.958 | DEBUG    | __main__:trials:24 - Trial = 6289/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.959 | DEBUG    | __main__:trials:29 - Trial = 6289/30000 | Total reward = 49.89
2022-01-26 14:16:54.963 | DEBUG    | __main__:trials:24 - Trial = 6290/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.964 | DEBUG    | __main__:trials:29 - Trial = 6290/30000 | Total reward = 47.48
2022-01-26 14:16:54.968 | DEBUG    | __main__:trials:24 - Trial = 6291/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.969 | DEBUG    | __main__:trials:29 - Trial = 6291/30000 | Total reward = 44.57
2022-01-26 14:16:54.972 | DEBUG    | __main__:trials:24 - Trial = 6292/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.974 | DEBUG    | __main__:trials:29 - Trial = 6292/30000 | Total reward = 62.54
2022-01-26 14:16:54.978 | DEBUG    | __main__:trials:24 - Trial = 6293/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.979 | DEBUG    | __main__:trials:29 - Trial = 6293/30000 | Total reward = 55.78
2022-01-26 14:16:54.982 | DEBUG    | __main__:trials:24 - Trial = 6294/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.983 | DEBUG    | __main__:trials:29 - Trial = 6294/30000 | Total reward = 51.83
2022-01-26 14:16:54.986 | DEBUG    | __main__:trials:24 - Trial = 6295/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.987 | DEBUG    | __main__:trials:29 - Trial = 6295/30000 | Total reward = 49.20
2022-01-26 14:16:54.990 | DEBUG    | __main__:trials:24 - Trial = 6296/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.991 | DEBUG    | __main__:trials:29 - Trial = 6296/30000 | Total reward = 46.97
2022-01-26 14:16:54.994 | DEBUG    | __main__:trials:24 - Trial = 6297/30000 | Max number of steps (20) reached
2022-01-26 14:16:54.996 | DEBUG    | __main__:trials:29 - Trial = 6297/30000 | Total reward = 47.46
2022-01-26 14:16:54.999 | DEBUG    | __main__:trials:24 - Trial = 6298/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.000 | DEBUG    | __main__:trials:29 - Trial = 6298/30000 | Total reward = 42.30
2022-01-26 14:16:55.004 | DEBUG    | __main__:trials:24 - Trial = 6299/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.006 | DEBUG    | __main__:trials:29 - Trial = 6299/30000 | Total reward = 42.08
2022-01-26 14:16:55.009 | DEBUG    | __main__:trials:24 - Trial = 6300/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.011 | DEBUG    | __main__:trials:29 - Trial = 6300/30000 | Total reward = 49.34
2022-01-26 14:16:55.014 | DEBUG    | __main__:trials:24 - Trial = 6301/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.016 | DEBUG    | __main__:trials:29 - Trial = 6301/30000 | Total reward = 34.23
2022-01-26 14:16:55.020 | DEBUG    | __main__:trials:24 - Trial = 6302/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.021 | DEBUG    | __main__:trials:29 - Trial = 6302/30000 | Total reward = 40.91
2022-01-26 14:16:55.025 | DEBUG    | __main__:trials:24 - Trial = 6303/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.025 | DEBUG    | __main__:trials:29 - Trial = 6303/30000 | Total reward = 49.30
2022-01-26 14:16:55.029 | DEBUG    | __main__:trials:24 - Trial = 6304/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.031 | DEBUG    | __main__:trials:29 - Trial = 6304/30000 | Total reward = 50.29
2022-01-26 14:16:55.035 | DEBUG    | __main__:trials:24 - Trial = 6305/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.036 | DEBUG    | __main__:trials:29 - Trial = 6305/30000 | Total reward = 46.95
2022-01-26 14:16:55.040 | DEBUG    | __main__:trials:24 - Trial = 6306/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.041 | DEBUG    | __main__:trials:29 - Trial = 6306/30000 | Total reward = 46.70
2022-01-26 14:16:55.045 | DEBUG    | __main__:trials:24 - Trial = 6307/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.045 | DEBUG    | __main__:trials:29 - Trial = 6307/30000 | Total reward = 47.70
2022-01-26 14:16:55.049 | DEBUG    | __main__:trials:24 - Trial = 6308/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.050 | DEBUG    | __main__:trials:29 - Trial = 6308/30000 | Total reward = 52.54
2022-01-26 14:16:55.054 | DEBUG    | __main__:trials:24 - Trial = 6309/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.055 | DEBUG    | __main__:trials:29 - Trial = 6309/30000 | Total reward = 49.75
2022-01-26 14:16:55.059 | DEBUG    | __main__:trials:24 - Trial = 6310/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.060 | DEBUG    | __main__:trials:29 - Trial = 6310/30000 | Total reward = 51.59
2022-01-26 14:16:55.064 | DEBUG    | __main__:trials:24 - Trial = 6311/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.065 | DEBUG    | __main__:trials:29 - Trial = 6311/30000 | Total reward = 39.67
2022-01-26 14:16:55.069 | DEBUG    | __main__:trials:24 - Trial = 6312/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.070 | DEBUG    | __main__:trials:29 - Trial = 6312/30000 | Total reward = 43.68
2022-01-26 14:16:55.074 | DEBUG    | __main__:trials:24 - Trial = 6313/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.075 | DEBUG    | __main__:trials:29 - Trial = 6313/30000 | Total reward = 62.53
2022-01-26 14:16:55.079 | DEBUG    | __main__:trials:24 - Trial = 6314/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.080 | DEBUG    | __main__:trials:29 - Trial = 6314/30000 | Total reward = 48.60
2022-01-26 14:16:55.084 | DEBUG    | __main__:trials:24 - Trial = 6315/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.085 | DEBUG    | __main__:trials:29 - Trial = 6315/30000 | Total reward = 44.11
2022-01-26 14:16:55.089 | DEBUG    | __main__:trials:24 - Trial = 6316/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.090 | DEBUG    | __main__:trials:29 - Trial = 6316/30000 | Total reward = 46.82
2022-01-26 14:16:55.094 | DEBUG    | __main__:trials:24 - Trial = 6317/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.095 | DEBUG    | __main__:trials:29 - Trial = 6317/30000 | Total reward = 44.95
2022-01-26 14:16:55.098 | DEBUG    | __main__:trials:24 - Trial = 6318/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.100 | DEBUG    | __main__:trials:29 - Trial = 6318/30000 | Total reward = 54.66
2022-01-26 14:16:55.104 | DEBUG    | __main__:trials:24 - Trial = 6319/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.105 | DEBUG    | __main__:trials:29 - Trial = 6319/30000 | Total reward = 47.75
2022-01-26 14:16:55.108 | DEBUG    | __main__:trials:24 - Trial = 6320/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.110 | DEBUG    | __main__:trials:29 - Trial = 6320/30000 | Total reward = 43.28
2022-01-26 14:16:55.114 | DEBUG    | __main__:trials:24 - Trial = 6321/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.115 | DEBUG    | __main__:trials:29 - Trial = 6321/30000 | Total reward = 53.36
2022-01-26 14:16:55.119 | DEBUG    | __main__:trials:24 - Trial = 6322/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.121 | DEBUG    | __main__:trials:29 - Trial = 6322/30000 | Total reward = 44.76
2022-01-26 14:16:55.124 | DEBUG    | __main__:trials:24 - Trial = 6323/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.126 | DEBUG    | __main__:trials:29 - Trial = 6323/30000 | Total reward = 46.17
2022-01-26 14:16:55.129 | DEBUG    | __main__:trials:24 - Trial = 6324/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.131 | DEBUG    | __main__:trials:29 - Trial = 6324/30000 | Total reward = 56.06
2022-01-26 14:16:55.135 | DEBUG    | __main__:trials:24 - Trial = 6325/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.136 | DEBUG    | __main__:trials:29 - Trial = 6325/30000 | Total reward = 32.87
2022-01-26 14:16:55.139 | DEBUG    | __main__:trials:24 - Trial = 6326/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.141 | DEBUG    | __main__:trials:29 - Trial = 6326/30000 | Total reward = 52.28
2022-01-26 14:16:55.145 | DEBUG    | __main__:trials:24 - Trial = 6327/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.146 | DEBUG    | __main__:trials:29 - Trial = 6327/30000 | Total reward = 34.38
2022-01-26 14:16:55.150 | DEBUG    | __main__:trials:24 - Trial = 6328/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.151 | DEBUG    | __main__:trials:29 - Trial = 6328/30000 | Total reward = 51.32
2022-01-26 14:16:55.155 | DEBUG    | __main__:trials:24 - Trial = 6329/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.157 | DEBUG    | __main__:trials:29 - Trial = 6329/30000 | Total reward = 43.45
2022-01-26 14:16:55.161 | DEBUG    | __main__:trials:24 - Trial = 6330/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.161 | DEBUG    | __main__:trials:29 - Trial = 6330/30000 | Total reward = 55.32
2022-01-26 14:16:55.165 | DEBUG    | __main__:trials:24 - Trial = 6331/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.166 | DEBUG    | __main__:trials:29 - Trial = 6331/30000 | Total reward = 31.23
2022-01-26 14:16:55.170 | DEBUG    | __main__:trials:24 - Trial = 6332/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.170 | DEBUG    | __main__:trials:29 - Trial = 6332/30000 | Total reward = 57.27
2022-01-26 14:16:55.175 | DEBUG    | __main__:trials:24 - Trial = 6333/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.176 | DEBUG    | __main__:trials:29 - Trial = 6333/30000 | Total reward = 56.88
2022-01-26 14:16:55.179 | DEBUG    | __main__:trials:26 - Trial = 6334/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.181 | DEBUG    | __main__:trials:29 - Trial = 6334/30000 | Total reward = 27.73
2022-01-26 14:16:55.184 | DEBUG    | __main__:trials:24 - Trial = 6335/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.186 | DEBUG    | __main__:trials:29 - Trial = 6335/30000 | Total reward = 44.79
2022-01-26 14:16:55.190 | DEBUG    | __main__:trials:24 - Trial = 6336/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.190 | DEBUG    | __main__:trials:29 - Trial = 6336/30000 | Total reward = 51.33
2022-01-26 14:16:55.194 | DEBUG    | __main__:trials:24 - Trial = 6337/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.195 | DEBUG    | __main__:trials:29 - Trial = 6337/30000 | Total reward = 50.71
2022-01-26 14:16:55.198 | DEBUG    | __main__:trials:24 - Trial = 6338/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.200 | DEBUG    | __main__:trials:29 - Trial = 6338/30000 | Total reward = 38.09
2022-01-26 14:16:55.204 | DEBUG    | __main__:trials:24 - Trial = 6339/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.205 | DEBUG    | __main__:trials:29 - Trial = 6339/30000 | Total reward = 38.42
2022-01-26 14:16:55.209 | DEBUG    | __main__:trials:24 - Trial = 6340/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.210 | DEBUG    | __main__:trials:29 - Trial = 6340/30000 | Total reward = 45.84
2022-01-26 14:16:55.214 | DEBUG    | __main__:trials:24 - Trial = 6341/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.216 | DEBUG    | __main__:trials:29 - Trial = 6341/30000 | Total reward = 45.41
2022-01-26 14:16:55.219 | DEBUG    | __main__:trials:24 - Trial = 6342/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.221 | DEBUG    | __main__:trials:29 - Trial = 6342/30000 | Total reward = 45.61
2022-01-26 14:16:55.224 | DEBUG    | __main__:trials:24 - Trial = 6343/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.226 | DEBUG    | __main__:trials:29 - Trial = 6343/30000 | Total reward = 50.80
2022-01-26 14:16:55.230 | DEBUG    | __main__:trials:24 - Trial = 6344/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.231 | DEBUG    | __main__:trials:29 - Trial = 6344/30000 | Total reward = 50.52
2022-01-26 14:16:55.235 | DEBUG    | __main__:trials:24 - Trial = 6345/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.236 | DEBUG    | __main__:trials:29 - Trial = 6345/30000 | Total reward = 66.06
2022-01-26 14:16:55.240 | DEBUG    | __main__:trials:24 - Trial = 6346/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.241 | DEBUG    | __main__:trials:29 - Trial = 6346/30000 | Total reward = 31.33
2022-01-26 14:16:55.245 | DEBUG    | __main__:trials:24 - Trial = 6347/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.247 | DEBUG    | __main__:trials:29 - Trial = 6347/30000 | Total reward = 41.49
2022-01-26 14:16:55.250 | DEBUG    | __main__:trials:24 - Trial = 6348/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.252 | DEBUG    | __main__:trials:29 - Trial = 6348/30000 | Total reward = 45.69
2022-01-26 14:16:55.255 | DEBUG    | __main__:trials:24 - Trial = 6349/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.257 | DEBUG    | __main__:trials:29 - Trial = 6349/30000 | Total reward = 44.91
2022-01-26 14:16:55.260 | DEBUG    | __main__:trials:24 - Trial = 6350/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.262 | DEBUG    | __main__:trials:29 - Trial = 6350/30000 | Total reward = 45.54
2022-01-26 14:16:55.265 | DEBUG    | __main__:trials:24 - Trial = 6351/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.267 | DEBUG    | __main__:trials:29 - Trial = 6351/30000 | Total reward = 46.52
2022-01-26 14:16:55.270 | DEBUG    | __main__:trials:24 - Trial = 6352/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.272 | DEBUG    | __main__:trials:29 - Trial = 6352/30000 | Total reward = 50.14
2022-01-26 14:16:55.275 | DEBUG    | __main__:trials:24 - Trial = 6353/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.277 | DEBUG    | __main__:trials:29 - Trial = 6353/30000 | Total reward = 31.77
2022-01-26 14:16:55.280 | DEBUG    | __main__:trials:24 - Trial = 6354/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.282 | DEBUG    | __main__:trials:29 - Trial = 6354/30000 | Total reward = 43.51
2022-01-26 14:16:55.285 | DEBUG    | __main__:trials:24 - Trial = 6355/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.287 | DEBUG    | __main__:trials:29 - Trial = 6355/30000 | Total reward = 50.74
2022-01-26 14:16:55.290 | DEBUG    | __main__:trials:24 - Trial = 6356/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.292 | DEBUG    | __main__:trials:29 - Trial = 6356/30000 | Total reward = 43.05
2022-01-26 14:16:55.295 | DEBUG    | __main__:trials:24 - Trial = 6357/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.297 | DEBUG    | __main__:trials:29 - Trial = 6357/30000 | Total reward = 53.64
2022-01-26 14:16:55.300 | DEBUG    | __main__:trials:24 - Trial = 6358/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.302 | DEBUG    | __main__:trials:29 - Trial = 6358/30000 | Total reward = 47.90
2022-01-26 14:16:55.306 | DEBUG    | __main__:trials:24 - Trial = 6359/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.307 | DEBUG    | __main__:trials:29 - Trial = 6359/30000 | Total reward = 48.45
2022-01-26 14:16:55.311 | DEBUG    | __main__:trials:24 - Trial = 6360/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.311 | DEBUG    | __main__:trials:29 - Trial = 6360/30000 | Total reward = 44.35
2022-01-26 14:16:55.316 | DEBUG    | __main__:trials:24 - Trial = 6361/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.317 | DEBUG    | __main__:trials:29 - Trial = 6361/30000 | Total reward = 47.05
2022-01-26 14:16:55.321 | DEBUG    | __main__:trials:24 - Trial = 6362/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.322 | DEBUG    | __main__:trials:29 - Trial = 6362/30000 | Total reward = 42.70
2022-01-26 14:16:55.325 | DEBUG    | __main__:trials:24 - Trial = 6363/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.326 | DEBUG    | __main__:trials:29 - Trial = 6363/30000 | Total reward = 45.94
2022-01-26 14:16:55.329 | DEBUG    | __main__:trials:24 - Trial = 6364/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.330 | DEBUG    | __main__:trials:29 - Trial = 6364/30000 | Total reward = 44.86
2022-01-26 14:16:55.333 | DEBUG    | __main__:trials:24 - Trial = 6365/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.334 | DEBUG    | __main__:trials:29 - Trial = 6365/30000 | Total reward = 47.55
2022-01-26 14:16:55.338 | DEBUG    | __main__:trials:24 - Trial = 6366/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.340 | DEBUG    | __main__:trials:29 - Trial = 6366/30000 | Total reward = 37.96
2022-01-26 14:16:55.343 | DEBUG    | __main__:trials:24 - Trial = 6367/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.344 | DEBUG    | __main__:trials:29 - Trial = 6367/30000 | Total reward = 45.06
2022-01-26 14:16:55.348 | DEBUG    | __main__:trials:24 - Trial = 6368/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.350 | DEBUG    | __main__:trials:29 - Trial = 6368/30000 | Total reward = 50.31
2022-01-26 14:16:55.353 | DEBUG    | __main__:trials:24 - Trial = 6369/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.354 | DEBUG    | __main__:trials:29 - Trial = 6369/30000 | Total reward = 47.12
2022-01-26 14:16:55.357 | DEBUG    | __main__:trials:24 - Trial = 6370/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.358 | DEBUG    | __main__:trials:29 - Trial = 6370/30000 | Total reward = 46.48
2022-01-26 14:16:55.361 | DEBUG    | __main__:trials:24 - Trial = 6371/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.363 | DEBUG    | __main__:trials:29 - Trial = 6371/30000 | Total reward = 43.46
2022-01-26 14:16:55.366 | DEBUG    | __main__:trials:24 - Trial = 6372/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.368 | DEBUG    | __main__:trials:29 - Trial = 6372/30000 | Total reward = 59.11
2022-01-26 14:16:55.371 | DEBUG    | __main__:trials:24 - Trial = 6373/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.373 | DEBUG    | __main__:trials:29 - Trial = 6373/30000 | Total reward = 48.05
2022-01-26 14:16:55.376 | DEBUG    | __main__:trials:24 - Trial = 6374/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.378 | DEBUG    | __main__:trials:29 - Trial = 6374/30000 | Total reward = 62.51
2022-01-26 14:16:55.382 | DEBUG    | __main__:trials:24 - Trial = 6375/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.383 | DEBUG    | __main__:trials:29 - Trial = 6375/30000 | Total reward = 41.27
2022-01-26 14:16:55.386 | DEBUG    | __main__:trials:24 - Trial = 6376/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.388 | DEBUG    | __main__:trials:29 - Trial = 6376/30000 | Total reward = 49.64
2022-01-26 14:16:55.392 | DEBUG    | __main__:trials:24 - Trial = 6377/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.393 | DEBUG    | __main__:trials:29 - Trial = 6377/30000 | Total reward = 37.40
2022-01-26 14:16:55.397 | DEBUG    | __main__:trials:24 - Trial = 6378/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.398 | DEBUG    | __main__:trials:29 - Trial = 6378/30000 | Total reward = 48.83
2022-01-26 14:16:55.402 | DEBUG    | __main__:trials:24 - Trial = 6379/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.403 | DEBUG    | __main__:trials:29 - Trial = 6379/30000 | Total reward = 46.48
2022-01-26 14:16:55.407 | DEBUG    | __main__:trials:24 - Trial = 6380/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.409 | DEBUG    | __main__:trials:29 - Trial = 6380/30000 | Total reward = 64.56
2022-01-26 14:16:55.412 | DEBUG    | __main__:trials:24 - Trial = 6381/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.414 | DEBUG    | __main__:trials:29 - Trial = 6381/30000 | Total reward = 46.02
2022-01-26 14:16:55.418 | DEBUG    | __main__:trials:24 - Trial = 6382/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.418 | DEBUG    | __main__:trials:29 - Trial = 6382/30000 | Total reward = 44.79
2022-01-26 14:16:55.423 | DEBUG    | __main__:trials:24 - Trial = 6383/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.424 | DEBUG    | __main__:trials:29 - Trial = 6383/30000 | Total reward = 42.58
2022-01-26 14:16:55.428 | DEBUG    | __main__:trials:24 - Trial = 6384/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.429 | DEBUG    | __main__:trials:29 - Trial = 6384/30000 | Total reward = 48.31
2022-01-26 14:16:55.433 | DEBUG    | __main__:trials:24 - Trial = 6385/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.434 | DEBUG    | __main__:trials:29 - Trial = 6385/30000 | Total reward = 55.21
2022-01-26 14:16:55.438 | DEBUG    | __main__:trials:24 - Trial = 6386/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.439 | DEBUG    | __main__:trials:29 - Trial = 6386/30000 | Total reward = 44.46
2022-01-26 14:16:55.443 | DEBUG    | __main__:trials:24 - Trial = 6387/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.444 | DEBUG    | __main__:trials:29 - Trial = 6387/30000 | Total reward = 48.03
2022-01-26 14:16:55.448 | DEBUG    | __main__:trials:24 - Trial = 6388/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.448 | DEBUG    | __main__:trials:29 - Trial = 6388/30000 | Total reward = 32.34
2022-01-26 14:16:55.453 | DEBUG    | __main__:trials:24 - Trial = 6389/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.453 | DEBUG    | __main__:trials:29 - Trial = 6389/30000 | Total reward = 33.18
2022-01-26 14:16:55.457 | DEBUG    | __main__:trials:26 - Trial = 6390/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.459 | DEBUG    | __main__:trials:29 - Trial = 6390/30000 | Total reward = 21.38
2022-01-26 14:16:55.462 | DEBUG    | __main__:trials:26 - Trial = 6391/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.463 | DEBUG    | __main__:trials:29 - Trial = 6391/30000 | Total reward = 23.44
2022-01-26 14:16:55.466 | DEBUG    | __main__:trials:24 - Trial = 6392/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.468 | DEBUG    | __main__:trials:29 - Trial = 6392/30000 | Total reward = 33.85
2022-01-26 14:16:55.471 | DEBUG    | __main__:trials:24 - Trial = 6393/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.472 | DEBUG    | __main__:trials:29 - Trial = 6393/30000 | Total reward = 25.55
2022-01-26 14:16:55.475 | DEBUG    | __main__:trials:24 - Trial = 6394/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.475 | DEBUG    | __main__:trials:29 - Trial = 6394/30000 | Total reward = 42.38
2022-01-26 14:16:55.479 | DEBUG    | __main__:trials:24 - Trial = 6395/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.479 | DEBUG    | __main__:trials:29 - Trial = 6395/30000 | Total reward = 41.85
2022-01-26 14:16:55.483 | DEBUG    | __main__:trials:24 - Trial = 6396/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.484 | DEBUG    | __main__:trials:29 - Trial = 6396/30000 | Total reward = 32.98
2022-01-26 14:16:55.488 | DEBUG    | __main__:trials:24 - Trial = 6397/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.490 | DEBUG    | __main__:trials:29 - Trial = 6397/30000 | Total reward = 49.21
2022-01-26 14:16:55.493 | DEBUG    | __main__:trials:24 - Trial = 6398/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.494 | DEBUG    | __main__:trials:29 - Trial = 6398/30000 | Total reward = 45.99
2022-01-26 14:16:55.498 | DEBUG    | __main__:trials:24 - Trial = 6399/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.500 | DEBUG    | __main__:trials:29 - Trial = 6399/30000 | Total reward = 35.73
2022-01-26 14:16:55.504 | DEBUG    | __main__:trials:24 - Trial = 6400/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.505 | DEBUG    | __main__:trials:29 - Trial = 6400/30000 | Total reward = 28.67
2022-01-26 14:16:55.509 | DEBUG    | __main__:trials:24 - Trial = 6401/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.510 | DEBUG    | __main__:trials:29 - Trial = 6401/30000 | Total reward = 50.95
2022-01-26 14:16:55.514 | DEBUG    | __main__:trials:24 - Trial = 6402/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.514 | DEBUG    | __main__:trials:29 - Trial = 6402/30000 | Total reward = 39.80
2022-01-26 14:16:55.518 | DEBUG    | __main__:trials:26 - Trial = 6403/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.520 | DEBUG    | __main__:trials:29 - Trial = 6403/30000 | Total reward = 23.40
2022-01-26 14:16:55.523 | DEBUG    | __main__:trials:24 - Trial = 6404/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.524 | DEBUG    | __main__:trials:29 - Trial = 6404/30000 | Total reward = 58.16
2022-01-26 14:16:55.527 | DEBUG    | __main__:trials:24 - Trial = 6405/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.529 | DEBUG    | __main__:trials:29 - Trial = 6405/30000 | Total reward = 35.62
2022-01-26 14:16:55.532 | DEBUG    | __main__:trials:24 - Trial = 6406/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.533 | DEBUG    | __main__:trials:29 - Trial = 6406/30000 | Total reward = 34.19
2022-01-26 14:16:55.537 | DEBUG    | __main__:trials:24 - Trial = 6407/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.538 | DEBUG    | __main__:trials:29 - Trial = 6407/30000 | Total reward = 35.20
2022-01-26 14:16:55.542 | DEBUG    | __main__:trials:24 - Trial = 6408/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.543 | DEBUG    | __main__:trials:29 - Trial = 6408/30000 | Total reward = 43.89
2022-01-26 14:16:55.547 | DEBUG    | __main__:trials:24 - Trial = 6409/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.548 | DEBUG    | __main__:trials:29 - Trial = 6409/30000 | Total reward = 42.48
2022-01-26 14:16:55.552 | DEBUG    | __main__:trials:24 - Trial = 6410/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.553 | DEBUG    | __main__:trials:29 - Trial = 6410/30000 | Total reward = 56.93
2022-01-26 14:16:55.556 | DEBUG    | __main__:trials:24 - Trial = 6411/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.558 | DEBUG    | __main__:trials:29 - Trial = 6411/30000 | Total reward = 49.86
2022-01-26 14:16:55.562 | DEBUG    | __main__:trials:24 - Trial = 6412/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.563 | DEBUG    | __main__:trials:29 - Trial = 6412/30000 | Total reward = 42.88
2022-01-26 14:16:55.567 | DEBUG    | __main__:trials:24 - Trial = 6413/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.567 | DEBUG    | __main__:trials:29 - Trial = 6413/30000 | Total reward = 45.30
2022-01-26 14:16:55.571 | DEBUG    | __main__:trials:24 - Trial = 6414/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.573 | DEBUG    | __main__:trials:29 - Trial = 6414/30000 | Total reward = 41.74
2022-01-26 14:16:55.576 | DEBUG    | __main__:trials:24 - Trial = 6415/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.578 | DEBUG    | __main__:trials:29 - Trial = 6415/30000 | Total reward = 33.44
2022-01-26 14:16:55.581 | DEBUG    | __main__:trials:24 - Trial = 6416/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.583 | DEBUG    | __main__:trials:29 - Trial = 6416/30000 | Total reward = 36.97
2022-01-26 14:16:55.587 | DEBUG    | __main__:trials:24 - Trial = 6417/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.588 | DEBUG    | __main__:trials:29 - Trial = 6417/30000 | Total reward = 44.97
2022-01-26 14:16:55.592 | DEBUG    | __main__:trials:24 - Trial = 6418/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.592 | DEBUG    | __main__:trials:29 - Trial = 6418/30000 | Total reward = 41.50
2022-01-26 14:16:55.597 | DEBUG    | __main__:trials:24 - Trial = 6419/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.597 | DEBUG    | __main__:trials:29 - Trial = 6419/30000 | Total reward = 44.11
2022-01-26 14:16:55.601 | DEBUG    | __main__:trials:24 - Trial = 6420/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.602 | DEBUG    | __main__:trials:29 - Trial = 6420/30000 | Total reward = 36.29
2022-01-26 14:16:55.606 | DEBUG    | __main__:trials:24 - Trial = 6421/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.608 | DEBUG    | __main__:trials:29 - Trial = 6421/30000 | Total reward = 34.04
2022-01-26 14:16:55.611 | DEBUG    | __main__:trials:24 - Trial = 6422/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.613 | DEBUG    | __main__:trials:29 - Trial = 6422/30000 | Total reward = 45.06
2022-01-26 14:16:55.616 | DEBUG    | __main__:trials:24 - Trial = 6423/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.617 | DEBUG    | __main__:trials:29 - Trial = 6423/30000 | Total reward = 45.74
2022-01-26 14:16:55.621 | DEBUG    | __main__:trials:24 - Trial = 6424/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.622 | DEBUG    | __main__:trials:29 - Trial = 6424/30000 | Total reward = 30.15
2022-01-26 14:16:55.626 | DEBUG    | __main__:trials:24 - Trial = 6425/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.627 | DEBUG    | __main__:trials:29 - Trial = 6425/30000 | Total reward = 44.30
2022-01-26 14:16:55.631 | DEBUG    | __main__:trials:24 - Trial = 6426/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.633 | DEBUG    | __main__:trials:29 - Trial = 6426/30000 | Total reward = 49.11
2022-01-26 14:16:55.636 | DEBUG    | __main__:trials:24 - Trial = 6427/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.637 | DEBUG    | __main__:trials:29 - Trial = 6427/30000 | Total reward = 34.47
2022-01-26 14:16:55.640 | DEBUG    | __main__:trials:24 - Trial = 6428/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.642 | DEBUG    | __main__:trials:29 - Trial = 6428/30000 | Total reward = 35.09
2022-01-26 14:16:55.645 | DEBUG    | __main__:trials:24 - Trial = 6429/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.646 | DEBUG    | __main__:trials:29 - Trial = 6429/30000 | Total reward = 45.66
2022-01-26 14:16:55.651 | DEBUG    | __main__:trials:24 - Trial = 6430/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.651 | DEBUG    | __main__:trials:29 - Trial = 6430/30000 | Total reward = 32.28
2022-01-26 14:16:55.656 | DEBUG    | __main__:trials:24 - Trial = 6431/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.657 | DEBUG    | __main__:trials:29 - Trial = 6431/30000 | Total reward = 34.70
2022-01-26 14:16:55.660 | DEBUG    | __main__:trials:26 - Trial = 6432/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.661 | DEBUG    | __main__:trials:29 - Trial = 6432/30000 | Total reward = 13.94
2022-01-26 14:16:55.665 | DEBUG    | __main__:trials:24 - Trial = 6433/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.666 | DEBUG    | __main__:trials:29 - Trial = 6433/30000 | Total reward = 57.25
2022-01-26 14:16:55.670 | DEBUG    | __main__:trials:24 - Trial = 6434/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.671 | DEBUG    | __main__:trials:29 - Trial = 6434/30000 | Total reward = 57.07
2022-01-26 14:16:55.675 | DEBUG    | __main__:trials:24 - Trial = 6435/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.676 | DEBUG    | __main__:trials:29 - Trial = 6435/30000 | Total reward = 35.52
2022-01-26 14:16:55.680 | DEBUG    | __main__:trials:24 - Trial = 6436/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.681 | DEBUG    | __main__:trials:29 - Trial = 6436/30000 | Total reward = 51.62
2022-01-26 14:16:55.684 | DEBUG    | __main__:trials:24 - Trial = 6437/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.686 | DEBUG    | __main__:trials:29 - Trial = 6437/30000 | Total reward = 40.54
2022-01-26 14:16:55.690 | DEBUG    | __main__:trials:24 - Trial = 6438/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.690 | DEBUG    | __main__:trials:29 - Trial = 6438/30000 | Total reward = 36.50
2022-01-26 14:16:55.694 | DEBUG    | __main__:trials:24 - Trial = 6439/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.696 | DEBUG    | __main__:trials:29 - Trial = 6439/30000 | Total reward = 47.74
2022-01-26 14:16:55.699 | DEBUG    | __main__:trials:24 - Trial = 6440/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.700 | DEBUG    | __main__:trials:29 - Trial = 6440/30000 | Total reward = 43.90
2022-01-26 14:16:55.704 | DEBUG    | __main__:trials:24 - Trial = 6441/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.704 | DEBUG    | __main__:trials:29 - Trial = 6441/30000 | Total reward = 33.04
2022-01-26 14:16:55.707 | DEBUG    | __main__:trials:26 - Trial = 6442/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.707 | DEBUG    | __main__:trials:29 - Trial = 6442/30000 | Total reward = 18.03
2022-01-26 14:16:55.711 | DEBUG    | __main__:trials:24 - Trial = 6443/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.711 | DEBUG    | __main__:trials:29 - Trial = 6443/30000 | Total reward = 40.30
2022-01-26 14:16:55.715 | DEBUG    | __main__:trials:24 - Trial = 6444/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.717 | DEBUG    | __main__:trials:29 - Trial = 6444/30000 | Total reward = 41.76
2022-01-26 14:16:55.719 | DEBUG    | __main__:trials:24 - Trial = 6445/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.721 | DEBUG    | __main__:trials:29 - Trial = 6445/30000 | Total reward = 43.79
2022-01-26 14:16:55.724 | DEBUG    | __main__:trials:24 - Trial = 6446/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.726 | DEBUG    | __main__:trials:29 - Trial = 6446/30000 | Total reward = 30.92
2022-01-26 14:16:55.729 | DEBUG    | __main__:trials:24 - Trial = 6447/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.731 | DEBUG    | __main__:trials:29 - Trial = 6447/30000 | Total reward = 37.37
2022-01-26 14:16:55.734 | DEBUG    | __main__:trials:24 - Trial = 6448/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.736 | DEBUG    | __main__:trials:29 - Trial = 6448/30000 | Total reward = 29.46
2022-01-26 14:16:55.739 | DEBUG    | __main__:trials:24 - Trial = 6449/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.741 | DEBUG    | __main__:trials:29 - Trial = 6449/30000 | Total reward = 28.20
2022-01-26 14:16:55.744 | DEBUG    | __main__:trials:26 - Trial = 6450/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.745 | DEBUG    | __main__:trials:29 - Trial = 6450/30000 | Total reward = 16.25
2022-01-26 14:16:55.748 | DEBUG    | __main__:trials:24 - Trial = 6451/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.749 | DEBUG    | __main__:trials:29 - Trial = 6451/30000 | Total reward = 46.69
2022-01-26 14:16:55.752 | DEBUG    | __main__:trials:26 - Trial = 6452/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.753 | DEBUG    | __main__:trials:29 - Trial = 6452/30000 | Total reward = 16.73
2022-01-26 14:16:55.757 | DEBUG    | __main__:trials:24 - Trial = 6453/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.758 | DEBUG    | __main__:trials:29 - Trial = 6453/30000 | Total reward = 34.04
2022-01-26 14:16:55.761 | DEBUG    | __main__:trials:24 - Trial = 6454/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.763 | DEBUG    | __main__:trials:29 - Trial = 6454/30000 | Total reward = 46.52
2022-01-26 14:16:55.767 | DEBUG    | __main__:trials:24 - Trial = 6455/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.767 | DEBUG    | __main__:trials:29 - Trial = 6455/30000 | Total reward = 41.71
2022-01-26 14:16:55.772 | DEBUG    | __main__:trials:24 - Trial = 6456/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.773 | DEBUG    | __main__:trials:29 - Trial = 6456/30000 | Total reward = 45.50
2022-01-26 14:16:55.776 | DEBUG    | __main__:trials:24 - Trial = 6457/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.777 | DEBUG    | __main__:trials:29 - Trial = 6457/30000 | Total reward = 30.54
2022-01-26 14:16:55.780 | DEBUG    | __main__:trials:24 - Trial = 6458/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.781 | DEBUG    | __main__:trials:29 - Trial = 6458/30000 | Total reward = 41.47
2022-01-26 14:16:55.784 | DEBUG    | __main__:trials:24 - Trial = 6459/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.786 | DEBUG    | __main__:trials:29 - Trial = 6459/30000 | Total reward = 40.67
2022-01-26 14:16:55.789 | DEBUG    | __main__:trials:24 - Trial = 6460/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.790 | DEBUG    | __main__:trials:29 - Trial = 6460/30000 | Total reward = 37.14
2022-01-26 14:16:55.793 | DEBUG    | __main__:trials:24 - Trial = 6461/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.795 | DEBUG    | __main__:trials:29 - Trial = 6461/30000 | Total reward = 30.33
2022-01-26 14:16:55.798 | DEBUG    | __main__:trials:24 - Trial = 6462/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.800 | DEBUG    | __main__:trials:29 - Trial = 6462/30000 | Total reward = 28.73
2022-01-26 14:16:55.802 | DEBUG    | __main__:trials:24 - Trial = 6463/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.804 | DEBUG    | __main__:trials:29 - Trial = 6463/30000 | Total reward = 49.11
2022-01-26 14:16:55.807 | DEBUG    | __main__:trials:24 - Trial = 6464/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.809 | DEBUG    | __main__:trials:29 - Trial = 6464/30000 | Total reward = 56.50
2022-01-26 14:16:55.812 | DEBUG    | __main__:trials:24 - Trial = 6465/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.813 | DEBUG    | __main__:trials:29 - Trial = 6465/30000 | Total reward = 42.41
2022-01-26 14:16:55.816 | DEBUG    | __main__:trials:24 - Trial = 6466/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.818 | DEBUG    | __main__:trials:29 - Trial = 6466/30000 | Total reward = 43.63
2022-01-26 14:16:55.821 | DEBUG    | __main__:trials:24 - Trial = 6467/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.823 | DEBUG    | __main__:trials:29 - Trial = 6467/30000 | Total reward = 43.01
2022-01-26 14:16:55.826 | DEBUG    | __main__:trials:24 - Trial = 6468/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.827 | DEBUG    | __main__:trials:29 - Trial = 6468/30000 | Total reward = 54.07
2022-01-26 14:16:55.831 | DEBUG    | __main__:trials:24 - Trial = 6469/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.832 | DEBUG    | __main__:trials:29 - Trial = 6469/30000 | Total reward = 45.12
2022-01-26 14:16:55.835 | DEBUG    | __main__:trials:24 - Trial = 6470/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.837 | DEBUG    | __main__:trials:29 - Trial = 6470/30000 | Total reward = 39.32
2022-01-26 14:16:55.840 | DEBUG    | __main__:trials:24 - Trial = 6471/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.842 | DEBUG    | __main__:trials:29 - Trial = 6471/30000 | Total reward = 38.92
2022-01-26 14:16:55.846 | DEBUG    | __main__:trials:24 - Trial = 6472/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.847 | DEBUG    | __main__:trials:29 - Trial = 6472/30000 | Total reward = 33.77
2022-01-26 14:16:55.850 | DEBUG    | __main__:trials:24 - Trial = 6473/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.852 | DEBUG    | __main__:trials:29 - Trial = 6473/30000 | Total reward = 51.33
2022-01-26 14:16:55.855 | DEBUG    | __main__:trials:24 - Trial = 6474/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.857 | DEBUG    | __main__:trials:29 - Trial = 6474/30000 | Total reward = 36.40
2022-01-26 14:16:55.860 | DEBUG    | __main__:trials:24 - Trial = 6475/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.861 | DEBUG    | __main__:trials:29 - Trial = 6475/30000 | Total reward = 33.79
2022-01-26 14:16:55.864 | DEBUG    | __main__:trials:24 - Trial = 6476/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.866 | DEBUG    | __main__:trials:29 - Trial = 6476/30000 | Total reward = 27.14
2022-01-26 14:16:55.869 | DEBUG    | __main__:trials:24 - Trial = 6477/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.869 | DEBUG    | __main__:trials:29 - Trial = 6477/30000 | Total reward = 26.67
2022-01-26 14:16:55.873 | DEBUG    | __main__:trials:24 - Trial = 6478/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.875 | DEBUG    | __main__:trials:29 - Trial = 6478/30000 | Total reward = 34.26
2022-01-26 14:16:55.878 | DEBUG    | __main__:trials:24 - Trial = 6479/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.880 | DEBUG    | __main__:trials:29 - Trial = 6479/30000 | Total reward = 34.62
2022-01-26 14:16:55.883 | DEBUG    | __main__:trials:24 - Trial = 6480/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.885 | DEBUG    | __main__:trials:29 - Trial = 6480/30000 | Total reward = 49.42
2022-01-26 14:16:55.888 | DEBUG    | __main__:trials:24 - Trial = 6481/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.890 | DEBUG    | __main__:trials:29 - Trial = 6481/30000 | Total reward = 35.91
2022-01-26 14:16:55.893 | DEBUG    | __main__:trials:24 - Trial = 6482/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.894 | DEBUG    | __main__:trials:29 - Trial = 6482/30000 | Total reward = 48.16
2022-01-26 14:16:55.898 | DEBUG    | __main__:trials:24 - Trial = 6483/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.899 | DEBUG    | __main__:trials:29 - Trial = 6483/30000 | Total reward = 31.43
2022-01-26 14:16:55.903 | DEBUG    | __main__:trials:24 - Trial = 6484/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.904 | DEBUG    | __main__:trials:29 - Trial = 6484/30000 | Total reward = 43.27
2022-01-26 14:16:55.908 | DEBUG    | __main__:trials:24 - Trial = 6485/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.909 | DEBUG    | __main__:trials:29 - Trial = 6485/30000 | Total reward = 48.29
2022-01-26 14:16:55.913 | DEBUG    | __main__:trials:24 - Trial = 6486/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.914 | DEBUG    | __main__:trials:29 - Trial = 6486/30000 | Total reward = 51.78
2022-01-26 14:16:55.918 | DEBUG    | __main__:trials:24 - Trial = 6487/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.920 | DEBUG    | __main__:trials:29 - Trial = 6487/30000 | Total reward = 41.00
2022-01-26 14:16:55.923 | DEBUG    | __main__:trials:26 - Trial = 6488/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:55.925 | DEBUG    | __main__:trials:29 - Trial = 6488/30000 | Total reward = 28.84
2022-01-26 14:16:55.927 | DEBUG    | __main__:trials:24 - Trial = 6489/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.929 | DEBUG    | __main__:trials:29 - Trial = 6489/30000 | Total reward = 40.66
2022-01-26 14:16:55.933 | DEBUG    | __main__:trials:24 - Trial = 6490/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.934 | DEBUG    | __main__:trials:29 - Trial = 6490/30000 | Total reward = 60.55
2022-01-26 14:16:55.938 | DEBUG    | __main__:trials:24 - Trial = 6491/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.939 | DEBUG    | __main__:trials:29 - Trial = 6491/30000 | Total reward = 38.41
2022-01-26 14:16:55.942 | DEBUG    | __main__:trials:24 - Trial = 6492/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.944 | DEBUG    | __main__:trials:29 - Trial = 6492/30000 | Total reward = 42.00
2022-01-26 14:16:55.947 | DEBUG    | __main__:trials:24 - Trial = 6493/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.948 | DEBUG    | __main__:trials:29 - Trial = 6493/30000 | Total reward = 46.04
2022-01-26 14:16:55.952 | DEBUG    | __main__:trials:24 - Trial = 6494/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.953 | DEBUG    | __main__:trials:29 - Trial = 6494/30000 | Total reward = 42.30
2022-01-26 14:16:55.957 | DEBUG    | __main__:trials:24 - Trial = 6495/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.959 | DEBUG    | __main__:trials:29 - Trial = 6495/30000 | Total reward = 40.82
2022-01-26 14:16:55.962 | DEBUG    | __main__:trials:24 - Trial = 6496/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.963 | DEBUG    | __main__:trials:29 - Trial = 6496/30000 | Total reward = 51.16
2022-01-26 14:16:55.967 | DEBUG    | __main__:trials:24 - Trial = 6497/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.968 | DEBUG    | __main__:trials:29 - Trial = 6497/30000 | Total reward = 43.14
2022-01-26 14:16:55.972 | DEBUG    | __main__:trials:24 - Trial = 6498/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.973 | DEBUG    | __main__:trials:29 - Trial = 6498/30000 | Total reward = 43.14
2022-01-26 14:16:55.976 | DEBUG    | __main__:trials:24 - Trial = 6499/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.977 | DEBUG    | __main__:trials:29 - Trial = 6499/30000 | Total reward = 42.80
2022-01-26 14:16:55.981 | DEBUG    | __main__:trials:24 - Trial = 6500/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.982 | DEBUG    | __main__:trials:29 - Trial = 6500/30000 | Total reward = 33.25
2022-01-26 14:16:55.986 | DEBUG    | __main__:trials:24 - Trial = 6501/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.987 | DEBUG    | __main__:trials:29 - Trial = 6501/30000 | Total reward = 41.50
2022-01-26 14:16:55.991 | DEBUG    | __main__:trials:24 - Trial = 6502/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.992 | DEBUG    | __main__:trials:29 - Trial = 6502/30000 | Total reward = 42.18
2022-01-26 14:16:55.996 | DEBUG    | __main__:trials:24 - Trial = 6503/30000 | Max number of steps (20) reached
2022-01-26 14:16:55.997 | DEBUG    | __main__:trials:29 - Trial = 6503/30000 | Total reward = 46.59
2022-01-26 14:16:56.001 | DEBUG    | __main__:trials:24 - Trial = 6504/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.002 | DEBUG    | __main__:trials:29 - Trial = 6504/30000 | Total reward = 42.81
2022-01-26 14:16:56.006 | DEBUG    | __main__:trials:24 - Trial = 6505/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.007 | DEBUG    | __main__:trials:29 - Trial = 6505/30000 | Total reward = 39.63
2022-01-26 14:16:56.011 | DEBUG    | __main__:trials:24 - Trial = 6506/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.012 | DEBUG    | __main__:trials:29 - Trial = 6506/30000 | Total reward = 53.32
2022-01-26 14:16:56.016 | DEBUG    | __main__:trials:24 - Trial = 6507/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.018 | DEBUG    | __main__:trials:29 - Trial = 6507/30000 | Total reward = 36.09
2022-01-26 14:16:56.021 | DEBUG    | __main__:trials:24 - Trial = 6508/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.023 | DEBUG    | __main__:trials:29 - Trial = 6508/30000 | Total reward = 43.11
2022-01-26 14:16:56.026 | DEBUG    | __main__:trials:24 - Trial = 6509/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.027 | DEBUG    | __main__:trials:29 - Trial = 6509/30000 | Total reward = 50.49
2022-01-26 14:16:56.031 | DEBUG    | __main__:trials:24 - Trial = 6510/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.032 | DEBUG    | __main__:trials:29 - Trial = 6510/30000 | Total reward = 47.65
2022-01-26 14:16:56.036 | DEBUG    | __main__:trials:24 - Trial = 6511/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.037 | DEBUG    | __main__:trials:29 - Trial = 6511/30000 | Total reward = 43.77
2022-01-26 14:16:56.041 | DEBUG    | __main__:trials:24 - Trial = 6512/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.043 | DEBUG    | __main__:trials:29 - Trial = 6512/30000 | Total reward = 50.05
2022-01-26 14:16:56.046 | DEBUG    | __main__:trials:24 - Trial = 6513/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.048 | DEBUG    | __main__:trials:29 - Trial = 6513/30000 | Total reward = 42.96
2022-01-26 14:16:56.051 | DEBUG    | __main__:trials:24 - Trial = 6514/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.052 | DEBUG    | __main__:trials:29 - Trial = 6514/30000 | Total reward = 42.37
2022-01-26 14:16:56.055 | DEBUG    | __main__:trials:24 - Trial = 6515/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.057 | DEBUG    | __main__:trials:29 - Trial = 6515/30000 | Total reward = 46.17
2022-01-26 14:16:56.060 | DEBUG    | __main__:trials:24 - Trial = 6516/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.061 | DEBUG    | __main__:trials:29 - Trial = 6516/30000 | Total reward = 40.49
2022-01-26 14:16:56.064 | DEBUG    | __main__:trials:24 - Trial = 6517/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.065 | DEBUG    | __main__:trials:29 - Trial = 6517/30000 | Total reward = 55.28
2022-01-26 14:16:56.069 | DEBUG    | __main__:trials:24 - Trial = 6518/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.070 | DEBUG    | __main__:trials:29 - Trial = 6518/30000 | Total reward = 42.62
2022-01-26 14:16:56.074 | DEBUG    | __main__:trials:24 - Trial = 6519/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.074 | DEBUG    | __main__:trials:29 - Trial = 6519/30000 | Total reward = 41.82
2022-01-26 14:16:56.079 | DEBUG    | __main__:trials:24 - Trial = 6520/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.080 | DEBUG    | __main__:trials:29 - Trial = 6520/30000 | Total reward = 47.25
2022-01-26 14:16:56.084 | DEBUG    | __main__:trials:24 - Trial = 6521/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.085 | DEBUG    | __main__:trials:29 - Trial = 6521/30000 | Total reward = 34.38
2022-01-26 14:16:56.089 | DEBUG    | __main__:trials:24 - Trial = 6522/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.090 | DEBUG    | __main__:trials:29 - Trial = 6522/30000 | Total reward = 56.26
2022-01-26 14:16:56.093 | DEBUG    | __main__:trials:24 - Trial = 6523/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.095 | DEBUG    | __main__:trials:29 - Trial = 6523/30000 | Total reward = 50.63
2022-01-26 14:16:56.098 | DEBUG    | __main__:trials:24 - Trial = 6524/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.100 | DEBUG    | __main__:trials:29 - Trial = 6524/30000 | Total reward = 39.54
2022-01-26 14:16:56.103 | DEBUG    | __main__:trials:24 - Trial = 6525/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.105 | DEBUG    | __main__:trials:29 - Trial = 6525/30000 | Total reward = 41.29
2022-01-26 14:16:56.108 | DEBUG    | __main__:trials:24 - Trial = 6526/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.110 | DEBUG    | __main__:trials:29 - Trial = 6526/30000 | Total reward = 35.60
2022-01-26 14:16:56.113 | DEBUG    | __main__:trials:24 - Trial = 6527/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.115 | DEBUG    | __main__:trials:29 - Trial = 6527/30000 | Total reward = 36.29
2022-01-26 14:16:56.118 | DEBUG    | __main__:trials:24 - Trial = 6528/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.119 | DEBUG    | __main__:trials:29 - Trial = 6528/30000 | Total reward = 27.69
2022-01-26 14:16:56.123 | DEBUG    | __main__:trials:24 - Trial = 6529/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.124 | DEBUG    | __main__:trials:29 - Trial = 6529/30000 | Total reward = 42.96
2022-01-26 14:16:56.128 | DEBUG    | __main__:trials:24 - Trial = 6530/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.129 | DEBUG    | __main__:trials:29 - Trial = 6530/30000 | Total reward = 43.31
2022-01-26 14:16:56.132 | DEBUG    | __main__:trials:24 - Trial = 6531/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.134 | DEBUG    | __main__:trials:29 - Trial = 6531/30000 | Total reward = 45.18
2022-01-26 14:16:56.137 | DEBUG    | __main__:trials:24 - Trial = 6532/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.139 | DEBUG    | __main__:trials:29 - Trial = 6532/30000 | Total reward = 40.99
2022-01-26 14:16:56.142 | DEBUG    | __main__:trials:24 - Trial = 6533/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.143 | DEBUG    | __main__:trials:29 - Trial = 6533/30000 | Total reward = 43.33
2022-01-26 14:16:56.146 | DEBUG    | __main__:trials:24 - Trial = 6534/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.148 | DEBUG    | __main__:trials:29 - Trial = 6534/30000 | Total reward = 42.45
2022-01-26 14:16:56.151 | DEBUG    | __main__:trials:24 - Trial = 6535/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.152 | DEBUG    | __main__:trials:29 - Trial = 6535/30000 | Total reward = 44.33
2022-01-26 14:16:56.156 | DEBUG    | __main__:trials:24 - Trial = 6536/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.157 | DEBUG    | __main__:trials:29 - Trial = 6536/30000 | Total reward = 41.61
2022-01-26 14:16:56.161 | DEBUG    | __main__:trials:24 - Trial = 6537/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.162 | DEBUG    | __main__:trials:29 - Trial = 6537/30000 | Total reward = 42.51
2022-01-26 14:16:56.166 | DEBUG    | __main__:trials:24 - Trial = 6538/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.166 | DEBUG    | __main__:trials:29 - Trial = 6538/30000 | Total reward = 30.31
2022-01-26 14:16:56.170 | DEBUG    | __main__:trials:24 - Trial = 6539/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.172 | DEBUG    | __main__:trials:29 - Trial = 6539/30000 | Total reward = 43.96
2022-01-26 14:16:56.174 | DEBUG    | __main__:trials:24 - Trial = 6540/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.175 | DEBUG    | __main__:trials:29 - Trial = 6540/30000 | Total reward = 40.04
2022-01-26 14:16:56.178 | DEBUG    | __main__:trials:24 - Trial = 6541/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.180 | DEBUG    | __main__:trials:29 - Trial = 6541/30000 | Total reward = 38.24
2022-01-26 14:16:56.183 | DEBUG    | __main__:trials:24 - Trial = 6542/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.184 | DEBUG    | __main__:trials:29 - Trial = 6542/30000 | Total reward = 40.97
2022-01-26 14:16:56.187 | DEBUG    | __main__:trials:24 - Trial = 6543/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.188 | DEBUG    | __main__:trials:29 - Trial = 6543/30000 | Total reward = 43.27
2022-01-26 14:16:56.191 | DEBUG    | __main__:trials:24 - Trial = 6544/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.193 | DEBUG    | __main__:trials:29 - Trial = 6544/30000 | Total reward = 39.26
2022-01-26 14:16:56.196 | DEBUG    | __main__:trials:24 - Trial = 6545/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.197 | DEBUG    | __main__:trials:29 - Trial = 6545/30000 | Total reward = 54.66
2022-01-26 14:16:56.200 | DEBUG    | __main__:trials:24 - Trial = 6546/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.202 | DEBUG    | __main__:trials:29 - Trial = 6546/30000 | Total reward = 36.50
2022-01-26 14:16:56.205 | DEBUG    | __main__:trials:24 - Trial = 6547/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.206 | DEBUG    | __main__:trials:29 - Trial = 6547/30000 | Total reward = 44.33
2022-01-26 14:16:56.210 | DEBUG    | __main__:trials:24 - Trial = 6548/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.211 | DEBUG    | __main__:trials:29 - Trial = 6548/30000 | Total reward = 35.67
2022-01-26 14:16:56.213 | DEBUG    | __main__:trials:26 - Trial = 6549/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.214 | DEBUG    | __main__:trials:29 - Trial = 6549/30000 | Total reward = 22.67
2022-01-26 14:16:56.217 | DEBUG    | __main__:trials:24 - Trial = 6550/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.219 | DEBUG    | __main__:trials:29 - Trial = 6550/30000 | Total reward = 41.85
2022-01-26 14:16:56.222 | DEBUG    | __main__:trials:24 - Trial = 6551/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.224 | DEBUG    | __main__:trials:29 - Trial = 6551/30000 | Total reward = 28.27
2022-01-26 14:16:56.227 | DEBUG    | __main__:trials:24 - Trial = 6552/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.228 | DEBUG    | __main__:trials:29 - Trial = 6552/30000 | Total reward = 46.52
2022-01-26 14:16:56.231 | DEBUG    | __main__:trials:26 - Trial = 6553/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.232 | DEBUG    | __main__:trials:29 - Trial = 6553/30000 | Total reward = 17.18
2022-01-26 14:16:56.235 | DEBUG    | __main__:trials:24 - Trial = 6554/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.236 | DEBUG    | __main__:trials:29 - Trial = 6554/30000 | Total reward = 40.66
2022-01-26 14:16:56.240 | DEBUG    | __main__:trials:24 - Trial = 6555/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.241 | DEBUG    | __main__:trials:29 - Trial = 6555/30000 | Total reward = 64.45
2022-01-26 14:16:56.244 | DEBUG    | __main__:trials:24 - Trial = 6556/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.246 | DEBUG    | __main__:trials:29 - Trial = 6556/30000 | Total reward = 48.37
2022-01-26 14:16:56.249 | DEBUG    | __main__:trials:24 - Trial = 6557/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.251 | DEBUG    | __main__:trials:29 - Trial = 6557/30000 | Total reward = 32.22
2022-01-26 14:16:56.254 | DEBUG    | __main__:trials:24 - Trial = 6558/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.255 | DEBUG    | __main__:trials:29 - Trial = 6558/30000 | Total reward = 40.00
2022-01-26 14:16:56.259 | DEBUG    | __main__:trials:24 - Trial = 6559/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.260 | DEBUG    | __main__:trials:29 - Trial = 6559/30000 | Total reward = 41.23
2022-01-26 14:16:56.264 | DEBUG    | __main__:trials:24 - Trial = 6560/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.265 | DEBUG    | __main__:trials:29 - Trial = 6560/30000 | Total reward = 43.67
2022-01-26 14:16:56.269 | DEBUG    | __main__:trials:24 - Trial = 6561/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.270 | DEBUG    | __main__:trials:29 - Trial = 6561/30000 | Total reward = 33.38
2022-01-26 14:16:56.274 | DEBUG    | __main__:trials:24 - Trial = 6562/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.276 | DEBUG    | __main__:trials:29 - Trial = 6562/30000 | Total reward = 42.79
2022-01-26 14:16:56.279 | DEBUG    | __main__:trials:24 - Trial = 6563/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.280 | DEBUG    | __main__:trials:29 - Trial = 6563/30000 | Total reward = 45.58
2022-01-26 14:16:56.283 | DEBUG    | __main__:trials:24 - Trial = 6564/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.285 | DEBUG    | __main__:trials:29 - Trial = 6564/30000 | Total reward = 43.66
2022-01-26 14:16:56.288 | DEBUG    | __main__:trials:24 - Trial = 6565/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.290 | DEBUG    | __main__:trials:29 - Trial = 6565/30000 | Total reward = 41.45
2022-01-26 14:16:56.293 | DEBUG    | __main__:trials:24 - Trial = 6566/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.293 | DEBUG    | __main__:trials:29 - Trial = 6566/30000 | Total reward = 43.73
2022-01-26 14:16:56.298 | DEBUG    | __main__:trials:24 - Trial = 6567/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.298 | DEBUG    | __main__:trials:29 - Trial = 6567/30000 | Total reward = 43.84
2022-01-26 14:16:56.302 | DEBUG    | __main__:trials:24 - Trial = 6568/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.304 | DEBUG    | __main__:trials:29 - Trial = 6568/30000 | Total reward = 49.25
2022-01-26 14:16:56.307 | DEBUG    | __main__:trials:24 - Trial = 6569/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.309 | DEBUG    | __main__:trials:29 - Trial = 6569/30000 | Total reward = 48.82
2022-01-26 14:16:56.311 | DEBUG    | __main__:trials:24 - Trial = 6570/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.313 | DEBUG    | __main__:trials:29 - Trial = 6570/30000 | Total reward = 43.59
2022-01-26 14:16:56.316 | DEBUG    | __main__:trials:24 - Trial = 6571/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.318 | DEBUG    | __main__:trials:29 - Trial = 6571/30000 | Total reward = 36.92
2022-01-26 14:16:56.321 | DEBUG    | __main__:trials:24 - Trial = 6572/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.322 | DEBUG    | __main__:trials:29 - Trial = 6572/30000 | Total reward = 44.43
2022-01-26 14:16:56.325 | DEBUG    | __main__:trials:24 - Trial = 6573/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.326 | DEBUG    | __main__:trials:29 - Trial = 6573/30000 | Total reward = 42.52
2022-01-26 14:16:56.330 | DEBUG    | __main__:trials:24 - Trial = 6574/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.331 | DEBUG    | __main__:trials:29 - Trial = 6574/30000 | Total reward = 43.36
2022-01-26 14:16:56.335 | DEBUG    | __main__:trials:24 - Trial = 6575/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.336 | DEBUG    | __main__:trials:29 - Trial = 6575/30000 | Total reward = 55.48
2022-01-26 14:16:56.340 | DEBUG    | __main__:trials:24 - Trial = 6576/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.341 | DEBUG    | __main__:trials:29 - Trial = 6576/30000 | Total reward = 39.33
2022-01-26 14:16:56.344 | DEBUG    | __main__:trials:24 - Trial = 6577/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.346 | DEBUG    | __main__:trials:29 - Trial = 6577/30000 | Total reward = 50.48
2022-01-26 14:16:56.349 | DEBUG    | __main__:trials:24 - Trial = 6578/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.351 | DEBUG    | __main__:trials:29 - Trial = 6578/30000 | Total reward = 63.37
2022-01-26 14:16:56.353 | DEBUG    | __main__:trials:24 - Trial = 6579/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.355 | DEBUG    | __main__:trials:29 - Trial = 6579/30000 | Total reward = 46.63
2022-01-26 14:16:56.358 | DEBUG    | __main__:trials:24 - Trial = 6580/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.360 | DEBUG    | __main__:trials:29 - Trial = 6580/30000 | Total reward = 43.62
2022-01-26 14:16:56.364 | DEBUG    | __main__:trials:24 - Trial = 6581/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.364 | DEBUG    | __main__:trials:29 - Trial = 6581/30000 | Total reward = 40.33
2022-01-26 14:16:56.368 | DEBUG    | __main__:trials:24 - Trial = 6582/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.370 | DEBUG    | __main__:trials:29 - Trial = 6582/30000 | Total reward = 23.56
2022-01-26 14:16:56.373 | DEBUG    | __main__:trials:24 - Trial = 6583/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.375 | DEBUG    | __main__:trials:29 - Trial = 6583/30000 | Total reward = 42.42
2022-01-26 14:16:56.378 | DEBUG    | __main__:trials:24 - Trial = 6584/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.379 | DEBUG    | __main__:trials:29 - Trial = 6584/30000 | Total reward = 38.31
2022-01-26 14:16:56.383 | DEBUG    | __main__:trials:24 - Trial = 6585/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.384 | DEBUG    | __main__:trials:29 - Trial = 6585/30000 | Total reward = 42.06
2022-01-26 14:16:56.388 | DEBUG    | __main__:trials:24 - Trial = 6586/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.389 | DEBUG    | __main__:trials:29 - Trial = 6586/30000 | Total reward = 42.32
2022-01-26 14:16:56.393 | DEBUG    | __main__:trials:24 - Trial = 6587/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.394 | DEBUG    | __main__:trials:29 - Trial = 6587/30000 | Total reward = 34.44
2022-01-26 14:16:56.398 | DEBUG    | __main__:trials:24 - Trial = 6588/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.399 | DEBUG    | __main__:trials:29 - Trial = 6588/30000 | Total reward = 43.84
2022-01-26 14:16:56.403 | DEBUG    | __main__:trials:24 - Trial = 6589/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.404 | DEBUG    | __main__:trials:29 - Trial = 6589/30000 | Total reward = 45.58
2022-01-26 14:16:56.407 | DEBUG    | __main__:trials:24 - Trial = 6590/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.408 | DEBUG    | __main__:trials:29 - Trial = 6590/30000 | Total reward = 45.67
2022-01-26 14:16:56.411 | DEBUG    | __main__:trials:24 - Trial = 6591/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.412 | DEBUG    | __main__:trials:29 - Trial = 6591/30000 | Total reward = 49.87
2022-01-26 14:16:56.415 | DEBUG    | __main__:trials:24 - Trial = 6592/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.417 | DEBUG    | __main__:trials:29 - Trial = 6592/30000 | Total reward = 39.75
2022-01-26 14:16:56.421 | DEBUG    | __main__:trials:24 - Trial = 6593/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.422 | DEBUG    | __main__:trials:29 - Trial = 6593/30000 | Total reward = 42.25
2022-01-26 14:16:56.425 | DEBUG    | __main__:trials:24 - Trial = 6594/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.426 | DEBUG    | __main__:trials:29 - Trial = 6594/30000 | Total reward = 64.29
2022-01-26 14:16:56.431 | DEBUG    | __main__:trials:24 - Trial = 6595/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.432 | DEBUG    | __main__:trials:29 - Trial = 6595/30000 | Total reward = 44.00
2022-01-26 14:16:56.436 | DEBUG    | __main__:trials:24 - Trial = 6596/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.436 | DEBUG    | __main__:trials:29 - Trial = 6596/30000 | Total reward = 39.77
2022-01-26 14:16:56.440 | DEBUG    | __main__:trials:24 - Trial = 6597/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.441 | DEBUG    | __main__:trials:29 - Trial = 6597/30000 | Total reward = 39.80
2022-01-26 14:16:56.444 | DEBUG    | __main__:trials:24 - Trial = 6598/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.446 | DEBUG    | __main__:trials:29 - Trial = 6598/30000 | Total reward = 40.85
2022-01-26 14:16:56.449 | DEBUG    | __main__:trials:24 - Trial = 6599/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.450 | DEBUG    | __main__:trials:29 - Trial = 6599/30000 | Total reward = 55.23
2022-01-26 14:16:56.454 | DEBUG    | __main__:trials:24 - Trial = 6600/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.455 | DEBUG    | __main__:trials:29 - Trial = 6600/30000 | Total reward = 49.87
2022-01-26 14:16:56.459 | DEBUG    | __main__:trials:24 - Trial = 6601/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.460 | DEBUG    | __main__:trials:29 - Trial = 6601/30000 | Total reward = 58.48
2022-01-26 14:16:56.464 | DEBUG    | __main__:trials:24 - Trial = 6602/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.465 | DEBUG    | __main__:trials:29 - Trial = 6602/30000 | Total reward = 42.78
2022-01-26 14:16:56.469 | DEBUG    | __main__:trials:24 - Trial = 6603/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.470 | DEBUG    | __main__:trials:29 - Trial = 6603/30000 | Total reward = 39.27
2022-01-26 14:16:56.474 | DEBUG    | __main__:trials:24 - Trial = 6604/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.475 | DEBUG    | __main__:trials:29 - Trial = 6604/30000 | Total reward = 41.37
2022-01-26 14:16:56.478 | DEBUG    | __main__:trials:24 - Trial = 6605/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.480 | DEBUG    | __main__:trials:29 - Trial = 6605/30000 | Total reward = 37.29
2022-01-26 14:16:56.484 | DEBUG    | __main__:trials:24 - Trial = 6606/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.484 | DEBUG    | __main__:trials:29 - Trial = 6606/30000 | Total reward = 43.85
2022-01-26 14:16:56.488 | DEBUG    | __main__:trials:24 - Trial = 6607/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.490 | DEBUG    | __main__:trials:29 - Trial = 6607/30000 | Total reward = 41.61
2022-01-26 14:16:56.493 | DEBUG    | __main__:trials:24 - Trial = 6608/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.494 | DEBUG    | __main__:trials:29 - Trial = 6608/30000 | Total reward = 57.22
2022-01-26 14:16:56.498 | DEBUG    | __main__:trials:24 - Trial = 6609/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.499 | DEBUG    | __main__:trials:29 - Trial = 6609/30000 | Total reward = 40.86
2022-01-26 14:16:56.502 | DEBUG    | __main__:trials:24 - Trial = 6610/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.504 | DEBUG    | __main__:trials:29 - Trial = 6610/30000 | Total reward = 37.04
2022-01-26 14:16:56.507 | DEBUG    | __main__:trials:24 - Trial = 6611/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.508 | DEBUG    | __main__:trials:29 - Trial = 6611/30000 | Total reward = 49.28
2022-01-26 14:16:56.512 | DEBUG    | __main__:trials:24 - Trial = 6612/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.514 | DEBUG    | __main__:trials:29 - Trial = 6612/30000 | Total reward = 49.18
2022-01-26 14:16:56.517 | DEBUG    | __main__:trials:24 - Trial = 6613/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.518 | DEBUG    | __main__:trials:29 - Trial = 6613/30000 | Total reward = 45.03
2022-01-26 14:16:56.522 | DEBUG    | __main__:trials:24 - Trial = 6614/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.522 | DEBUG    | __main__:trials:29 - Trial = 6614/30000 | Total reward = 56.75
2022-01-26 14:16:56.526 | DEBUG    | __main__:trials:24 - Trial = 6615/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.528 | DEBUG    | __main__:trials:29 - Trial = 6615/30000 | Total reward = 58.60
2022-01-26 14:16:56.531 | DEBUG    | __main__:trials:24 - Trial = 6616/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.533 | DEBUG    | __main__:trials:29 - Trial = 6616/30000 | Total reward = 45.52
2022-01-26 14:16:56.536 | DEBUG    | __main__:trials:24 - Trial = 6617/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.537 | DEBUG    | __main__:trials:29 - Trial = 6617/30000 | Total reward = 43.71
2022-01-26 14:16:56.541 | DEBUG    | __main__:trials:24 - Trial = 6618/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.543 | DEBUG    | __main__:trials:29 - Trial = 6618/30000 | Total reward = 40.30
2022-01-26 14:16:56.546 | DEBUG    | __main__:trials:24 - Trial = 6619/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.548 | DEBUG    | __main__:trials:29 - Trial = 6619/30000 | Total reward = 34.51
2022-01-26 14:16:56.552 | DEBUG    | __main__:trials:24 - Trial = 6620/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.553 | DEBUG    | __main__:trials:29 - Trial = 6620/30000 | Total reward = 43.84
2022-01-26 14:16:56.557 | DEBUG    | __main__:trials:24 - Trial = 6621/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.559 | DEBUG    | __main__:trials:29 - Trial = 6621/30000 | Total reward = 54.40
2022-01-26 14:16:56.561 | DEBUG    | __main__:trials:24 - Trial = 6622/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.563 | DEBUG    | __main__:trials:29 - Trial = 6622/30000 | Total reward = 34.97
2022-01-26 14:16:56.567 | DEBUG    | __main__:trials:24 - Trial = 6623/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.568 | DEBUG    | __main__:trials:29 - Trial = 6623/30000 | Total reward = 42.78
2022-01-26 14:16:56.571 | DEBUG    | __main__:trials:24 - Trial = 6624/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.571 | DEBUG    | __main__:trials:29 - Trial = 6624/30000 | Total reward = 52.47
2022-01-26 14:16:56.575 | DEBUG    | __main__:trials:24 - Trial = 6625/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.575 | DEBUG    | __main__:trials:29 - Trial = 6625/30000 | Total reward = 43.84
2022-01-26 14:16:56.579 | DEBUG    | __main__:trials:24 - Trial = 6626/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.579 | DEBUG    | __main__:trials:29 - Trial = 6626/30000 | Total reward = 38.98
2022-01-26 14:16:56.583 | DEBUG    | __main__:trials:24 - Trial = 6627/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.583 | DEBUG    | __main__:trials:29 - Trial = 6627/30000 | Total reward = 41.61
2022-01-26 14:16:56.587 | DEBUG    | __main__:trials:24 - Trial = 6628/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.589 | DEBUG    | __main__:trials:29 - Trial = 6628/30000 | Total reward = 46.81
2022-01-26 14:16:56.591 | DEBUG    | __main__:trials:24 - Trial = 6629/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.593 | DEBUG    | __main__:trials:29 - Trial = 6629/30000 | Total reward = 55.56
2022-01-26 14:16:56.596 | DEBUG    | __main__:trials:24 - Trial = 6630/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.598 | DEBUG    | __main__:trials:29 - Trial = 6630/30000 | Total reward = 39.75
2022-01-26 14:16:56.601 | DEBUG    | __main__:trials:24 - Trial = 6631/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.602 | DEBUG    | __main__:trials:29 - Trial = 6631/30000 | Total reward = 43.35
2022-01-26 14:16:56.605 | DEBUG    | __main__:trials:24 - Trial = 6632/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.606 | DEBUG    | __main__:trials:29 - Trial = 6632/30000 | Total reward = 32.26
2022-01-26 14:16:56.609 | DEBUG    | __main__:trials:24 - Trial = 6633/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.611 | DEBUG    | __main__:trials:29 - Trial = 6633/30000 | Total reward = 47.08
2022-01-26 14:16:56.613 | DEBUG    | __main__:trials:24 - Trial = 6634/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.614 | DEBUG    | __main__:trials:29 - Trial = 6634/30000 | Total reward = 43.84
2022-01-26 14:16:56.618 | DEBUG    | __main__:trials:24 - Trial = 6635/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.618 | DEBUG    | __main__:trials:29 - Trial = 6635/30000 | Total reward = 39.64
2022-01-26 14:16:56.621 | DEBUG    | __main__:trials:26 - Trial = 6636/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.622 | DEBUG    | __main__:trials:29 - Trial = 6636/30000 | Total reward = 25.58
2022-01-26 14:16:56.625 | DEBUG    | __main__:trials:24 - Trial = 6637/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.626 | DEBUG    | __main__:trials:29 - Trial = 6637/30000 | Total reward = 42.84
2022-01-26 14:16:56.629 | DEBUG    | __main__:trials:24 - Trial = 6638/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.630 | DEBUG    | __main__:trials:29 - Trial = 6638/30000 | Total reward = 36.28
2022-01-26 14:16:56.633 | DEBUG    | __main__:trials:24 - Trial = 6639/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.634 | DEBUG    | __main__:trials:29 - Trial = 6639/30000 | Total reward = 44.86
2022-01-26 14:16:56.637 | DEBUG    | __main__:trials:24 - Trial = 6640/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.638 | DEBUG    | __main__:trials:29 - Trial = 6640/30000 | Total reward = 46.44
2022-01-26 14:16:56.642 | DEBUG    | __main__:trials:24 - Trial = 6641/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.643 | DEBUG    | __main__:trials:29 - Trial = 6641/30000 | Total reward = 38.03
2022-01-26 14:16:56.646 | DEBUG    | __main__:trials:24 - Trial = 6642/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.648 | DEBUG    | __main__:trials:29 - Trial = 6642/30000 | Total reward = 30.17
2022-01-26 14:16:56.651 | DEBUG    | __main__:trials:24 - Trial = 6643/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.651 | DEBUG    | __main__:trials:29 - Trial = 6643/30000 | Total reward = 42.59
2022-01-26 14:16:56.654 | DEBUG    | __main__:trials:24 - Trial = 6644/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.656 | DEBUG    | __main__:trials:29 - Trial = 6644/30000 | Total reward = 60.73
2022-01-26 14:16:56.659 | DEBUG    | __main__:trials:24 - Trial = 6645/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.661 | DEBUG    | __main__:trials:29 - Trial = 6645/30000 | Total reward = 43.84
2022-01-26 14:16:56.664 | DEBUG    | __main__:trials:24 - Trial = 6646/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.665 | DEBUG    | __main__:trials:29 - Trial = 6646/30000 | Total reward = 44.25
2022-01-26 14:16:56.668 | DEBUG    | __main__:trials:24 - Trial = 6647/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.670 | DEBUG    | __main__:trials:29 - Trial = 6647/30000 | Total reward = 28.24
2022-01-26 14:16:56.673 | DEBUG    | __main__:trials:24 - Trial = 6648/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.675 | DEBUG    | __main__:trials:29 - Trial = 6648/30000 | Total reward = 36.05
2022-01-26 14:16:56.678 | DEBUG    | __main__:trials:24 - Trial = 6649/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.680 | DEBUG    | __main__:trials:29 - Trial = 6649/30000 | Total reward = 43.84
2022-01-26 14:16:56.684 | DEBUG    | __main__:trials:24 - Trial = 6650/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.684 | DEBUG    | __main__:trials:29 - Trial = 6650/30000 | Total reward = 41.01
2022-01-26 14:16:56.688 | DEBUG    | __main__:trials:26 - Trial = 6651/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.689 | DEBUG    | __main__:trials:29 - Trial = 6651/30000 | Total reward = 28.13
2022-01-26 14:16:56.693 | DEBUG    | __main__:trials:24 - Trial = 6652/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.695 | DEBUG    | __main__:trials:29 - Trial = 6652/30000 | Total reward = 41.62
2022-01-26 14:16:56.698 | DEBUG    | __main__:trials:24 - Trial = 6653/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.700 | DEBUG    | __main__:trials:29 - Trial = 6653/30000 | Total reward = 43.59
2022-01-26 14:16:56.703 | DEBUG    | __main__:trials:24 - Trial = 6654/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.705 | DEBUG    | __main__:trials:29 - Trial = 6654/30000 | Total reward = 41.23
2022-01-26 14:16:56.708 | DEBUG    | __main__:trials:24 - Trial = 6655/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.709 | DEBUG    | __main__:trials:29 - Trial = 6655/30000 | Total reward = 37.48
2022-01-26 14:16:56.712 | DEBUG    | __main__:trials:24 - Trial = 6656/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.713 | DEBUG    | __main__:trials:29 - Trial = 6656/30000 | Total reward = 40.95
2022-01-26 14:16:56.716 | DEBUG    | __main__:trials:24 - Trial = 6657/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.718 | DEBUG    | __main__:trials:29 - Trial = 6657/30000 | Total reward = 43.96
2022-01-26 14:16:56.721 | DEBUG    | __main__:trials:24 - Trial = 6658/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.722 | DEBUG    | __main__:trials:29 - Trial = 6658/30000 | Total reward = 51.75
2022-01-26 14:16:56.725 | DEBUG    | __main__:trials:24 - Trial = 6659/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.727 | DEBUG    | __main__:trials:29 - Trial = 6659/30000 | Total reward = 58.94
2022-01-26 14:16:56.730 | DEBUG    | __main__:trials:24 - Trial = 6660/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.732 | DEBUG    | __main__:trials:29 - Trial = 6660/30000 | Total reward = 37.87
2022-01-26 14:16:56.735 | DEBUG    | __main__:trials:24 - Trial = 6661/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.737 | DEBUG    | __main__:trials:29 - Trial = 6661/30000 | Total reward = 47.90
2022-01-26 14:16:56.740 | DEBUG    | __main__:trials:24 - Trial = 6662/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.742 | DEBUG    | __main__:trials:29 - Trial = 6662/30000 | Total reward = 44.48
2022-01-26 14:16:56.746 | DEBUG    | __main__:trials:24 - Trial = 6663/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.746 | DEBUG    | __main__:trials:29 - Trial = 6663/30000 | Total reward = 43.84
2022-01-26 14:16:56.750 | DEBUG    | __main__:trials:24 - Trial = 6664/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.752 | DEBUG    | __main__:trials:29 - Trial = 6664/30000 | Total reward = 46.59
2022-01-26 14:16:56.756 | DEBUG    | __main__:trials:24 - Trial = 6665/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.757 | DEBUG    | __main__:trials:29 - Trial = 6665/30000 | Total reward = 58.28
2022-01-26 14:16:56.761 | DEBUG    | __main__:trials:24 - Trial = 6666/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.762 | DEBUG    | __main__:trials:29 - Trial = 6666/30000 | Total reward = 42.38
2022-01-26 14:16:56.766 | DEBUG    | __main__:trials:24 - Trial = 6667/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.768 | DEBUG    | __main__:trials:29 - Trial = 6667/30000 | Total reward = 33.23
2022-01-26 14:16:56.771 | DEBUG    | __main__:trials:24 - Trial = 6668/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.772 | DEBUG    | __main__:trials:29 - Trial = 6668/30000 | Total reward = 42.80
2022-01-26 14:16:56.776 | DEBUG    | __main__:trials:24 - Trial = 6669/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.778 | DEBUG    | __main__:trials:29 - Trial = 6669/30000 | Total reward = 38.00
2022-01-26 14:16:56.781 | DEBUG    | __main__:trials:24 - Trial = 6670/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.781 | DEBUG    | __main__:trials:29 - Trial = 6670/30000 | Total reward = 32.50
2022-01-26 14:16:56.786 | DEBUG    | __main__:trials:24 - Trial = 6671/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.786 | DEBUG    | __main__:trials:29 - Trial = 6671/30000 | Total reward = 30.92
2022-01-26 14:16:56.790 | DEBUG    | __main__:trials:24 - Trial = 6672/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.792 | DEBUG    | __main__:trials:29 - Trial = 6672/30000 | Total reward = 57.90
2022-01-26 14:16:56.795 | DEBUG    | __main__:trials:24 - Trial = 6673/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.796 | DEBUG    | __main__:trials:29 - Trial = 6673/30000 | Total reward = 44.38
2022-01-26 14:16:56.800 | DEBUG    | __main__:trials:24 - Trial = 6674/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.801 | DEBUG    | __main__:trials:29 - Trial = 6674/30000 | Total reward = 38.75
2022-01-26 14:16:56.805 | DEBUG    | __main__:trials:24 - Trial = 6675/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.805 | DEBUG    | __main__:trials:29 - Trial = 6675/30000 | Total reward = 34.98
2022-01-26 14:16:56.809 | DEBUG    | __main__:trials:24 - Trial = 6676/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.810 | DEBUG    | __main__:trials:29 - Trial = 6676/30000 | Total reward = 37.20
2022-01-26 14:16:56.814 | DEBUG    | __main__:trials:24 - Trial = 6677/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.815 | DEBUG    | __main__:trials:29 - Trial = 6677/30000 | Total reward = 43.53
2022-01-26 14:16:56.818 | DEBUG    | __main__:trials:24 - Trial = 6678/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.820 | DEBUG    | __main__:trials:29 - Trial = 6678/30000 | Total reward = 43.44
2022-01-26 14:16:56.824 | DEBUG    | __main__:trials:24 - Trial = 6679/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.825 | DEBUG    | __main__:trials:29 - Trial = 6679/30000 | Total reward = 27.33
2022-01-26 14:16:56.829 | DEBUG    | __main__:trials:24 - Trial = 6680/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.830 | DEBUG    | __main__:trials:29 - Trial = 6680/30000 | Total reward = 42.58
2022-01-26 14:16:56.834 | DEBUG    | __main__:trials:24 - Trial = 6681/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.835 | DEBUG    | __main__:trials:29 - Trial = 6681/30000 | Total reward = 35.98
2022-01-26 14:16:56.839 | DEBUG    | __main__:trials:24 - Trial = 6682/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.840 | DEBUG    | __main__:trials:29 - Trial = 6682/30000 | Total reward = 42.57
2022-01-26 14:16:56.844 | DEBUG    | __main__:trials:24 - Trial = 6683/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.846 | DEBUG    | __main__:trials:29 - Trial = 6683/30000 | Total reward = 36.37
2022-01-26 14:16:56.850 | DEBUG    | __main__:trials:24 - Trial = 6684/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.851 | DEBUG    | __main__:trials:29 - Trial = 6684/30000 | Total reward = 38.62
2022-01-26 14:16:56.855 | DEBUG    | __main__:trials:24 - Trial = 6685/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.856 | DEBUG    | __main__:trials:29 - Trial = 6685/30000 | Total reward = 34.43
2022-01-26 14:16:56.860 | DEBUG    | __main__:trials:24 - Trial = 6686/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.861 | DEBUG    | __main__:trials:29 - Trial = 6686/30000 | Total reward = 39.73
2022-01-26 14:16:56.865 | DEBUG    | __main__:trials:24 - Trial = 6687/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.866 | DEBUG    | __main__:trials:29 - Trial = 6687/30000 | Total reward = 35.54
2022-01-26 14:16:56.870 | DEBUG    | __main__:trials:24 - Trial = 6688/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.871 | DEBUG    | __main__:trials:29 - Trial = 6688/30000 | Total reward = 36.41
2022-01-26 14:16:56.874 | DEBUG    | __main__:trials:24 - Trial = 6689/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.875 | DEBUG    | __main__:trials:29 - Trial = 6689/30000 | Total reward = 28.34
2022-01-26 14:16:56.878 | DEBUG    | __main__:trials:24 - Trial = 6690/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.879 | DEBUG    | __main__:trials:29 - Trial = 6690/30000 | Total reward = 36.37
2022-01-26 14:16:56.882 | DEBUG    | __main__:trials:24 - Trial = 6691/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.884 | DEBUG    | __main__:trials:29 - Trial = 6691/30000 | Total reward = 35.90
2022-01-26 14:16:56.887 | DEBUG    | __main__:trials:24 - Trial = 6692/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.888 | DEBUG    | __main__:trials:29 - Trial = 6692/30000 | Total reward = 45.26
2022-01-26 14:16:56.892 | DEBUG    | __main__:trials:24 - Trial = 6693/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.893 | DEBUG    | __main__:trials:29 - Trial = 6693/30000 | Total reward = 34.13
2022-01-26 14:16:56.897 | DEBUG    | __main__:trials:24 - Trial = 6694/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.899 | DEBUG    | __main__:trials:29 - Trial = 6694/30000 | Total reward = 49.29
2022-01-26 14:16:56.902 | DEBUG    | __main__:trials:24 - Trial = 6695/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.903 | DEBUG    | __main__:trials:29 - Trial = 6695/30000 | Total reward = 36.50
2022-01-26 14:16:56.907 | DEBUG    | __main__:trials:24 - Trial = 6696/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.909 | DEBUG    | __main__:trials:29 - Trial = 6696/30000 | Total reward = 37.52
2022-01-26 14:16:56.911 | DEBUG    | __main__:trials:26 - Trial = 6697/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.913 | DEBUG    | __main__:trials:29 - Trial = 6697/30000 | Total reward = 21.38
2022-01-26 14:16:56.916 | DEBUG    | __main__:trials:26 - Trial = 6698/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.917 | DEBUG    | __main__:trials:29 - Trial = 6698/30000 | Total reward = 24.60
2022-01-26 14:16:56.920 | DEBUG    | __main__:trials:24 - Trial = 6699/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.922 | DEBUG    | __main__:trials:29 - Trial = 6699/30000 | Total reward = 46.73
2022-01-26 14:16:56.926 | DEBUG    | __main__:trials:24 - Trial = 6700/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.927 | DEBUG    | __main__:trials:29 - Trial = 6700/30000 | Total reward = 27.02
2022-01-26 14:16:56.930 | DEBUG    | __main__:trials:24 - Trial = 6701/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.932 | DEBUG    | __main__:trials:29 - Trial = 6701/30000 | Total reward = 62.51
2022-01-26 14:16:56.935 | DEBUG    | __main__:trials:24 - Trial = 6702/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.936 | DEBUG    | __main__:trials:29 - Trial = 6702/30000 | Total reward = 35.66
2022-01-26 14:16:56.940 | DEBUG    | __main__:trials:24 - Trial = 6703/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.941 | DEBUG    | __main__:trials:29 - Trial = 6703/30000 | Total reward = 32.03
2022-01-26 14:16:56.944 | DEBUG    | __main__:trials:24 - Trial = 6704/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.946 | DEBUG    | __main__:trials:29 - Trial = 6704/30000 | Total reward = 43.98
2022-01-26 14:16:56.950 | DEBUG    | __main__:trials:24 - Trial = 6705/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.951 | DEBUG    | __main__:trials:29 - Trial = 6705/30000 | Total reward = 30.65
2022-01-26 14:16:56.954 | DEBUG    | __main__:trials:24 - Trial = 6706/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.956 | DEBUG    | __main__:trials:29 - Trial = 6706/30000 | Total reward = 41.71
2022-01-26 14:16:56.959 | DEBUG    | __main__:trials:24 - Trial = 6707/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.960 | DEBUG    | __main__:trials:29 - Trial = 6707/30000 | Total reward = 33.98
2022-01-26 14:16:56.964 | DEBUG    | __main__:trials:24 - Trial = 6708/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.966 | DEBUG    | __main__:trials:29 - Trial = 6708/30000 | Total reward = 53.59
2022-01-26 14:16:56.969 | DEBUG    | __main__:trials:24 - Trial = 6709/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.971 | DEBUG    | __main__:trials:29 - Trial = 6709/30000 | Total reward = 38.91
2022-01-26 14:16:56.974 | DEBUG    | __main__:trials:24 - Trial = 6710/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.976 | DEBUG    | __main__:trials:29 - Trial = 6710/30000 | Total reward = 46.83
2022-01-26 14:16:56.980 | DEBUG    | __main__:trials:24 - Trial = 6711/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.981 | DEBUG    | __main__:trials:29 - Trial = 6711/30000 | Total reward = 60.87
2022-01-26 14:16:56.984 | DEBUG    | __main__:trials:26 - Trial = 6712/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:56.986 | DEBUG    | __main__:trials:29 - Trial = 6712/30000 | Total reward = 20.68
2022-01-26 14:16:56.990 | DEBUG    | __main__:trials:24 - Trial = 6713/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.991 | DEBUG    | __main__:trials:29 - Trial = 6713/30000 | Total reward = 36.37
2022-01-26 14:16:56.995 | DEBUG    | __main__:trials:24 - Trial = 6714/30000 | Max number of steps (20) reached
2022-01-26 14:16:56.996 | DEBUG    | __main__:trials:29 - Trial = 6714/30000 | Total reward = 40.01
2022-01-26 14:16:57.000 | DEBUG    | __main__:trials:24 - Trial = 6715/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.001 | DEBUG    | __main__:trials:29 - Trial = 6715/30000 | Total reward = 49.66
2022-01-26 14:16:57.004 | DEBUG    | __main__:trials:24 - Trial = 6716/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.006 | DEBUG    | __main__:trials:29 - Trial = 6716/30000 | Total reward = 43.39
2022-01-26 14:16:57.010 | DEBUG    | __main__:trials:24 - Trial = 6717/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.012 | DEBUG    | __main__:trials:29 - Trial = 6717/30000 | Total reward = 35.06
2022-01-26 14:16:57.015 | DEBUG    | __main__:trials:24 - Trial = 6718/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.017 | DEBUG    | __main__:trials:29 - Trial = 6718/30000 | Total reward = 48.15
2022-01-26 14:16:57.020 | DEBUG    | __main__:trials:24 - Trial = 6719/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.021 | DEBUG    | __main__:trials:29 - Trial = 6719/30000 | Total reward = 39.94
2022-01-26 14:16:57.025 | DEBUG    | __main__:trials:24 - Trial = 6720/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.026 | DEBUG    | __main__:trials:29 - Trial = 6720/30000 | Total reward = 39.74
2022-01-26 14:16:57.030 | DEBUG    | __main__:trials:24 - Trial = 6721/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.032 | DEBUG    | __main__:trials:29 - Trial = 6721/30000 | Total reward = 43.22
2022-01-26 14:16:57.035 | DEBUG    | __main__:trials:24 - Trial = 6722/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.037 | DEBUG    | __main__:trials:29 - Trial = 6722/30000 | Total reward = 37.03
2022-01-26 14:16:57.040 | DEBUG    | __main__:trials:24 - Trial = 6723/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.042 | DEBUG    | __main__:trials:29 - Trial = 6723/30000 | Total reward = 44.88
2022-01-26 14:16:57.045 | DEBUG    | __main__:trials:24 - Trial = 6724/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.046 | DEBUG    | __main__:trials:29 - Trial = 6724/30000 | Total reward = 36.42
2022-01-26 14:16:57.048 | DEBUG    | __main__:trials:26 - Trial = 6725/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.050 | DEBUG    | __main__:trials:29 - Trial = 6725/30000 | Total reward = 23.99
2022-01-26 14:16:57.054 | DEBUG    | __main__:trials:24 - Trial = 6726/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.054 | DEBUG    | __main__:trials:29 - Trial = 6726/30000 | Total reward = 36.50
2022-01-26 14:16:57.058 | DEBUG    | __main__:trials:24 - Trial = 6727/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.060 | DEBUG    | __main__:trials:29 - Trial = 6727/30000 | Total reward = 36.37
2022-01-26 14:16:57.063 | DEBUG    | __main__:trials:24 - Trial = 6728/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.065 | DEBUG    | __main__:trials:29 - Trial = 6728/30000 | Total reward = 43.42
2022-01-26 14:16:57.068 | DEBUG    | __main__:trials:24 - Trial = 6729/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.070 | DEBUG    | __main__:trials:29 - Trial = 6729/30000 | Total reward = 44.59
2022-01-26 14:16:57.073 | DEBUG    | __main__:trials:24 - Trial = 6730/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.075 | DEBUG    | __main__:trials:29 - Trial = 6730/30000 | Total reward = 43.30
2022-01-26 14:16:57.079 | DEBUG    | __main__:trials:24 - Trial = 6731/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.080 | DEBUG    | __main__:trials:29 - Trial = 6731/30000 | Total reward = 30.61
2022-01-26 14:16:57.083 | DEBUG    | __main__:trials:26 - Trial = 6732/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.085 | DEBUG    | __main__:trials:29 - Trial = 6732/30000 | Total reward = 22.09
2022-01-26 14:16:57.088 | DEBUG    | __main__:trials:24 - Trial = 6733/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.090 | DEBUG    | __main__:trials:29 - Trial = 6733/30000 | Total reward = 56.06
2022-01-26 14:16:57.092 | DEBUG    | __main__:trials:24 - Trial = 6734/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.094 | DEBUG    | __main__:trials:29 - Trial = 6734/30000 | Total reward = 45.77
2022-01-26 14:16:57.098 | DEBUG    | __main__:trials:24 - Trial = 6735/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.099 | DEBUG    | __main__:trials:29 - Trial = 6735/30000 | Total reward = 42.34
2022-01-26 14:16:57.103 | DEBUG    | __main__:trials:24 - Trial = 6736/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.104 | DEBUG    | __main__:trials:29 - Trial = 6736/30000 | Total reward = 44.47
2022-01-26 14:16:57.107 | DEBUG    | __main__:trials:26 - Trial = 6737/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.109 | DEBUG    | __main__:trials:29 - Trial = 6737/30000 | Total reward = 22.76
2022-01-26 14:16:57.112 | DEBUG    | __main__:trials:24 - Trial = 6738/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.114 | DEBUG    | __main__:trials:29 - Trial = 6738/30000 | Total reward = 37.32
2022-01-26 14:16:57.118 | DEBUG    | __main__:trials:24 - Trial = 6739/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.119 | DEBUG    | __main__:trials:29 - Trial = 6739/30000 | Total reward = 30.08
2022-01-26 14:16:57.121 | DEBUG    | __main__:trials:26 - Trial = 6740/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.122 | DEBUG    | __main__:trials:29 - Trial = 6740/30000 | Total reward = 21.38
2022-01-26 14:16:57.125 | DEBUG    | __main__:trials:24 - Trial = 6741/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.126 | DEBUG    | __main__:trials:29 - Trial = 6741/30000 | Total reward = 40.55
2022-01-26 14:16:57.128 | DEBUG    | __main__:trials:26 - Trial = 6742/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.130 | DEBUG    | __main__:trials:29 - Trial = 6742/30000 | Total reward = 19.20
2022-01-26 14:16:57.133 | DEBUG    | __main__:trials:24 - Trial = 6743/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.135 | DEBUG    | __main__:trials:29 - Trial = 6743/30000 | Total reward = 49.51
2022-01-26 14:16:57.138 | DEBUG    | __main__:trials:24 - Trial = 6744/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.140 | DEBUG    | __main__:trials:29 - Trial = 6744/30000 | Total reward = 32.14
2022-01-26 14:16:57.142 | DEBUG    | __main__:trials:26 - Trial = 6745/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.143 | DEBUG    | __main__:trials:29 - Trial = 6745/30000 | Total reward = 17.44
2022-01-26 14:16:57.147 | DEBUG    | __main__:trials:24 - Trial = 6746/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.149 | DEBUG    | __main__:trials:29 - Trial = 6746/30000 | Total reward = 44.77
2022-01-26 14:16:57.153 | DEBUG    | __main__:trials:24 - Trial = 6747/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.154 | DEBUG    | __main__:trials:29 - Trial = 6747/30000 | Total reward = 45.14
2022-01-26 14:16:57.157 | DEBUG    | __main__:trials:24 - Trial = 6748/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.158 | DEBUG    | __main__:trials:29 - Trial = 6748/30000 | Total reward = 35.21
2022-01-26 14:16:57.162 | DEBUG    | __main__:trials:24 - Trial = 6749/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.164 | DEBUG    | __main__:trials:29 - Trial = 6749/30000 | Total reward = 35.23
2022-01-26 14:16:57.167 | DEBUG    | __main__:trials:24 - Trial = 6750/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.167 | DEBUG    | __main__:trials:29 - Trial = 6750/30000 | Total reward = 42.92
2022-01-26 14:16:57.171 | DEBUG    | __main__:trials:24 - Trial = 6751/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.172 | DEBUG    | __main__:trials:29 - Trial = 6751/30000 | Total reward = 44.04
2022-01-26 14:16:57.176 | DEBUG    | __main__:trials:24 - Trial = 6752/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.178 | DEBUG    | __main__:trials:29 - Trial = 6752/30000 | Total reward = 36.79
2022-01-26 14:16:57.181 | DEBUG    | __main__:trials:24 - Trial = 6753/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.183 | DEBUG    | __main__:trials:29 - Trial = 6753/30000 | Total reward = 31.60
2022-01-26 14:16:57.186 | DEBUG    | __main__:trials:24 - Trial = 6754/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.188 | DEBUG    | __main__:trials:29 - Trial = 6754/30000 | Total reward = 36.98
2022-01-26 14:16:57.191 | DEBUG    | __main__:trials:24 - Trial = 6755/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.192 | DEBUG    | __main__:trials:29 - Trial = 6755/30000 | Total reward = 31.90
2022-01-26 14:16:57.196 | DEBUG    | __main__:trials:24 - Trial = 6756/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.198 | DEBUG    | __main__:trials:29 - Trial = 6756/30000 | Total reward = 44.69
2022-01-26 14:16:57.201 | DEBUG    | __main__:trials:24 - Trial = 6757/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.203 | DEBUG    | __main__:trials:29 - Trial = 6757/30000 | Total reward = 44.88
2022-01-26 14:16:57.207 | DEBUG    | __main__:trials:24 - Trial = 6758/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.208 | DEBUG    | __main__:trials:29 - Trial = 6758/30000 | Total reward = 37.49
2022-01-26 14:16:57.212 | DEBUG    | __main__:trials:24 - Trial = 6759/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.213 | DEBUG    | __main__:trials:29 - Trial = 6759/30000 | Total reward = 45.88
2022-01-26 14:16:57.217 | DEBUG    | __main__:trials:24 - Trial = 6760/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.219 | DEBUG    | __main__:trials:29 - Trial = 6760/30000 | Total reward = 40.69
2022-01-26 14:16:57.223 | DEBUG    | __main__:trials:24 - Trial = 6761/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.224 | DEBUG    | __main__:trials:29 - Trial = 6761/30000 | Total reward = 39.85
2022-01-26 14:16:57.227 | DEBUG    | __main__:trials:24 - Trial = 6762/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.229 | DEBUG    | __main__:trials:29 - Trial = 6762/30000 | Total reward = 46.85
2022-01-26 14:16:57.232 | DEBUG    | __main__:trials:24 - Trial = 6763/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.234 | DEBUG    | __main__:trials:29 - Trial = 6763/30000 | Total reward = 32.05
2022-01-26 14:16:57.238 | DEBUG    | __main__:trials:24 - Trial = 6764/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.239 | DEBUG    | __main__:trials:29 - Trial = 6764/30000 | Total reward = 41.53
2022-01-26 14:16:57.243 | DEBUG    | __main__:trials:24 - Trial = 6765/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.244 | DEBUG    | __main__:trials:29 - Trial = 6765/30000 | Total reward = 37.40
2022-01-26 14:16:57.248 | DEBUG    | __main__:trials:24 - Trial = 6766/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.250 | DEBUG    | __main__:trials:29 - Trial = 6766/30000 | Total reward = 48.48
2022-01-26 14:16:57.253 | DEBUG    | __main__:trials:24 - Trial = 6767/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.255 | DEBUG    | __main__:trials:29 - Trial = 6767/30000 | Total reward = 28.52
2022-01-26 14:16:57.258 | DEBUG    | __main__:trials:24 - Trial = 6768/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.259 | DEBUG    | __main__:trials:29 - Trial = 6768/30000 | Total reward = 46.20
2022-01-26 14:16:57.263 | DEBUG    | __main__:trials:24 - Trial = 6769/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.265 | DEBUG    | __main__:trials:29 - Trial = 6769/30000 | Total reward = 44.48
2022-01-26 14:16:57.268 | DEBUG    | __main__:trials:24 - Trial = 6770/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.269 | DEBUG    | __main__:trials:29 - Trial = 6770/30000 | Total reward = 17.69
2022-01-26 14:16:57.272 | DEBUG    | __main__:trials:24 - Trial = 6771/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.273 | DEBUG    | __main__:trials:29 - Trial = 6771/30000 | Total reward = 56.64
2022-01-26 14:16:57.277 | DEBUG    | __main__:trials:24 - Trial = 6772/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.278 | DEBUG    | __main__:trials:29 - Trial = 6772/30000 | Total reward = 39.26
2022-01-26 14:16:57.282 | DEBUG    | __main__:trials:24 - Trial = 6773/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.284 | DEBUG    | __main__:trials:29 - Trial = 6773/30000 | Total reward = 61.37
2022-01-26 14:16:57.287 | DEBUG    | __main__:trials:24 - Trial = 6774/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.289 | DEBUG    | __main__:trials:29 - Trial = 6774/30000 | Total reward = 46.09
2022-01-26 14:16:57.292 | DEBUG    | __main__:trials:24 - Trial = 6775/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.294 | DEBUG    | __main__:trials:29 - Trial = 6775/30000 | Total reward = 57.54
2022-01-26 14:16:57.297 | DEBUG    | __main__:trials:24 - Trial = 6776/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.299 | DEBUG    | __main__:trials:29 - Trial = 6776/30000 | Total reward = 36.25
2022-01-26 14:16:57.302 | DEBUG    | __main__:trials:24 - Trial = 6777/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.304 | DEBUG    | __main__:trials:29 - Trial = 6777/30000 | Total reward = 45.55
2022-01-26 14:16:57.307 | DEBUG    | __main__:trials:24 - Trial = 6778/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.309 | DEBUG    | __main__:trials:29 - Trial = 6778/30000 | Total reward = 41.36
2022-01-26 14:16:57.312 | DEBUG    | __main__:trials:24 - Trial = 6779/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.314 | DEBUG    | __main__:trials:29 - Trial = 6779/30000 | Total reward = 52.08
2022-01-26 14:16:57.317 | DEBUG    | __main__:trials:24 - Trial = 6780/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.318 | DEBUG    | __main__:trials:29 - Trial = 6780/30000 | Total reward = 43.34
2022-01-26 14:16:57.323 | DEBUG    | __main__:trials:24 - Trial = 6781/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.325 | DEBUG    | __main__:trials:29 - Trial = 6781/30000 | Total reward = 49.42
2022-01-26 14:16:57.327 | DEBUG    | __main__:trials:24 - Trial = 6782/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.329 | DEBUG    | __main__:trials:29 - Trial = 6782/30000 | Total reward = 48.99
2022-01-26 14:16:57.333 | DEBUG    | __main__:trials:24 - Trial = 6783/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.335 | DEBUG    | __main__:trials:29 - Trial = 6783/30000 | Total reward = 47.34
2022-01-26 14:16:57.338 | DEBUG    | __main__:trials:24 - Trial = 6784/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.340 | DEBUG    | __main__:trials:29 - Trial = 6784/30000 | Total reward = 44.61
2022-01-26 14:16:57.344 | DEBUG    | __main__:trials:24 - Trial = 6785/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.345 | DEBUG    | __main__:trials:29 - Trial = 6785/30000 | Total reward = 43.59
2022-01-26 14:16:57.349 | DEBUG    | __main__:trials:24 - Trial = 6786/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.350 | DEBUG    | __main__:trials:29 - Trial = 6786/30000 | Total reward = 38.12
2022-01-26 14:16:57.354 | DEBUG    | __main__:trials:24 - Trial = 6787/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.356 | DEBUG    | __main__:trials:29 - Trial = 6787/30000 | Total reward = 42.96
2022-01-26 14:16:57.359 | DEBUG    | __main__:trials:24 - Trial = 6788/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.361 | DEBUG    | __main__:trials:29 - Trial = 6788/30000 | Total reward = 48.76
2022-01-26 14:16:57.364 | DEBUG    | __main__:trials:24 - Trial = 6789/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.366 | DEBUG    | __main__:trials:29 - Trial = 6789/30000 | Total reward = 53.44
2022-01-26 14:16:57.370 | DEBUG    | __main__:trials:24 - Trial = 6790/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.371 | DEBUG    | __main__:trials:29 - Trial = 6790/30000 | Total reward = 41.23
2022-01-26 14:16:57.374 | DEBUG    | __main__:trials:24 - Trial = 6791/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.376 | DEBUG    | __main__:trials:29 - Trial = 6791/30000 | Total reward = 45.99
2022-01-26 14:16:57.378 | DEBUG    | __main__:trials:24 - Trial = 6792/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.380 | DEBUG    | __main__:trials:29 - Trial = 6792/30000 | Total reward = 34.36
2022-01-26 14:16:57.384 | DEBUG    | __main__:trials:24 - Trial = 6793/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.386 | DEBUG    | __main__:trials:29 - Trial = 6793/30000 | Total reward = 46.58
2022-01-26 14:16:57.389 | DEBUG    | __main__:trials:24 - Trial = 6794/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.391 | DEBUG    | __main__:trials:29 - Trial = 6794/30000 | Total reward = 51.18
2022-01-26 14:16:57.395 | DEBUG    | __main__:trials:24 - Trial = 6795/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.396 | DEBUG    | __main__:trials:29 - Trial = 6795/30000 | Total reward = 41.96
2022-01-26 14:16:57.400 | DEBUG    | __main__:trials:24 - Trial = 6796/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.401 | DEBUG    | __main__:trials:29 - Trial = 6796/30000 | Total reward = 38.81
2022-01-26 14:16:57.405 | DEBUG    | __main__:trials:24 - Trial = 6797/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.406 | DEBUG    | __main__:trials:29 - Trial = 6797/30000 | Total reward = 44.02
2022-01-26 14:16:57.409 | DEBUG    | __main__:trials:24 - Trial = 6798/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.411 | DEBUG    | __main__:trials:29 - Trial = 6798/30000 | Total reward = 43.00
2022-01-26 14:16:57.414 | DEBUG    | __main__:trials:24 - Trial = 6799/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.416 | DEBUG    | __main__:trials:29 - Trial = 6799/30000 | Total reward = 36.37
2022-01-26 14:16:57.420 | DEBUG    | __main__:trials:24 - Trial = 6800/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.421 | DEBUG    | __main__:trials:29 - Trial = 6800/30000 | Total reward = 39.82
2022-01-26 14:16:57.425 | DEBUG    | __main__:trials:24 - Trial = 6801/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.426 | DEBUG    | __main__:trials:29 - Trial = 6801/30000 | Total reward = 34.33
2022-01-26 14:16:57.429 | DEBUG    | __main__:trials:24 - Trial = 6802/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.431 | DEBUG    | __main__:trials:29 - Trial = 6802/30000 | Total reward = 33.88
2022-01-26 14:16:57.434 | DEBUG    | __main__:trials:24 - Trial = 6803/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.435 | DEBUG    | __main__:trials:29 - Trial = 6803/30000 | Total reward = 45.05
2022-01-26 14:16:57.439 | DEBUG    | __main__:trials:24 - Trial = 6804/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.439 | DEBUG    | __main__:trials:29 - Trial = 6804/30000 | Total reward = 47.61
2022-01-26 14:16:57.443 | DEBUG    | __main__:trials:24 - Trial = 6805/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.445 | DEBUG    | __main__:trials:29 - Trial = 6805/30000 | Total reward = 46.52
2022-01-26 14:16:57.448 | DEBUG    | __main__:trials:24 - Trial = 6806/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.450 | DEBUG    | __main__:trials:29 - Trial = 6806/30000 | Total reward = 40.52
2022-01-26 14:16:57.454 | DEBUG    | __main__:trials:24 - Trial = 6807/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.454 | DEBUG    | __main__:trials:29 - Trial = 6807/30000 | Total reward = 51.31
2022-01-26 14:16:57.458 | DEBUG    | __main__:trials:24 - Trial = 6808/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.460 | DEBUG    | __main__:trials:29 - Trial = 6808/30000 | Total reward = 42.17
2022-01-26 14:16:57.463 | DEBUG    | __main__:trials:24 - Trial = 6809/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.465 | DEBUG    | __main__:trials:29 - Trial = 6809/30000 | Total reward = 47.03
2022-01-26 14:16:57.468 | DEBUG    | __main__:trials:24 - Trial = 6810/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.470 | DEBUG    | __main__:trials:29 - Trial = 6810/30000 | Total reward = 36.18
2022-01-26 14:16:57.474 | DEBUG    | __main__:trials:24 - Trial = 6811/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.475 | DEBUG    | __main__:trials:29 - Trial = 6811/30000 | Total reward = 36.72
2022-01-26 14:16:57.479 | DEBUG    | __main__:trials:24 - Trial = 6812/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.480 | DEBUG    | __main__:trials:29 - Trial = 6812/30000 | Total reward = 31.05
2022-01-26 14:16:57.484 | DEBUG    | __main__:trials:24 - Trial = 6813/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.485 | DEBUG    | __main__:trials:29 - Trial = 6813/30000 | Total reward = 33.19
2022-01-26 14:16:57.489 | DEBUG    | __main__:trials:24 - Trial = 6814/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.491 | DEBUG    | __main__:trials:29 - Trial = 6814/30000 | Total reward = 44.06
2022-01-26 14:16:57.494 | DEBUG    | __main__:trials:24 - Trial = 6815/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.496 | DEBUG    | __main__:trials:29 - Trial = 6815/30000 | Total reward = 35.23
2022-01-26 14:16:57.500 | DEBUG    | __main__:trials:24 - Trial = 6816/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.500 | DEBUG    | __main__:trials:29 - Trial = 6816/30000 | Total reward = 43.57
2022-01-26 14:16:57.504 | DEBUG    | __main__:trials:24 - Trial = 6817/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.506 | DEBUG    | __main__:trials:29 - Trial = 6817/30000 | Total reward = 47.31
2022-01-26 14:16:57.510 | DEBUG    | __main__:trials:24 - Trial = 6818/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.511 | DEBUG    | __main__:trials:29 - Trial = 6818/30000 | Total reward = 35.03
2022-01-26 14:16:57.514 | DEBUG    | __main__:trials:26 - Trial = 6819/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.516 | DEBUG    | __main__:trials:29 - Trial = 6819/30000 | Total reward = 18.03
2022-01-26 14:16:57.519 | DEBUG    | __main__:trials:24 - Trial = 6820/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.521 | DEBUG    | __main__:trials:29 - Trial = 6820/30000 | Total reward = 37.40
2022-01-26 14:16:57.524 | DEBUG    | __main__:trials:24 - Trial = 6821/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.526 | DEBUG    | __main__:trials:29 - Trial = 6821/30000 | Total reward = 42.91
2022-01-26 14:16:57.529 | DEBUG    | __main__:trials:24 - Trial = 6822/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.531 | DEBUG    | __main__:trials:29 - Trial = 6822/30000 | Total reward = 35.42
2022-01-26 14:16:57.535 | DEBUG    | __main__:trials:24 - Trial = 6823/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.536 | DEBUG    | __main__:trials:29 - Trial = 6823/30000 | Total reward = 36.37
2022-01-26 14:16:57.540 | DEBUG    | __main__:trials:24 - Trial = 6824/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.541 | DEBUG    | __main__:trials:29 - Trial = 6824/30000 | Total reward = 36.52
2022-01-26 14:16:57.544 | DEBUG    | __main__:trials:24 - Trial = 6825/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.546 | DEBUG    | __main__:trials:29 - Trial = 6825/30000 | Total reward = 32.00
2022-01-26 14:16:57.549 | DEBUG    | __main__:trials:24 - Trial = 6826/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.551 | DEBUG    | __main__:trials:29 - Trial = 6826/30000 | Total reward = 42.23
2022-01-26 14:16:57.554 | DEBUG    | __main__:trials:24 - Trial = 6827/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.556 | DEBUG    | __main__:trials:29 - Trial = 6827/30000 | Total reward = 35.35
2022-01-26 14:16:57.560 | DEBUG    | __main__:trials:24 - Trial = 6828/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.561 | DEBUG    | __main__:trials:29 - Trial = 6828/30000 | Total reward = 42.00
2022-01-26 14:16:57.565 | DEBUG    | __main__:trials:24 - Trial = 6829/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.565 | DEBUG    | __main__:trials:29 - Trial = 6829/30000 | Total reward = 48.91
2022-01-26 14:16:57.568 | DEBUG    | __main__:trials:26 - Trial = 6830/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.569 | DEBUG    | __main__:trials:29 - Trial = 6830/30000 | Total reward = 25.02
2022-01-26 14:16:57.573 | DEBUG    | __main__:trials:24 - Trial = 6831/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.574 | DEBUG    | __main__:trials:29 - Trial = 6831/30000 | Total reward = 52.12
2022-01-26 14:16:57.578 | DEBUG    | __main__:trials:24 - Trial = 6832/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.579 | DEBUG    | __main__:trials:29 - Trial = 6832/30000 | Total reward = 41.77
2022-01-26 14:16:57.583 | DEBUG    | __main__:trials:24 - Trial = 6833/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.585 | DEBUG    | __main__:trials:29 - Trial = 6833/30000 | Total reward = 43.98
2022-01-26 14:16:57.588 | DEBUG    | __main__:trials:24 - Trial = 6834/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.590 | DEBUG    | __main__:trials:29 - Trial = 6834/30000 | Total reward = 31.37
2022-01-26 14:16:57.593 | DEBUG    | __main__:trials:24 - Trial = 6835/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.595 | DEBUG    | __main__:trials:29 - Trial = 6835/30000 | Total reward = 36.11
2022-01-26 14:16:57.599 | DEBUG    | __main__:trials:24 - Trial = 6836/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.600 | DEBUG    | __main__:trials:29 - Trial = 6836/30000 | Total reward = 33.73
2022-01-26 14:16:57.604 | DEBUG    | __main__:trials:24 - Trial = 6837/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.605 | DEBUG    | __main__:trials:29 - Trial = 6837/30000 | Total reward = 43.90
2022-01-26 14:16:57.609 | DEBUG    | __main__:trials:24 - Trial = 6838/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.611 | DEBUG    | __main__:trials:29 - Trial = 6838/30000 | Total reward = 37.21
2022-01-26 14:16:57.614 | DEBUG    | __main__:trials:24 - Trial = 6839/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.615 | DEBUG    | __main__:trials:29 - Trial = 6839/30000 | Total reward = 36.10
2022-01-26 14:16:57.619 | DEBUG    | __main__:trials:24 - Trial = 6840/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.621 | DEBUG    | __main__:trials:29 - Trial = 6840/30000 | Total reward = 43.06
2022-01-26 14:16:57.624 | DEBUG    | __main__:trials:24 - Trial = 6841/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.626 | DEBUG    | __main__:trials:29 - Trial = 6841/30000 | Total reward = 49.56
2022-01-26 14:16:57.630 | DEBUG    | __main__:trials:24 - Trial = 6842/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.631 | DEBUG    | __main__:trials:29 - Trial = 6842/30000 | Total reward = 36.26
2022-01-26 14:16:57.635 | DEBUG    | __main__:trials:24 - Trial = 6843/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.636 | DEBUG    | __main__:trials:29 - Trial = 6843/30000 | Total reward = 35.91
2022-01-26 14:16:57.640 | DEBUG    | __main__:trials:24 - Trial = 6844/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.641 | DEBUG    | __main__:trials:29 - Trial = 6844/30000 | Total reward = 35.17
2022-01-26 14:16:57.645 | DEBUG    | __main__:trials:24 - Trial = 6845/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.647 | DEBUG    | __main__:trials:29 - Trial = 6845/30000 | Total reward = 40.81
2022-01-26 14:16:57.650 | DEBUG    | __main__:trials:24 - Trial = 6846/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.652 | DEBUG    | __main__:trials:29 - Trial = 6846/30000 | Total reward = 36.50
2022-01-26 14:16:57.655 | DEBUG    | __main__:trials:24 - Trial = 6847/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.657 | DEBUG    | __main__:trials:29 - Trial = 6847/30000 | Total reward = 36.70
2022-01-26 14:16:57.660 | DEBUG    | __main__:trials:24 - Trial = 6848/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.662 | DEBUG    | __main__:trials:29 - Trial = 6848/30000 | Total reward = 44.24
2022-01-26 14:16:57.666 | DEBUG    | __main__:trials:24 - Trial = 6849/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.667 | DEBUG    | __main__:trials:29 - Trial = 6849/30000 | Total reward = 42.88
2022-01-26 14:16:57.671 | DEBUG    | __main__:trials:26 - Trial = 6850/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.672 | DEBUG    | __main__:trials:29 - Trial = 6850/30000 | Total reward = 30.22
2022-01-26 14:16:57.676 | DEBUG    | __main__:trials:24 - Trial = 6851/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.677 | DEBUG    | __main__:trials:29 - Trial = 6851/30000 | Total reward = 36.41
2022-01-26 14:16:57.681 | DEBUG    | __main__:trials:24 - Trial = 6852/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.682 | DEBUG    | __main__:trials:29 - Trial = 6852/30000 | Total reward = 32.08
2022-01-26 14:16:57.686 | DEBUG    | __main__:trials:24 - Trial = 6853/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.688 | DEBUG    | __main__:trials:29 - Trial = 6853/30000 | Total reward = 44.48
2022-01-26 14:16:57.691 | DEBUG    | __main__:trials:24 - Trial = 6854/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.693 | DEBUG    | __main__:trials:29 - Trial = 6854/30000 | Total reward = 41.55
2022-01-26 14:16:57.696 | DEBUG    | __main__:trials:24 - Trial = 6855/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.698 | DEBUG    | __main__:trials:29 - Trial = 6855/30000 | Total reward = 39.10
2022-01-26 14:16:57.701 | DEBUG    | __main__:trials:24 - Trial = 6856/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.703 | DEBUG    | __main__:trials:29 - Trial = 6856/30000 | Total reward = 30.96
2022-01-26 14:16:57.706 | DEBUG    | __main__:trials:26 - Trial = 6857/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.708 | DEBUG    | __main__:trials:29 - Trial = 6857/30000 | Total reward = 28.39
2022-01-26 14:16:57.711 | DEBUG    | __main__:trials:24 - Trial = 6858/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.713 | DEBUG    | __main__:trials:29 - Trial = 6858/30000 | Total reward = 55.82
2022-01-26 14:16:57.716 | DEBUG    | __main__:trials:24 - Trial = 6859/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.717 | DEBUG    | __main__:trials:29 - Trial = 6859/30000 | Total reward = 36.57
2022-01-26 14:16:57.722 | DEBUG    | __main__:trials:24 - Trial = 6860/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.722 | DEBUG    | __main__:trials:29 - Trial = 6860/30000 | Total reward = 45.76
2022-01-26 14:16:57.726 | DEBUG    | __main__:trials:26 - Trial = 6861/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.728 | DEBUG    | __main__:trials:29 - Trial = 6861/30000 | Total reward = 20.20
2022-01-26 14:16:57.731 | DEBUG    | __main__:trials:24 - Trial = 6862/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.732 | DEBUG    | __main__:trials:29 - Trial = 6862/30000 | Total reward = 37.24
2022-01-26 14:16:57.736 | DEBUG    | __main__:trials:24 - Trial = 6863/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.738 | DEBUG    | __main__:trials:29 - Trial = 6863/30000 | Total reward = 49.44
2022-01-26 14:16:57.741 | DEBUG    | __main__:trials:24 - Trial = 6864/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.743 | DEBUG    | __main__:trials:29 - Trial = 6864/30000 | Total reward = 40.75
2022-01-26 14:16:57.746 | DEBUG    | __main__:trials:24 - Trial = 6865/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.748 | DEBUG    | __main__:trials:29 - Trial = 6865/30000 | Total reward = 34.78
2022-01-26 14:16:57.752 | DEBUG    | __main__:trials:24 - Trial = 6866/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.753 | DEBUG    | __main__:trials:29 - Trial = 6866/30000 | Total reward = 33.67
2022-01-26 14:16:57.756 | DEBUG    | __main__:trials:24 - Trial = 6867/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.758 | DEBUG    | __main__:trials:29 - Trial = 6867/30000 | Total reward = 46.72
2022-01-26 14:16:57.762 | DEBUG    | __main__:trials:24 - Trial = 6868/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.762 | DEBUG    | __main__:trials:29 - Trial = 6868/30000 | Total reward = 40.99
2022-01-26 14:16:57.766 | DEBUG    | __main__:trials:24 - Trial = 6869/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.768 | DEBUG    | __main__:trials:29 - Trial = 6869/30000 | Total reward = 41.89
2022-01-26 14:16:57.772 | DEBUG    | __main__:trials:24 - Trial = 6870/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.773 | DEBUG    | __main__:trials:29 - Trial = 6870/30000 | Total reward = 39.32
2022-01-26 14:16:57.777 | DEBUG    | __main__:trials:24 - Trial = 6871/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.779 | DEBUG    | __main__:trials:29 - Trial = 6871/30000 | Total reward = 44.36
2022-01-26 14:16:57.782 | DEBUG    | __main__:trials:24 - Trial = 6872/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.784 | DEBUG    | __main__:trials:29 - Trial = 6872/30000 | Total reward = 36.57
2022-01-26 14:16:57.787 | DEBUG    | __main__:trials:24 - Trial = 6873/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.789 | DEBUG    | __main__:trials:29 - Trial = 6873/30000 | Total reward = 36.57
2022-01-26 14:16:57.792 | DEBUG    | __main__:trials:24 - Trial = 6874/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.793 | DEBUG    | __main__:trials:29 - Trial = 6874/30000 | Total reward = 31.44
2022-01-26 14:16:57.798 | DEBUG    | __main__:trials:24 - Trial = 6875/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.798 | DEBUG    | __main__:trials:29 - Trial = 6875/30000 | Total reward = 43.66
2022-01-26 14:16:57.802 | DEBUG    | __main__:trials:24 - Trial = 6876/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.804 | DEBUG    | __main__:trials:29 - Trial = 6876/30000 | Total reward = 43.87
2022-01-26 14:16:57.807 | DEBUG    | __main__:trials:26 - Trial = 6877/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.808 | DEBUG    | __main__:trials:29 - Trial = 6877/30000 | Total reward = 33.42
2022-01-26 14:16:57.812 | DEBUG    | __main__:trials:24 - Trial = 6878/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.814 | DEBUG    | __main__:trials:29 - Trial = 6878/30000 | Total reward = 36.64
2022-01-26 14:16:57.817 | DEBUG    | __main__:trials:24 - Trial = 6879/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.819 | DEBUG    | __main__:trials:29 - Trial = 6879/30000 | Total reward = 36.70
2022-01-26 14:16:57.822 | DEBUG    | __main__:trials:24 - Trial = 6880/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.824 | DEBUG    | __main__:trials:29 - Trial = 6880/30000 | Total reward = 34.54
2022-01-26 14:16:57.828 | DEBUG    | __main__:trials:24 - Trial = 6881/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.829 | DEBUG    | __main__:trials:29 - Trial = 6881/30000 | Total reward = 36.48
2022-01-26 14:16:57.833 | DEBUG    | __main__:trials:24 - Trial = 6882/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.835 | DEBUG    | __main__:trials:29 - Trial = 6882/30000 | Total reward = 43.04
2022-01-26 14:16:57.838 | DEBUG    | __main__:trials:24 - Trial = 6883/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.839 | DEBUG    | __main__:trials:29 - Trial = 6883/30000 | Total reward = 57.48
2022-01-26 14:16:57.842 | DEBUG    | __main__:trials:24 - Trial = 6884/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.844 | DEBUG    | __main__:trials:29 - Trial = 6884/30000 | Total reward = 36.37
2022-01-26 14:16:57.848 | DEBUG    | __main__:trials:24 - Trial = 6885/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.849 | DEBUG    | __main__:trials:29 - Trial = 6885/30000 | Total reward = 34.08
2022-01-26 14:16:57.853 | DEBUG    | __main__:trials:24 - Trial = 6886/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.855 | DEBUG    | __main__:trials:29 - Trial = 6886/30000 | Total reward = 43.11
2022-01-26 14:16:57.857 | DEBUG    | __main__:trials:24 - Trial = 6887/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.858 | DEBUG    | __main__:trials:29 - Trial = 6887/30000 | Total reward = 52.14
2022-01-26 14:16:57.861 | DEBUG    | __main__:trials:24 - Trial = 6888/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.863 | DEBUG    | __main__:trials:29 - Trial = 6888/30000 | Total reward = 38.46
2022-01-26 14:16:57.866 | DEBUG    | __main__:trials:24 - Trial = 6889/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.867 | DEBUG    | __main__:trials:29 - Trial = 6889/30000 | Total reward = 45.69
2022-01-26 14:16:57.870 | DEBUG    | __main__:trials:24 - Trial = 6890/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.872 | DEBUG    | __main__:trials:29 - Trial = 6890/30000 | Total reward = 40.81
2022-01-26 14:16:57.875 | DEBUG    | __main__:trials:24 - Trial = 6891/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.877 | DEBUG    | __main__:trials:29 - Trial = 6891/30000 | Total reward = 43.65
2022-01-26 14:16:57.880 | DEBUG    | __main__:trials:26 - Trial = 6892/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.882 | DEBUG    | __main__:trials:29 - Trial = 6892/30000 | Total reward = 31.40
2022-01-26 14:16:57.885 | DEBUG    | __main__:trials:24 - Trial = 6893/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.887 | DEBUG    | __main__:trials:29 - Trial = 6893/30000 | Total reward = 42.54
2022-01-26 14:16:57.891 | DEBUG    | __main__:trials:24 - Trial = 6894/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.892 | DEBUG    | __main__:trials:29 - Trial = 6894/30000 | Total reward = 44.86
2022-01-26 14:16:57.896 | DEBUG    | __main__:trials:24 - Trial = 6895/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.898 | DEBUG    | __main__:trials:29 - Trial = 6895/30000 | Total reward = 50.54
2022-01-26 14:16:57.901 | DEBUG    | __main__:trials:24 - Trial = 6896/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.903 | DEBUG    | __main__:trials:29 - Trial = 6896/30000 | Total reward = 43.18
2022-01-26 14:16:57.907 | DEBUG    | __main__:trials:24 - Trial = 6897/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.908 | DEBUG    | __main__:trials:29 - Trial = 6897/30000 | Total reward = 45.48
2022-01-26 14:16:57.912 | DEBUG    | __main__:trials:24 - Trial = 6898/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.913 | DEBUG    | __main__:trials:29 - Trial = 6898/30000 | Total reward = 48.29
2022-01-26 14:16:57.917 | DEBUG    | __main__:trials:24 - Trial = 6899/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.918 | DEBUG    | __main__:trials:29 - Trial = 6899/30000 | Total reward = 45.29
2022-01-26 14:16:57.922 | DEBUG    | __main__:trials:24 - Trial = 6900/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.922 | DEBUG    | __main__:trials:29 - Trial = 6900/30000 | Total reward = 40.27
2022-01-26 14:16:57.926 | DEBUG    | __main__:trials:24 - Trial = 6901/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.928 | DEBUG    | __main__:trials:29 - Trial = 6901/30000 | Total reward = 39.74
2022-01-26 14:16:57.931 | DEBUG    | __main__:trials:24 - Trial = 6902/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.933 | DEBUG    | __main__:trials:29 - Trial = 6902/30000 | Total reward = 42.09
2022-01-26 14:16:57.936 | DEBUG    | __main__:trials:24 - Trial = 6903/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.937 | DEBUG    | __main__:trials:29 - Trial = 6903/30000 | Total reward = 43.19
2022-01-26 14:16:57.941 | DEBUG    | __main__:trials:24 - Trial = 6904/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.942 | DEBUG    | __main__:trials:29 - Trial = 6904/30000 | Total reward = 41.75
2022-01-26 14:16:57.945 | DEBUG    | __main__:trials:24 - Trial = 6905/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.946 | DEBUG    | __main__:trials:29 - Trial = 6905/30000 | Total reward = 45.07
2022-01-26 14:16:57.950 | DEBUG    | __main__:trials:24 - Trial = 6906/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.951 | DEBUG    | __main__:trials:29 - Trial = 6906/30000 | Total reward = 43.00
2022-01-26 14:16:57.954 | DEBUG    | __main__:trials:24 - Trial = 6907/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.956 | DEBUG    | __main__:trials:29 - Trial = 6907/30000 | Total reward = 41.27
2022-01-26 14:16:57.959 | DEBUG    | __main__:trials:24 - Trial = 6908/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.961 | DEBUG    | __main__:trials:29 - Trial = 6908/30000 | Total reward = 35.91
2022-01-26 14:16:57.964 | DEBUG    | __main__:trials:24 - Trial = 6909/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.966 | DEBUG    | __main__:trials:29 - Trial = 6909/30000 | Total reward = 40.31
2022-01-26 14:16:57.970 | DEBUG    | __main__:trials:24 - Trial = 6910/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.972 | DEBUG    | __main__:trials:29 - Trial = 6910/30000 | Total reward = 29.57
2022-01-26 14:16:57.975 | DEBUG    | __main__:trials:24 - Trial = 6911/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.977 | DEBUG    | __main__:trials:29 - Trial = 6911/30000 | Total reward = 38.46
2022-01-26 14:16:57.981 | DEBUG    | __main__:trials:24 - Trial = 6912/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.982 | DEBUG    | __main__:trials:29 - Trial = 6912/30000 | Total reward = 42.22
2022-01-26 14:16:57.985 | DEBUG    | __main__:trials:24 - Trial = 6913/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.986 | DEBUG    | __main__:trials:29 - Trial = 6913/30000 | Total reward = 44.88
2022-01-26 14:16:57.988 | DEBUG    | __main__:trials:26 - Trial = 6914/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:57.990 | DEBUG    | __main__:trials:29 - Trial = 6914/30000 | Total reward = 20.38
2022-01-26 14:16:57.995 | DEBUG    | __main__:trials:24 - Trial = 6915/30000 | Max number of steps (20) reached
2022-01-26 14:16:57.995 | DEBUG    | __main__:trials:29 - Trial = 6915/30000 | Total reward = 39.58
2022-01-26 14:16:58.000 | DEBUG    | __main__:trials:24 - Trial = 6916/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.001 | DEBUG    | __main__:trials:29 - Trial = 6916/30000 | Total reward = 50.36
2022-01-26 14:16:58.004 | DEBUG    | __main__:trials:26 - Trial = 6917/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.006 | DEBUG    | __main__:trials:29 - Trial = 6917/30000 | Total reward = 15.91
2022-01-26 14:16:58.009 | DEBUG    | __main__:trials:24 - Trial = 6918/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.012 | DEBUG    | __main__:trials:29 - Trial = 6918/30000 | Total reward = 44.17
2022-01-26 14:16:58.015 | DEBUG    | __main__:trials:24 - Trial = 6919/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.017 | DEBUG    | __main__:trials:29 - Trial = 6919/30000 | Total reward = 37.20
2022-01-26 14:16:58.020 | DEBUG    | __main__:trials:24 - Trial = 6920/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.021 | DEBUG    | __main__:trials:29 - Trial = 6920/30000 | Total reward = 48.20
2022-01-26 14:16:58.025 | DEBUG    | __main__:trials:24 - Trial = 6921/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.027 | DEBUG    | __main__:trials:29 - Trial = 6921/30000 | Total reward = 44.19
2022-01-26 14:16:58.030 | DEBUG    | __main__:trials:24 - Trial = 6922/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.032 | DEBUG    | __main__:trials:29 - Trial = 6922/30000 | Total reward = 44.99
2022-01-26 14:16:58.035 | DEBUG    | __main__:trials:24 - Trial = 6923/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.037 | DEBUG    | __main__:trials:29 - Trial = 6923/30000 | Total reward = 52.91
2022-01-26 14:16:58.040 | DEBUG    | __main__:trials:24 - Trial = 6924/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.042 | DEBUG    | __main__:trials:29 - Trial = 6924/30000 | Total reward = 36.37
2022-01-26 14:16:58.046 | DEBUG    | __main__:trials:24 - Trial = 6925/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.047 | DEBUG    | __main__:trials:29 - Trial = 6925/30000 | Total reward = 44.36
2022-01-26 14:16:58.051 | DEBUG    | __main__:trials:24 - Trial = 6926/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.052 | DEBUG    | __main__:trials:29 - Trial = 6926/30000 | Total reward = 36.71
2022-01-26 14:16:58.056 | DEBUG    | __main__:trials:24 - Trial = 6927/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.058 | DEBUG    | __main__:trials:29 - Trial = 6927/30000 | Total reward = 46.83
2022-01-26 14:16:58.061 | DEBUG    | __main__:trials:24 - Trial = 6928/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.063 | DEBUG    | __main__:trials:29 - Trial = 6928/30000 | Total reward = 32.55
2022-01-26 14:16:58.067 | DEBUG    | __main__:trials:24 - Trial = 6929/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.068 | DEBUG    | __main__:trials:29 - Trial = 6929/30000 | Total reward = 47.10
2022-01-26 14:16:58.071 | DEBUG    | __main__:trials:24 - Trial = 6930/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.073 | DEBUG    | __main__:trials:29 - Trial = 6930/30000 | Total reward = 39.10
2022-01-26 14:16:58.077 | DEBUG    | __main__:trials:24 - Trial = 6931/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.078 | DEBUG    | __main__:trials:29 - Trial = 6931/30000 | Total reward = 34.89
2022-01-26 14:16:58.082 | DEBUG    | __main__:trials:24 - Trial = 6932/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.083 | DEBUG    | __main__:trials:29 - Trial = 6932/30000 | Total reward = 42.01
2022-01-26 14:16:58.086 | DEBUG    | __main__:trials:24 - Trial = 6933/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.087 | DEBUG    | __main__:trials:29 - Trial = 6933/30000 | Total reward = 39.45
2022-01-26 14:16:58.090 | DEBUG    | __main__:trials:24 - Trial = 6934/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.091 | DEBUG    | __main__:trials:29 - Trial = 6934/30000 | Total reward = 45.10
2022-01-26 14:16:58.094 | DEBUG    | __main__:trials:24 - Trial = 6935/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.096 | DEBUG    | __main__:trials:29 - Trial = 6935/30000 | Total reward = 37.03
2022-01-26 14:16:58.100 | DEBUG    | __main__:trials:24 - Trial = 6936/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.101 | DEBUG    | __main__:trials:29 - Trial = 6936/30000 | Total reward = 43.77
2022-01-26 14:16:58.105 | DEBUG    | __main__:trials:24 - Trial = 6937/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.106 | DEBUG    | __main__:trials:29 - Trial = 6937/30000 | Total reward = 37.20
2022-01-26 14:16:58.110 | DEBUG    | __main__:trials:24 - Trial = 6938/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.112 | DEBUG    | __main__:trials:29 - Trial = 6938/30000 | Total reward = 58.89
2022-01-26 14:16:58.115 | DEBUG    | __main__:trials:24 - Trial = 6939/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.117 | DEBUG    | __main__:trials:29 - Trial = 6939/30000 | Total reward = 48.10
2022-01-26 14:16:58.120 | DEBUG    | __main__:trials:24 - Trial = 6940/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.122 | DEBUG    | __main__:trials:29 - Trial = 6940/30000 | Total reward = 44.03
2022-01-26 14:16:58.126 | DEBUG    | __main__:trials:24 - Trial = 6941/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.126 | DEBUG    | __main__:trials:29 - Trial = 6941/30000 | Total reward = 36.61
2022-01-26 14:16:58.130 | DEBUG    | __main__:trials:24 - Trial = 6942/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.132 | DEBUG    | __main__:trials:29 - Trial = 6942/30000 | Total reward = 54.91
2022-01-26 14:16:58.136 | DEBUG    | __main__:trials:24 - Trial = 6943/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.137 | DEBUG    | __main__:trials:29 - Trial = 6943/30000 | Total reward = 44.46
2022-01-26 14:16:58.140 | DEBUG    | __main__:trials:24 - Trial = 6944/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.142 | DEBUG    | __main__:trials:29 - Trial = 6944/30000 | Total reward = 36.18
2022-01-26 14:16:58.146 | DEBUG    | __main__:trials:24 - Trial = 6945/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.147 | DEBUG    | __main__:trials:29 - Trial = 6945/30000 | Total reward = 33.46
2022-01-26 14:16:58.151 | DEBUG    | __main__:trials:24 - Trial = 6946/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.153 | DEBUG    | __main__:trials:29 - Trial = 6946/30000 | Total reward = 35.24
2022-01-26 14:16:58.156 | DEBUG    | __main__:trials:24 - Trial = 6947/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.157 | DEBUG    | __main__:trials:29 - Trial = 6947/30000 | Total reward = 64.02
2022-01-26 14:16:58.161 | DEBUG    | __main__:trials:24 - Trial = 6948/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.163 | DEBUG    | __main__:trials:29 - Trial = 6948/30000 | Total reward = 41.24
2022-01-26 14:16:58.166 | DEBUG    | __main__:trials:24 - Trial = 6949/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.168 | DEBUG    | __main__:trials:29 - Trial = 6949/30000 | Total reward = 45.68
2022-01-26 14:16:58.170 | DEBUG    | __main__:trials:24 - Trial = 6950/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.172 | DEBUG    | __main__:trials:29 - Trial = 6950/30000 | Total reward = 50.63
2022-01-26 14:16:58.176 | DEBUG    | __main__:trials:24 - Trial = 6951/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.178 | DEBUG    | __main__:trials:29 - Trial = 6951/30000 | Total reward = 47.31
2022-01-26 14:16:58.181 | DEBUG    | __main__:trials:24 - Trial = 6952/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.183 | DEBUG    | __main__:trials:29 - Trial = 6952/30000 | Total reward = 41.87
2022-01-26 14:16:58.187 | DEBUG    | __main__:trials:24 - Trial = 6953/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.188 | DEBUG    | __main__:trials:29 - Trial = 6953/30000 | Total reward = 43.95
2022-01-26 14:16:58.192 | DEBUG    | __main__:trials:24 - Trial = 6954/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.194 | DEBUG    | __main__:trials:29 - Trial = 6954/30000 | Total reward = 58.20
2022-01-26 14:16:58.198 | DEBUG    | __main__:trials:24 - Trial = 6955/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.198 | DEBUG    | __main__:trials:29 - Trial = 6955/30000 | Total reward = 46.31
2022-01-26 14:16:58.202 | DEBUG    | __main__:trials:24 - Trial = 6956/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.204 | DEBUG    | __main__:trials:29 - Trial = 6956/30000 | Total reward = 57.29
2022-01-26 14:16:58.208 | DEBUG    | __main__:trials:24 - Trial = 6957/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.209 | DEBUG    | __main__:trials:29 - Trial = 6957/30000 | Total reward = 41.72
2022-01-26 14:16:58.213 | DEBUG    | __main__:trials:24 - Trial = 6958/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.214 | DEBUG    | __main__:trials:29 - Trial = 6958/30000 | Total reward = 47.38
2022-01-26 14:16:58.218 | DEBUG    | __main__:trials:24 - Trial = 6959/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.219 | DEBUG    | __main__:trials:29 - Trial = 6959/30000 | Total reward = 32.77
2022-01-26 14:16:58.222 | DEBUG    | __main__:trials:26 - Trial = 6960/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.223 | DEBUG    | __main__:trials:29 - Trial = 6960/30000 | Total reward = 18.35
2022-01-26 14:16:58.227 | DEBUG    | __main__:trials:24 - Trial = 6961/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.229 | DEBUG    | __main__:trials:29 - Trial = 6961/30000 | Total reward = 33.85
2022-01-26 14:16:58.232 | DEBUG    | __main__:trials:24 - Trial = 6962/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.233 | DEBUG    | __main__:trials:29 - Trial = 6962/30000 | Total reward = 37.32
2022-01-26 14:16:58.237 | DEBUG    | __main__:trials:24 - Trial = 6963/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.238 | DEBUG    | __main__:trials:29 - Trial = 6963/30000 | Total reward = 36.18
2022-01-26 14:16:58.242 | DEBUG    | __main__:trials:24 - Trial = 6964/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.244 | DEBUG    | __main__:trials:29 - Trial = 6964/30000 | Total reward = 39.53
2022-01-26 14:16:58.248 | DEBUG    | __main__:trials:24 - Trial = 6965/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.248 | DEBUG    | __main__:trials:29 - Trial = 6965/30000 | Total reward = 45.12
2022-01-26 14:16:58.252 | DEBUG    | __main__:trials:26 - Trial = 6966/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.252 | DEBUG    | __main__:trials:29 - Trial = 6966/30000 | Total reward = 23.58
2022-01-26 14:16:58.256 | DEBUG    | __main__:trials:24 - Trial = 6967/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.258 | DEBUG    | __main__:trials:29 - Trial = 6967/30000 | Total reward = 44.27
2022-01-26 14:16:58.261 | DEBUG    | __main__:trials:24 - Trial = 6968/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.263 | DEBUG    | __main__:trials:29 - Trial = 6968/30000 | Total reward = 33.48
2022-01-26 14:16:58.266 | DEBUG    | __main__:trials:24 - Trial = 6969/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.268 | DEBUG    | __main__:trials:29 - Trial = 6969/30000 | Total reward = 53.71
2022-01-26 14:16:58.271 | DEBUG    | __main__:trials:24 - Trial = 6970/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.272 | DEBUG    | __main__:trials:29 - Trial = 6970/30000 | Total reward = 56.59
2022-01-26 14:16:58.275 | DEBUG    | __main__:trials:24 - Trial = 6971/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.276 | DEBUG    | __main__:trials:29 - Trial = 6971/30000 | Total reward = 35.58
2022-01-26 14:16:58.280 | DEBUG    | __main__:trials:24 - Trial = 6972/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.282 | DEBUG    | __main__:trials:29 - Trial = 6972/30000 | Total reward = 34.64
2022-01-26 14:16:58.284 | DEBUG    | __main__:trials:24 - Trial = 6973/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.285 | DEBUG    | __main__:trials:29 - Trial = 6973/30000 | Total reward = 45.92
2022-01-26 14:16:58.289 | DEBUG    | __main__:trials:24 - Trial = 6974/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.289 | DEBUG    | __main__:trials:29 - Trial = 6974/30000 | Total reward = 49.82
2022-01-26 14:16:58.293 | DEBUG    | __main__:trials:24 - Trial = 6975/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.294 | DEBUG    | __main__:trials:29 - Trial = 6975/30000 | Total reward = 58.94
2022-01-26 14:16:58.297 | DEBUG    | __main__:trials:24 - Trial = 6976/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.298 | DEBUG    | __main__:trials:29 - Trial = 6976/30000 | Total reward = 43.69
2022-01-26 14:16:58.301 | DEBUG    | __main__:trials:26 - Trial = 6977/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.303 | DEBUG    | __main__:trials:29 - Trial = 6977/30000 | Total reward = 23.59
2022-01-26 14:16:58.305 | DEBUG    | __main__:trials:24 - Trial = 6978/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.306 | DEBUG    | __main__:trials:29 - Trial = 6978/30000 | Total reward = 27.72
2022-01-26 14:16:58.310 | DEBUG    | __main__:trials:24 - Trial = 6979/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.310 | DEBUG    | __main__:trials:29 - Trial = 6979/30000 | Total reward = 34.00
2022-01-26 14:16:58.314 | DEBUG    | __main__:trials:24 - Trial = 6980/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.315 | DEBUG    | __main__:trials:29 - Trial = 6980/30000 | Total reward = 54.26
2022-01-26 14:16:58.319 | DEBUG    | __main__:trials:24 - Trial = 6981/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.320 | DEBUG    | __main__:trials:29 - Trial = 6981/30000 | Total reward = 34.70
2022-01-26 14:16:58.323 | DEBUG    | __main__:trials:24 - Trial = 6982/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.325 | DEBUG    | __main__:trials:29 - Trial = 6982/30000 | Total reward = 59.99
2022-01-26 14:16:58.328 | DEBUG    | __main__:trials:24 - Trial = 6983/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.329 | DEBUG    | __main__:trials:29 - Trial = 6983/30000 | Total reward = 53.08
2022-01-26 14:16:58.332 | DEBUG    | __main__:trials:24 - Trial = 6984/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.334 | DEBUG    | __main__:trials:29 - Trial = 6984/30000 | Total reward = 44.55
2022-01-26 14:16:58.337 | DEBUG    | __main__:trials:24 - Trial = 6985/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.338 | DEBUG    | __main__:trials:29 - Trial = 6985/30000 | Total reward = 46.15
2022-01-26 14:16:58.342 | DEBUG    | __main__:trials:24 - Trial = 6986/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.343 | DEBUG    | __main__:trials:29 - Trial = 6986/30000 | Total reward = 40.20
2022-01-26 14:16:58.346 | DEBUG    | __main__:trials:24 - Trial = 6987/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.348 | DEBUG    | __main__:trials:29 - Trial = 6987/30000 | Total reward = 41.55
2022-01-26 14:16:58.352 | DEBUG    | __main__:trials:24 - Trial = 6988/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.352 | DEBUG    | __main__:trials:29 - Trial = 6988/30000 | Total reward = 37.72
2022-01-26 14:16:58.356 | DEBUG    | __main__:trials:24 - Trial = 6989/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.357 | DEBUG    | __main__:trials:29 - Trial = 6989/30000 | Total reward = 37.78
2022-01-26 14:16:58.360 | DEBUG    | __main__:trials:24 - Trial = 6990/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.361 | DEBUG    | __main__:trials:29 - Trial = 6990/30000 | Total reward = 37.08
2022-01-26 14:16:58.364 | DEBUG    | __main__:trials:24 - Trial = 6991/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.365 | DEBUG    | __main__:trials:29 - Trial = 6991/30000 | Total reward = 31.60
2022-01-26 14:16:58.369 | DEBUG    | __main__:trials:24 - Trial = 6992/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.370 | DEBUG    | __main__:trials:29 - Trial = 6992/30000 | Total reward = 51.58
2022-01-26 14:16:58.373 | DEBUG    | __main__:trials:24 - Trial = 6993/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.374 | DEBUG    | __main__:trials:29 - Trial = 6993/30000 | Total reward = 47.01
2022-01-26 14:16:58.378 | DEBUG    | __main__:trials:24 - Trial = 6994/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.378 | DEBUG    | __main__:trials:29 - Trial = 6994/30000 | Total reward = 41.57
2022-01-26 14:16:58.381 | DEBUG    | __main__:trials:26 - Trial = 6995/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.382 | DEBUG    | __main__:trials:29 - Trial = 6995/30000 | Total reward = 23.91
2022-01-26 14:16:58.385 | DEBUG    | __main__:trials:24 - Trial = 6996/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.386 | DEBUG    | __main__:trials:29 - Trial = 6996/30000 | Total reward = 32.61
2022-01-26 14:16:58.390 | DEBUG    | __main__:trials:24 - Trial = 6997/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.392 | DEBUG    | __main__:trials:29 - Trial = 6997/30000 | Total reward = 42.09
2022-01-26 14:16:58.395 | DEBUG    | __main__:trials:24 - Trial = 6998/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.396 | DEBUG    | __main__:trials:29 - Trial = 6998/30000 | Total reward = 47.12
2022-01-26 14:16:58.399 | DEBUG    | __main__:trials:24 - Trial = 6999/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.401 | DEBUG    | __main__:trials:29 - Trial = 6999/30000 | Total reward = 42.02
2022-01-26 14:16:58.404 | DEBUG    | __main__:trials:24 - Trial = 7000/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.405 | DEBUG    | __main__:trials:29 - Trial = 7000/30000 | Total reward = 37.34
2022-01-26 14:16:58.408 | DEBUG    | __main__:trials:24 - Trial = 7001/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.410 | DEBUG    | __main__:trials:29 - Trial = 7001/30000 | Total reward = 57.48
2022-01-26 14:16:58.413 | DEBUG    | __main__:trials:24 - Trial = 7002/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.414 | DEBUG    | __main__:trials:29 - Trial = 7002/30000 | Total reward = 49.34
2022-01-26 14:16:58.417 | DEBUG    | __main__:trials:24 - Trial = 7003/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.418 | DEBUG    | __main__:trials:29 - Trial = 7003/30000 | Total reward = 38.35
2022-01-26 14:16:58.421 | DEBUG    | __main__:trials:24 - Trial = 7004/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.422 | DEBUG    | __main__:trials:29 - Trial = 7004/30000 | Total reward = 45.11
2022-01-26 14:16:58.425 | DEBUG    | __main__:trials:24 - Trial = 7005/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.426 | DEBUG    | __main__:trials:29 - Trial = 7005/30000 | Total reward = 47.62
2022-01-26 14:16:58.429 | DEBUG    | __main__:trials:24 - Trial = 7006/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.431 | DEBUG    | __main__:trials:29 - Trial = 7006/30000 | Total reward = 42.55
2022-01-26 14:16:58.435 | DEBUG    | __main__:trials:24 - Trial = 7007/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.436 | DEBUG    | __main__:trials:29 - Trial = 7007/30000 | Total reward = 36.04
2022-01-26 14:16:58.440 | DEBUG    | __main__:trials:24 - Trial = 7008/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.441 | DEBUG    | __main__:trials:29 - Trial = 7008/30000 | Total reward = 41.17
2022-01-26 14:16:58.444 | DEBUG    | __main__:trials:24 - Trial = 7009/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.446 | DEBUG    | __main__:trials:29 - Trial = 7009/30000 | Total reward = 48.57
2022-01-26 14:16:58.450 | DEBUG    | __main__:trials:24 - Trial = 7010/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.452 | DEBUG    | __main__:trials:29 - Trial = 7010/30000 | Total reward = 42.55
2022-01-26 14:16:58.455 | DEBUG    | __main__:trials:24 - Trial = 7011/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.457 | DEBUG    | __main__:trials:29 - Trial = 7011/30000 | Total reward = 40.44
2022-01-26 14:16:58.460 | DEBUG    | __main__:trials:24 - Trial = 7012/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.462 | DEBUG    | __main__:trials:29 - Trial = 7012/30000 | Total reward = 38.31
2022-01-26 14:16:58.466 | DEBUG    | __main__:trials:24 - Trial = 7013/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.467 | DEBUG    | __main__:trials:29 - Trial = 7013/30000 | Total reward = 32.75
2022-01-26 14:16:58.470 | DEBUG    | __main__:trials:26 - Trial = 7014/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.471 | DEBUG    | __main__:trials:29 - Trial = 7014/30000 | Total reward = 13.44
2022-01-26 14:16:58.475 | DEBUG    | __main__:trials:24 - Trial = 7015/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.477 | DEBUG    | __main__:trials:29 - Trial = 7015/30000 | Total reward = 44.23
2022-01-26 14:16:58.480 | DEBUG    | __main__:trials:24 - Trial = 7016/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.482 | DEBUG    | __main__:trials:29 - Trial = 7016/30000 | Total reward = 33.94
2022-01-26 14:16:58.485 | DEBUG    | __main__:trials:24 - Trial = 7017/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.487 | DEBUG    | __main__:trials:29 - Trial = 7017/30000 | Total reward = 28.90
2022-01-26 14:16:58.491 | DEBUG    | __main__:trials:24 - Trial = 7018/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.492 | DEBUG    | __main__:trials:29 - Trial = 7018/30000 | Total reward = 40.67
2022-01-26 14:16:58.496 | DEBUG    | __main__:trials:24 - Trial = 7019/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.498 | DEBUG    | __main__:trials:29 - Trial = 7019/30000 | Total reward = 37.45
2022-01-26 14:16:58.502 | DEBUG    | __main__:trials:24 - Trial = 7020/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.503 | DEBUG    | __main__:trials:29 - Trial = 7020/30000 | Total reward = 39.96
2022-01-26 14:16:58.507 | DEBUG    | __main__:trials:24 - Trial = 7021/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.509 | DEBUG    | __main__:trials:29 - Trial = 7021/30000 | Total reward = 43.96
2022-01-26 14:16:58.512 | DEBUG    | __main__:trials:24 - Trial = 7022/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.514 | DEBUG    | __main__:trials:29 - Trial = 7022/30000 | Total reward = 37.90
2022-01-26 14:16:58.517 | DEBUG    | __main__:trials:24 - Trial = 7023/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.519 | DEBUG    | __main__:trials:29 - Trial = 7023/30000 | Total reward = 36.57
2022-01-26 14:16:58.522 | DEBUG    | __main__:trials:24 - Trial = 7024/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.524 | DEBUG    | __main__:trials:29 - Trial = 7024/30000 | Total reward = 43.42
2022-01-26 14:16:58.527 | DEBUG    | __main__:trials:24 - Trial = 7025/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.529 | DEBUG    | __main__:trials:29 - Trial = 7025/30000 | Total reward = 31.59
2022-01-26 14:16:58.532 | DEBUG    | __main__:trials:24 - Trial = 7026/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.534 | DEBUG    | __main__:trials:29 - Trial = 7026/30000 | Total reward = 44.77
2022-01-26 14:16:58.537 | DEBUG    | __main__:trials:24 - Trial = 7027/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.538 | DEBUG    | __main__:trials:29 - Trial = 7027/30000 | Total reward = 32.27
2022-01-26 14:16:58.542 | DEBUG    | __main__:trials:24 - Trial = 7028/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.543 | DEBUG    | __main__:trials:29 - Trial = 7028/30000 | Total reward = 43.42
2022-01-26 14:16:58.547 | DEBUG    | __main__:trials:24 - Trial = 7029/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.549 | DEBUG    | __main__:trials:29 - Trial = 7029/30000 | Total reward = 51.74
2022-01-26 14:16:58.552 | DEBUG    | __main__:trials:24 - Trial = 7030/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.554 | DEBUG    | __main__:trials:29 - Trial = 7030/30000 | Total reward = 47.99
2022-01-26 14:16:58.557 | DEBUG    | __main__:trials:24 - Trial = 7031/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.559 | DEBUG    | __main__:trials:29 - Trial = 7031/30000 | Total reward = 36.70
2022-01-26 14:16:58.563 | DEBUG    | __main__:trials:24 - Trial = 7032/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.564 | DEBUG    | __main__:trials:29 - Trial = 7032/30000 | Total reward = 46.86
2022-01-26 14:16:58.568 | DEBUG    | __main__:trials:24 - Trial = 7033/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.570 | DEBUG    | __main__:trials:29 - Trial = 7033/30000 | Total reward = 38.11
2022-01-26 14:16:58.573 | DEBUG    | __main__:trials:24 - Trial = 7034/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.575 | DEBUG    | __main__:trials:29 - Trial = 7034/30000 | Total reward = 42.14
2022-01-26 14:16:58.579 | DEBUG    | __main__:trials:24 - Trial = 7035/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.579 | DEBUG    | __main__:trials:29 - Trial = 7035/30000 | Total reward = 44.31
2022-01-26 14:16:58.584 | DEBUG    | __main__:trials:24 - Trial = 7036/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.585 | DEBUG    | __main__:trials:29 - Trial = 7036/30000 | Total reward = 33.79
2022-01-26 14:16:58.588 | DEBUG    | __main__:trials:24 - Trial = 7037/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.590 | DEBUG    | __main__:trials:29 - Trial = 7037/30000 | Total reward = 45.29
2022-01-26 14:16:58.594 | DEBUG    | __main__:trials:24 - Trial = 7038/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.595 | DEBUG    | __main__:trials:29 - Trial = 7038/30000 | Total reward = 42.86
2022-01-26 14:16:58.598 | DEBUG    | __main__:trials:24 - Trial = 7039/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.600 | DEBUG    | __main__:trials:29 - Trial = 7039/30000 | Total reward = 45.82
2022-01-26 14:16:58.604 | DEBUG    | __main__:trials:24 - Trial = 7040/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.605 | DEBUG    | __main__:trials:29 - Trial = 7040/30000 | Total reward = 36.26
2022-01-26 14:16:58.608 | DEBUG    | __main__:trials:24 - Trial = 7041/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.610 | DEBUG    | __main__:trials:29 - Trial = 7041/30000 | Total reward = 48.43
2022-01-26 14:16:58.614 | DEBUG    | __main__:trials:24 - Trial = 7042/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.615 | DEBUG    | __main__:trials:29 - Trial = 7042/30000 | Total reward = 56.93
2022-01-26 14:16:58.619 | DEBUG    | __main__:trials:24 - Trial = 7043/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.621 | DEBUG    | __main__:trials:29 - Trial = 7043/30000 | Total reward = 47.29
2022-01-26 14:16:58.624 | DEBUG    | __main__:trials:24 - Trial = 7044/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.626 | DEBUG    | __main__:trials:29 - Trial = 7044/30000 | Total reward = 38.56
2022-01-26 14:16:58.630 | DEBUG    | __main__:trials:24 - Trial = 7045/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.631 | DEBUG    | __main__:trials:29 - Trial = 7045/30000 | Total reward = 33.47
2022-01-26 14:16:58.634 | DEBUG    | __main__:trials:24 - Trial = 7046/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.636 | DEBUG    | __main__:trials:29 - Trial = 7046/30000 | Total reward = 38.12
2022-01-26 14:16:58.640 | DEBUG    | __main__:trials:24 - Trial = 7047/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.641 | DEBUG    | __main__:trials:29 - Trial = 7047/30000 | Total reward = 64.78
2022-01-26 14:16:58.645 | DEBUG    | __main__:trials:24 - Trial = 7048/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.646 | DEBUG    | __main__:trials:29 - Trial = 7048/30000 | Total reward = 33.85
2022-01-26 14:16:58.650 | DEBUG    | __main__:trials:24 - Trial = 7049/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.651 | DEBUG    | __main__:trials:29 - Trial = 7049/30000 | Total reward = 58.54
2022-01-26 14:16:58.655 | DEBUG    | __main__:trials:24 - Trial = 7050/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.657 | DEBUG    | __main__:trials:29 - Trial = 7050/30000 | Total reward = 53.84
2022-01-26 14:16:58.660 | DEBUG    | __main__:trials:24 - Trial = 7051/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.662 | DEBUG    | __main__:trials:29 - Trial = 7051/30000 | Total reward = 42.00
2022-01-26 14:16:58.665 | DEBUG    | __main__:trials:24 - Trial = 7052/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.667 | DEBUG    | __main__:trials:29 - Trial = 7052/30000 | Total reward = 36.57
2022-01-26 14:16:58.670 | DEBUG    | __main__:trials:24 - Trial = 7053/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.672 | DEBUG    | __main__:trials:29 - Trial = 7053/30000 | Total reward = 50.44
2022-01-26 14:16:58.675 | DEBUG    | __main__:trials:24 - Trial = 7054/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.677 | DEBUG    | __main__:trials:29 - Trial = 7054/30000 | Total reward = 33.06
2022-01-26 14:16:58.680 | DEBUG    | __main__:trials:24 - Trial = 7055/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.682 | DEBUG    | __main__:trials:29 - Trial = 7055/30000 | Total reward = 40.42
2022-01-26 14:16:58.686 | DEBUG    | __main__:trials:24 - Trial = 7056/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.688 | DEBUG    | __main__:trials:29 - Trial = 7056/30000 | Total reward = 34.84
2022-01-26 14:16:58.691 | DEBUG    | __main__:trials:24 - Trial = 7057/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.693 | DEBUG    | __main__:trials:29 - Trial = 7057/30000 | Total reward = 26.44
2022-01-26 14:16:58.697 | DEBUG    | __main__:trials:24 - Trial = 7058/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.697 | DEBUG    | __main__:trials:29 - Trial = 7058/30000 | Total reward = 33.88
2022-01-26 14:16:58.701 | DEBUG    | __main__:trials:24 - Trial = 7059/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.703 | DEBUG    | __main__:trials:29 - Trial = 7059/30000 | Total reward = 33.68
2022-01-26 14:16:58.706 | DEBUG    | __main__:trials:24 - Trial = 7060/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.707 | DEBUG    | __main__:trials:29 - Trial = 7060/30000 | Total reward = 36.02
2022-01-26 14:16:58.711 | DEBUG    | __main__:trials:24 - Trial = 7061/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.713 | DEBUG    | __main__:trials:29 - Trial = 7061/30000 | Total reward = 36.06
2022-01-26 14:16:58.716 | DEBUG    | __main__:trials:24 - Trial = 7062/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.718 | DEBUG    | __main__:trials:29 - Trial = 7062/30000 | Total reward = 49.78
2022-01-26 14:16:58.722 | DEBUG    | __main__:trials:24 - Trial = 7063/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.723 | DEBUG    | __main__:trials:29 - Trial = 7063/30000 | Total reward = 48.41
2022-01-26 14:16:58.727 | DEBUG    | __main__:trials:24 - Trial = 7064/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.729 | DEBUG    | __main__:trials:29 - Trial = 7064/30000 | Total reward = 49.03
2022-01-26 14:16:58.732 | DEBUG    | __main__:trials:24 - Trial = 7065/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.734 | DEBUG    | __main__:trials:29 - Trial = 7065/30000 | Total reward = 36.41
2022-01-26 14:16:58.738 | DEBUG    | __main__:trials:24 - Trial = 7066/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.739 | DEBUG    | __main__:trials:29 - Trial = 7066/30000 | Total reward = 62.99
2022-01-26 14:16:58.743 | DEBUG    | __main__:trials:24 - Trial = 7067/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.745 | DEBUG    | __main__:trials:29 - Trial = 7067/30000 | Total reward = 55.52
2022-01-26 14:16:58.748 | DEBUG    | __main__:trials:24 - Trial = 7068/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.750 | DEBUG    | __main__:trials:29 - Trial = 7068/30000 | Total reward = 44.56
2022-01-26 14:16:58.754 | DEBUG    | __main__:trials:24 - Trial = 7069/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.755 | DEBUG    | __main__:trials:29 - Trial = 7069/30000 | Total reward = 33.23
2022-01-26 14:16:58.759 | DEBUG    | __main__:trials:24 - Trial = 7070/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.760 | DEBUG    | __main__:trials:29 - Trial = 7070/30000 | Total reward = 36.37
2022-01-26 14:16:58.763 | DEBUG    | __main__:trials:24 - Trial = 7071/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.765 | DEBUG    | __main__:trials:29 - Trial = 7071/30000 | Total reward = 36.37
2022-01-26 14:16:58.768 | DEBUG    | __main__:trials:24 - Trial = 7072/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.770 | DEBUG    | __main__:trials:29 - Trial = 7072/30000 | Total reward = 35.96
2022-01-26 14:16:58.773 | DEBUG    | __main__:trials:24 - Trial = 7073/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.774 | DEBUG    | __main__:trials:29 - Trial = 7073/30000 | Total reward = 35.65
2022-01-26 14:16:58.777 | DEBUG    | __main__:trials:24 - Trial = 7074/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.778 | DEBUG    | __main__:trials:29 - Trial = 7074/30000 | Total reward = 38.54
2022-01-26 14:16:58.781 | DEBUG    | __main__:trials:24 - Trial = 7075/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.782 | DEBUG    | __main__:trials:29 - Trial = 7075/30000 | Total reward = 41.85
2022-01-26 14:16:58.785 | DEBUG    | __main__:trials:24 - Trial = 7076/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.787 | DEBUG    | __main__:trials:29 - Trial = 7076/30000 | Total reward = 58.96
2022-01-26 14:16:58.790 | DEBUG    | __main__:trials:24 - Trial = 7077/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.792 | DEBUG    | __main__:trials:29 - Trial = 7077/30000 | Total reward = 43.49
2022-01-26 14:16:58.795 | DEBUG    | __main__:trials:24 - Trial = 7078/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.797 | DEBUG    | __main__:trials:29 - Trial = 7078/30000 | Total reward = 39.59
2022-01-26 14:16:58.800 | DEBUG    | __main__:trials:24 - Trial = 7079/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.802 | DEBUG    | __main__:trials:29 - Trial = 7079/30000 | Total reward = 50.33
2022-01-26 14:16:58.806 | DEBUG    | __main__:trials:24 - Trial = 7080/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.807 | DEBUG    | __main__:trials:29 - Trial = 7080/30000 | Total reward = 32.86
2022-01-26 14:16:58.810 | DEBUG    | __main__:trials:24 - Trial = 7081/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.812 | DEBUG    | __main__:trials:29 - Trial = 7081/30000 | Total reward = 37.56
2022-01-26 14:16:58.816 | DEBUG    | __main__:trials:24 - Trial = 7082/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.817 | DEBUG    | __main__:trials:29 - Trial = 7082/30000 | Total reward = 46.98
2022-01-26 14:16:58.821 | DEBUG    | __main__:trials:24 - Trial = 7083/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.823 | DEBUG    | __main__:trials:29 - Trial = 7083/30000 | Total reward = 58.30
2022-01-26 14:16:58.826 | DEBUG    | __main__:trials:24 - Trial = 7084/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.828 | DEBUG    | __main__:trials:29 - Trial = 7084/30000 | Total reward = 41.99
2022-01-26 14:16:58.832 | DEBUG    | __main__:trials:24 - Trial = 7085/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.833 | DEBUG    | __main__:trials:29 - Trial = 7085/30000 | Total reward = 41.27
2022-01-26 14:16:58.837 | DEBUG    | __main__:trials:24 - Trial = 7086/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.838 | DEBUG    | __main__:trials:29 - Trial = 7086/30000 | Total reward = 43.69
2022-01-26 14:16:58.841 | DEBUG    | __main__:trials:26 - Trial = 7087/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:58.842 | DEBUG    | __main__:trials:29 - Trial = 7087/30000 | Total reward = 16.31
2022-01-26 14:16:58.846 | DEBUG    | __main__:trials:24 - Trial = 7088/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.847 | DEBUG    | __main__:trials:29 - Trial = 7088/30000 | Total reward = 43.31
2022-01-26 14:16:58.851 | DEBUG    | __main__:trials:24 - Trial = 7089/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.853 | DEBUG    | __main__:trials:29 - Trial = 7089/30000 | Total reward = 41.99
2022-01-26 14:16:58.856 | DEBUG    | __main__:trials:24 - Trial = 7090/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.858 | DEBUG    | __main__:trials:29 - Trial = 7090/30000 | Total reward = 40.82
2022-01-26 14:16:58.861 | DEBUG    | __main__:trials:24 - Trial = 7091/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.863 | DEBUG    | __main__:trials:29 - Trial = 7091/30000 | Total reward = 44.35
2022-01-26 14:16:58.866 | DEBUG    | __main__:trials:24 - Trial = 7092/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.868 | DEBUG    | __main__:trials:29 - Trial = 7092/30000 | Total reward = 59.30
2022-01-26 14:16:58.872 | DEBUG    | __main__:trials:24 - Trial = 7093/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.872 | DEBUG    | __main__:trials:29 - Trial = 7093/30000 | Total reward = 39.14
2022-01-26 14:16:58.876 | DEBUG    | __main__:trials:24 - Trial = 7094/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.878 | DEBUG    | __main__:trials:29 - Trial = 7094/30000 | Total reward = 38.95
2022-01-26 14:16:58.881 | DEBUG    | __main__:trials:24 - Trial = 7095/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.883 | DEBUG    | __main__:trials:29 - Trial = 7095/30000 | Total reward = 44.61
2022-01-26 14:16:58.887 | DEBUG    | __main__:trials:24 - Trial = 7096/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.888 | DEBUG    | __main__:trials:29 - Trial = 7096/30000 | Total reward = 42.68
2022-01-26 14:16:58.892 | DEBUG    | __main__:trials:24 - Trial = 7097/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.893 | DEBUG    | __main__:trials:29 - Trial = 7097/30000 | Total reward = 43.08
2022-01-26 14:16:58.897 | DEBUG    | __main__:trials:24 - Trial = 7098/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.898 | DEBUG    | __main__:trials:29 - Trial = 7098/30000 | Total reward = 42.68
2022-01-26 14:16:58.901 | DEBUG    | __main__:trials:24 - Trial = 7099/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.902 | DEBUG    | __main__:trials:29 - Trial = 7099/30000 | Total reward = 41.01
2022-01-26 14:16:58.906 | DEBUG    | __main__:trials:24 - Trial = 7100/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.907 | DEBUG    | __main__:trials:29 - Trial = 7100/30000 | Total reward = 41.27
2022-01-26 14:16:58.910 | DEBUG    | __main__:trials:24 - Trial = 7101/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.912 | DEBUG    | __main__:trials:29 - Trial = 7101/30000 | Total reward = 39.64
2022-01-26 14:16:58.916 | DEBUG    | __main__:trials:24 - Trial = 7102/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.918 | DEBUG    | __main__:trials:29 - Trial = 7102/30000 | Total reward = 46.12
2022-01-26 14:16:58.921 | DEBUG    | __main__:trials:24 - Trial = 7103/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.923 | DEBUG    | __main__:trials:29 - Trial = 7103/30000 | Total reward = 40.83
2022-01-26 14:16:58.927 | DEBUG    | __main__:trials:24 - Trial = 7104/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.927 | DEBUG    | __main__:trials:29 - Trial = 7104/30000 | Total reward = 43.57
2022-01-26 14:16:58.931 | DEBUG    | __main__:trials:24 - Trial = 7105/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.933 | DEBUG    | __main__:trials:29 - Trial = 7105/30000 | Total reward = 42.72
2022-01-26 14:16:58.937 | DEBUG    | __main__:trials:24 - Trial = 7106/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.938 | DEBUG    | __main__:trials:29 - Trial = 7106/30000 | Total reward = 36.05
2022-01-26 14:16:58.941 | DEBUG    | __main__:trials:24 - Trial = 7107/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.942 | DEBUG    | __main__:trials:29 - Trial = 7107/30000 | Total reward = 58.30
2022-01-26 14:16:58.946 | DEBUG    | __main__:trials:24 - Trial = 7108/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.947 | DEBUG    | __main__:trials:29 - Trial = 7108/30000 | Total reward = 46.89
2022-01-26 14:16:58.951 | DEBUG    | __main__:trials:24 - Trial = 7109/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.953 | DEBUG    | __main__:trials:29 - Trial = 7109/30000 | Total reward = 42.21
2022-01-26 14:16:58.956 | DEBUG    | __main__:trials:24 - Trial = 7110/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.957 | DEBUG    | __main__:trials:29 - Trial = 7110/30000 | Total reward = 34.20
2022-01-26 14:16:58.960 | DEBUG    | __main__:trials:24 - Trial = 7111/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.962 | DEBUG    | __main__:trials:29 - Trial = 7111/30000 | Total reward = 42.73
2022-01-26 14:16:58.965 | DEBUG    | __main__:trials:24 - Trial = 7112/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.966 | DEBUG    | __main__:trials:29 - Trial = 7112/30000 | Total reward = 42.87
2022-01-26 14:16:58.969 | DEBUG    | __main__:trials:24 - Trial = 7113/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.970 | DEBUG    | __main__:trials:29 - Trial = 7113/30000 | Total reward = 41.43
2022-01-26 14:16:58.973 | DEBUG    | __main__:trials:24 - Trial = 7114/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.975 | DEBUG    | __main__:trials:29 - Trial = 7114/30000 | Total reward = 41.27
2022-01-26 14:16:58.979 | DEBUG    | __main__:trials:24 - Trial = 7115/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.980 | DEBUG    | __main__:trials:29 - Trial = 7115/30000 | Total reward = 36.51
2022-01-26 14:16:58.984 | DEBUG    | __main__:trials:24 - Trial = 7116/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.985 | DEBUG    | __main__:trials:29 - Trial = 7116/30000 | Total reward = 48.54
2022-01-26 14:16:58.989 | DEBUG    | __main__:trials:24 - Trial = 7117/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.990 | DEBUG    | __main__:trials:29 - Trial = 7117/30000 | Total reward = 42.97
2022-01-26 14:16:58.994 | DEBUG    | __main__:trials:24 - Trial = 7118/30000 | Max number of steps (20) reached
2022-01-26 14:16:58.996 | DEBUG    | __main__:trials:29 - Trial = 7118/30000 | Total reward = 43.14
2022-01-26 14:16:58.999 | DEBUG    | __main__:trials:24 - Trial = 7119/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.000 | DEBUG    | __main__:trials:29 - Trial = 7119/30000 | Total reward = 51.69
2022-01-26 14:16:59.004 | DEBUG    | __main__:trials:24 - Trial = 7120/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.006 | DEBUG    | __main__:trials:29 - Trial = 7120/30000 | Total reward = 38.61
2022-01-26 14:16:59.010 | DEBUG    | __main__:trials:24 - Trial = 7121/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.011 | DEBUG    | __main__:trials:29 - Trial = 7121/30000 | Total reward = 39.52
2022-01-26 14:16:59.015 | DEBUG    | __main__:trials:24 - Trial = 7122/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.016 | DEBUG    | __main__:trials:29 - Trial = 7122/30000 | Total reward = 53.64
2022-01-26 14:16:59.020 | DEBUG    | __main__:trials:24 - Trial = 7123/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.021 | DEBUG    | __main__:trials:29 - Trial = 7123/30000 | Total reward = 42.56
2022-01-26 14:16:59.025 | DEBUG    | __main__:trials:24 - Trial = 7124/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.026 | DEBUG    | __main__:trials:29 - Trial = 7124/30000 | Total reward = 43.07
2022-01-26 14:16:59.030 | DEBUG    | __main__:trials:24 - Trial = 7125/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.031 | DEBUG    | __main__:trials:29 - Trial = 7125/30000 | Total reward = 34.92
2022-01-26 14:16:59.035 | DEBUG    | __main__:trials:24 - Trial = 7126/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.037 | DEBUG    | __main__:trials:29 - Trial = 7126/30000 | Total reward = 25.22
2022-01-26 14:16:59.040 | DEBUG    | __main__:trials:24 - Trial = 7127/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.042 | DEBUG    | __main__:trials:29 - Trial = 7127/30000 | Total reward = 40.79
2022-01-26 14:16:59.046 | DEBUG    | __main__:trials:24 - Trial = 7128/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.047 | DEBUG    | __main__:trials:29 - Trial = 7128/30000 | Total reward = 41.20
2022-01-26 14:16:59.051 | DEBUG    | __main__:trials:24 - Trial = 7129/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.053 | DEBUG    | __main__:trials:29 - Trial = 7129/30000 | Total reward = 43.39
2022-01-26 14:16:59.056 | DEBUG    | __main__:trials:24 - Trial = 7130/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.058 | DEBUG    | __main__:trials:29 - Trial = 7130/30000 | Total reward = 42.45
2022-01-26 14:16:59.062 | DEBUG    | __main__:trials:24 - Trial = 7131/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.062 | DEBUG    | __main__:trials:29 - Trial = 7131/30000 | Total reward = 32.58
2022-01-26 14:16:59.067 | DEBUG    | __main__:trials:24 - Trial = 7132/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.068 | DEBUG    | __main__:trials:29 - Trial = 7132/30000 | Total reward = 36.07
2022-01-26 14:16:59.072 | DEBUG    | __main__:trials:24 - Trial = 7133/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.073 | DEBUG    | __main__:trials:29 - Trial = 7133/30000 | Total reward = 54.52
2022-01-26 14:16:59.077 | DEBUG    | __main__:trials:24 - Trial = 7134/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.078 | DEBUG    | __main__:trials:29 - Trial = 7134/30000 | Total reward = 37.46
2022-01-26 14:16:59.082 | DEBUG    | __main__:trials:24 - Trial = 7135/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.083 | DEBUG    | __main__:trials:29 - Trial = 7135/30000 | Total reward = 37.41
2022-01-26 14:16:59.087 | DEBUG    | __main__:trials:24 - Trial = 7136/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.089 | DEBUG    | __main__:trials:29 - Trial = 7136/30000 | Total reward = 49.26
2022-01-26 14:16:59.092 | DEBUG    | __main__:trials:24 - Trial = 7137/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.093 | DEBUG    | __main__:trials:29 - Trial = 7137/30000 | Total reward = 56.11
2022-01-26 14:16:59.096 | DEBUG    | __main__:trials:24 - Trial = 7138/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.097 | DEBUG    | __main__:trials:29 - Trial = 7138/30000 | Total reward = 47.48
2022-01-26 14:16:59.100 | DEBUG    | __main__:trials:24 - Trial = 7139/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.102 | DEBUG    | __main__:trials:29 - Trial = 7139/30000 | Total reward = 45.35
2022-01-26 14:16:59.106 | DEBUG    | __main__:trials:24 - Trial = 7140/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.107 | DEBUG    | __main__:trials:29 - Trial = 7140/30000 | Total reward = 38.34
2022-01-26 14:16:59.111 | DEBUG    | __main__:trials:24 - Trial = 7141/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.112 | DEBUG    | __main__:trials:29 - Trial = 7141/30000 | Total reward = 44.43
2022-01-26 14:16:59.116 | DEBUG    | __main__:trials:24 - Trial = 7142/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.117 | DEBUG    | __main__:trials:29 - Trial = 7142/30000 | Total reward = 36.90
2022-01-26 14:16:59.121 | DEBUG    | __main__:trials:24 - Trial = 7143/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.122 | DEBUG    | __main__:trials:29 - Trial = 7143/30000 | Total reward = 44.75
2022-01-26 14:16:59.126 | DEBUG    | __main__:trials:24 - Trial = 7144/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.127 | DEBUG    | __main__:trials:29 - Trial = 7144/30000 | Total reward = 41.38
2022-01-26 14:16:59.131 | DEBUG    | __main__:trials:24 - Trial = 7145/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.132 | DEBUG    | __main__:trials:29 - Trial = 7145/30000 | Total reward = 39.63
2022-01-26 14:16:59.136 | DEBUG    | __main__:trials:24 - Trial = 7146/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.137 | DEBUG    | __main__:trials:29 - Trial = 7146/30000 | Total reward = 44.18
2022-01-26 14:16:59.141 | DEBUG    | __main__:trials:24 - Trial = 7147/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.143 | DEBUG    | __main__:trials:29 - Trial = 7147/30000 | Total reward = 40.32
2022-01-26 14:16:59.145 | DEBUG    | __main__:trials:26 - Trial = 7148/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.146 | DEBUG    | __main__:trials:29 - Trial = 7148/30000 | Total reward = 19.66
2022-01-26 14:16:59.149 | DEBUG    | __main__:trials:24 - Trial = 7149/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.151 | DEBUG    | __main__:trials:29 - Trial = 7149/30000 | Total reward = 50.09
2022-01-26 14:16:59.154 | DEBUG    | __main__:trials:24 - Trial = 7150/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.156 | DEBUG    | __main__:trials:29 - Trial = 7150/30000 | Total reward = 45.80
2022-01-26 14:16:59.159 | DEBUG    | __main__:trials:24 - Trial = 7151/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.161 | DEBUG    | __main__:trials:29 - Trial = 7151/30000 | Total reward = 36.33
2022-01-26 14:16:59.165 | DEBUG    | __main__:trials:24 - Trial = 7152/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.165 | DEBUG    | __main__:trials:29 - Trial = 7152/30000 | Total reward = 43.94
2022-01-26 14:16:59.168 | DEBUG    | __main__:trials:24 - Trial = 7153/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.169 | DEBUG    | __main__:trials:29 - Trial = 7153/30000 | Total reward = 38.74
2022-01-26 14:16:59.173 | DEBUG    | __main__:trials:24 - Trial = 7154/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.173 | DEBUG    | __main__:trials:29 - Trial = 7154/30000 | Total reward = 38.69
2022-01-26 14:16:59.177 | DEBUG    | __main__:trials:24 - Trial = 7155/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.179 | DEBUG    | __main__:trials:29 - Trial = 7155/30000 | Total reward = 48.52
2022-01-26 14:16:59.181 | DEBUG    | __main__:trials:24 - Trial = 7156/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.183 | DEBUG    | __main__:trials:29 - Trial = 7156/30000 | Total reward = 50.56
2022-01-26 14:16:59.187 | DEBUG    | __main__:trials:24 - Trial = 7157/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.189 | DEBUG    | __main__:trials:29 - Trial = 7157/30000 | Total reward = 43.07
2022-01-26 14:16:59.192 | DEBUG    | __main__:trials:24 - Trial = 7158/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.194 | DEBUG    | __main__:trials:29 - Trial = 7158/30000 | Total reward = 43.98
2022-01-26 14:16:59.197 | DEBUG    | __main__:trials:24 - Trial = 7159/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.199 | DEBUG    | __main__:trials:29 - Trial = 7159/30000 | Total reward = 42.77
2022-01-26 14:16:59.202 | DEBUG    | __main__:trials:24 - Trial = 7160/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.203 | DEBUG    | __main__:trials:29 - Trial = 7160/30000 | Total reward = 41.39
2022-01-26 14:16:59.207 | DEBUG    | __main__:trials:24 - Trial = 7161/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.209 | DEBUG    | __main__:trials:29 - Trial = 7161/30000 | Total reward = 53.08
2022-01-26 14:16:59.212 | DEBUG    | __main__:trials:24 - Trial = 7162/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.214 | DEBUG    | __main__:trials:29 - Trial = 7162/30000 | Total reward = 41.27
2022-01-26 14:16:59.217 | DEBUG    | __main__:trials:24 - Trial = 7163/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.219 | DEBUG    | __main__:trials:29 - Trial = 7163/30000 | Total reward = 38.71
2022-01-26 14:16:59.222 | DEBUG    | __main__:trials:24 - Trial = 7164/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.223 | DEBUG    | __main__:trials:29 - Trial = 7164/30000 | Total reward = 41.42
2022-01-26 14:16:59.226 | DEBUG    | __main__:trials:24 - Trial = 7165/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.228 | DEBUG    | __main__:trials:29 - Trial = 7165/30000 | Total reward = 39.94
2022-01-26 14:16:59.232 | DEBUG    | __main__:trials:24 - Trial = 7166/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.234 | DEBUG    | __main__:trials:29 - Trial = 7166/30000 | Total reward = 49.67
2022-01-26 14:16:59.238 | DEBUG    | __main__:trials:24 - Trial = 7167/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.239 | DEBUG    | __main__:trials:29 - Trial = 7167/30000 | Total reward = 48.57
2022-01-26 14:16:59.243 | DEBUG    | __main__:trials:24 - Trial = 7168/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.245 | DEBUG    | __main__:trials:29 - Trial = 7168/30000 | Total reward = 44.35
2022-01-26 14:16:59.248 | DEBUG    | __main__:trials:24 - Trial = 7169/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.250 | DEBUG    | __main__:trials:29 - Trial = 7169/30000 | Total reward = 40.96
2022-01-26 14:16:59.253 | DEBUG    | __main__:trials:24 - Trial = 7170/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.254 | DEBUG    | __main__:trials:29 - Trial = 7170/30000 | Total reward = 40.37
2022-01-26 14:16:59.257 | DEBUG    | __main__:trials:24 - Trial = 7171/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.258 | DEBUG    | __main__:trials:29 - Trial = 7171/30000 | Total reward = 43.43
2022-01-26 14:16:59.261 | DEBUG    | __main__:trials:24 - Trial = 7172/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.263 | DEBUG    | __main__:trials:29 - Trial = 7172/30000 | Total reward = 40.95
2022-01-26 14:16:59.266 | DEBUG    | __main__:trials:24 - Trial = 7173/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.267 | DEBUG    | __main__:trials:29 - Trial = 7173/30000 | Total reward = 47.91
2022-01-26 14:16:59.271 | DEBUG    | __main__:trials:24 - Trial = 7174/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.273 | DEBUG    | __main__:trials:29 - Trial = 7174/30000 | Total reward = 39.45
2022-01-26 14:16:59.276 | DEBUG    | __main__:trials:24 - Trial = 7175/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.277 | DEBUG    | __main__:trials:29 - Trial = 7175/30000 | Total reward = 41.31
2022-01-26 14:16:59.280 | DEBUG    | __main__:trials:26 - Trial = 7176/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.281 | DEBUG    | __main__:trials:29 - Trial = 7176/30000 | Total reward = 27.12
2022-01-26 14:16:59.284 | DEBUG    | __main__:trials:24 - Trial = 7177/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.286 | DEBUG    | __main__:trials:29 - Trial = 7177/30000 | Total reward = 43.20
2022-01-26 14:16:59.289 | DEBUG    | __main__:trials:26 - Trial = 7178/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.290 | DEBUG    | __main__:trials:29 - Trial = 7178/30000 | Total reward = 33.09
2022-01-26 14:16:59.293 | DEBUG    | __main__:trials:24 - Trial = 7179/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.295 | DEBUG    | __main__:trials:29 - Trial = 7179/30000 | Total reward = 32.78
2022-01-26 14:16:59.299 | DEBUG    | __main__:trials:24 - Trial = 7180/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.300 | DEBUG    | __main__:trials:29 - Trial = 7180/30000 | Total reward = 43.26
2022-01-26 14:16:59.303 | DEBUG    | __main__:trials:26 - Trial = 7181/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.305 | DEBUG    | __main__:trials:29 - Trial = 7181/30000 | Total reward = 21.45
2022-01-26 14:16:59.308 | DEBUG    | __main__:trials:24 - Trial = 7182/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.310 | DEBUG    | __main__:trials:29 - Trial = 7182/30000 | Total reward = 57.92
2022-01-26 14:16:59.313 | DEBUG    | __main__:trials:24 - Trial = 7183/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.314 | DEBUG    | __main__:trials:29 - Trial = 7183/30000 | Total reward = 46.93
2022-01-26 14:16:59.317 | DEBUG    | __main__:trials:24 - Trial = 7184/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.319 | DEBUG    | __main__:trials:29 - Trial = 7184/30000 | Total reward = 22.64
2022-01-26 14:16:59.322 | DEBUG    | __main__:trials:24 - Trial = 7185/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.324 | DEBUG    | __main__:trials:29 - Trial = 7185/30000 | Total reward = 35.00
2022-01-26 14:16:59.327 | DEBUG    | __main__:trials:24 - Trial = 7186/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.329 | DEBUG    | __main__:trials:29 - Trial = 7186/30000 | Total reward = 27.59
2022-01-26 14:16:59.332 | DEBUG    | __main__:trials:24 - Trial = 7187/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.334 | DEBUG    | __main__:trials:29 - Trial = 7187/30000 | Total reward = 43.04
2022-01-26 14:16:59.337 | DEBUG    | __main__:trials:24 - Trial = 7188/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.339 | DEBUG    | __main__:trials:29 - Trial = 7188/30000 | Total reward = 42.35
2022-01-26 14:16:59.343 | DEBUG    | __main__:trials:24 - Trial = 7189/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.345 | DEBUG    | __main__:trials:29 - Trial = 7189/30000 | Total reward = 39.62
2022-01-26 14:16:59.348 | DEBUG    | __main__:trials:24 - Trial = 7190/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.350 | DEBUG    | __main__:trials:29 - Trial = 7190/30000 | Total reward = 42.83
2022-01-26 14:16:59.354 | DEBUG    | __main__:trials:24 - Trial = 7191/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.355 | DEBUG    | __main__:trials:29 - Trial = 7191/30000 | Total reward = 58.09
2022-01-26 14:16:59.359 | DEBUG    | __main__:trials:24 - Trial = 7192/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.360 | DEBUG    | __main__:trials:29 - Trial = 7192/30000 | Total reward = 35.39
2022-01-26 14:16:59.364 | DEBUG    | __main__:trials:24 - Trial = 7193/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.365 | DEBUG    | __main__:trials:29 - Trial = 7193/30000 | Total reward = 39.99
2022-01-26 14:16:59.368 | DEBUG    | __main__:trials:24 - Trial = 7194/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.370 | DEBUG    | __main__:trials:29 - Trial = 7194/30000 | Total reward = 41.56
2022-01-26 14:16:59.373 | DEBUG    | __main__:trials:24 - Trial = 7195/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.373 | DEBUG    | __main__:trials:29 - Trial = 7195/30000 | Total reward = 41.27
2022-01-26 14:16:59.376 | DEBUG    | __main__:trials:24 - Trial = 7196/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.377 | DEBUG    | __main__:trials:29 - Trial = 7196/30000 | Total reward = 45.57
2022-01-26 14:16:59.381 | DEBUG    | __main__:trials:24 - Trial = 7197/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.383 | DEBUG    | __main__:trials:29 - Trial = 7197/30000 | Total reward = 53.27
2022-01-26 14:16:59.387 | DEBUG    | __main__:trials:24 - Trial = 7198/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.387 | DEBUG    | __main__:trials:29 - Trial = 7198/30000 | Total reward = 34.98
2022-01-26 14:16:59.391 | DEBUG    | __main__:trials:24 - Trial = 7199/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.392 | DEBUG    | __main__:trials:29 - Trial = 7199/30000 | Total reward = 41.86
2022-01-26 14:16:59.396 | DEBUG    | __main__:trials:24 - Trial = 7200/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.398 | DEBUG    | __main__:trials:29 - Trial = 7200/30000 | Total reward = 39.08
2022-01-26 14:16:59.401 | DEBUG    | __main__:trials:24 - Trial = 7201/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.402 | DEBUG    | __main__:trials:29 - Trial = 7201/30000 | Total reward = 52.39
2022-01-26 14:16:59.406 | DEBUG    | __main__:trials:24 - Trial = 7202/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.407 | DEBUG    | __main__:trials:29 - Trial = 7202/30000 | Total reward = 42.72
2022-01-26 14:16:59.411 | DEBUG    | __main__:trials:24 - Trial = 7203/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.413 | DEBUG    | __main__:trials:29 - Trial = 7203/30000 | Total reward = 51.35
2022-01-26 14:16:59.416 | DEBUG    | __main__:trials:24 - Trial = 7204/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.417 | DEBUG    | __main__:trials:29 - Trial = 7204/30000 | Total reward = 44.80
2022-01-26 14:16:59.421 | DEBUG    | __main__:trials:24 - Trial = 7205/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.422 | DEBUG    | __main__:trials:29 - Trial = 7205/30000 | Total reward = 43.66
2022-01-26 14:16:59.426 | DEBUG    | __main__:trials:24 - Trial = 7206/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.426 | DEBUG    | __main__:trials:29 - Trial = 7206/30000 | Total reward = 40.82
2022-01-26 14:16:59.430 | DEBUG    | __main__:trials:24 - Trial = 7207/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.432 | DEBUG    | __main__:trials:29 - Trial = 7207/30000 | Total reward = 41.27
2022-01-26 14:16:59.435 | DEBUG    | __main__:trials:24 - Trial = 7208/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.435 | DEBUG    | __main__:trials:29 - Trial = 7208/30000 | Total reward = 47.56
2022-01-26 14:16:59.439 | DEBUG    | __main__:trials:24 - Trial = 7209/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.441 | DEBUG    | __main__:trials:29 - Trial = 7209/30000 | Total reward = 41.87
2022-01-26 14:16:59.444 | DEBUG    | __main__:trials:24 - Trial = 7210/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.446 | DEBUG    | __main__:trials:29 - Trial = 7210/30000 | Total reward = 45.43
2022-01-26 14:16:59.450 | DEBUG    | __main__:trials:24 - Trial = 7211/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.451 | DEBUG    | __main__:trials:29 - Trial = 7211/30000 | Total reward = 41.33
2022-01-26 14:16:59.455 | DEBUG    | __main__:trials:24 - Trial = 7212/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.456 | DEBUG    | __main__:trials:29 - Trial = 7212/30000 | Total reward = 36.19
2022-01-26 14:16:59.460 | DEBUG    | __main__:trials:24 - Trial = 7213/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.462 | DEBUG    | __main__:trials:29 - Trial = 7213/30000 | Total reward = 39.55
2022-01-26 14:16:59.466 | DEBUG    | __main__:trials:24 - Trial = 7214/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.466 | DEBUG    | __main__:trials:29 - Trial = 7214/30000 | Total reward = 43.24
2022-01-26 14:16:59.470 | DEBUG    | __main__:trials:24 - Trial = 7215/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.472 | DEBUG    | __main__:trials:29 - Trial = 7215/30000 | Total reward = 36.50
2022-01-26 14:16:59.476 | DEBUG    | __main__:trials:24 - Trial = 7216/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.476 | DEBUG    | __main__:trials:29 - Trial = 7216/30000 | Total reward = 38.30
2022-01-26 14:16:59.480 | DEBUG    | __main__:trials:24 - Trial = 7217/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.482 | DEBUG    | __main__:trials:29 - Trial = 7217/30000 | Total reward = 39.09
2022-01-26 14:16:59.485 | DEBUG    | __main__:trials:24 - Trial = 7218/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.486 | DEBUG    | __main__:trials:29 - Trial = 7218/30000 | Total reward = 45.46
2022-01-26 14:16:59.490 | DEBUG    | __main__:trials:24 - Trial = 7219/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.491 | DEBUG    | __main__:trials:29 - Trial = 7219/30000 | Total reward = 38.57
2022-01-26 14:16:59.495 | DEBUG    | __main__:trials:24 - Trial = 7220/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.496 | DEBUG    | __main__:trials:29 - Trial = 7220/30000 | Total reward = 49.26
2022-01-26 14:16:59.499 | DEBUG    | __main__:trials:24 - Trial = 7221/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.501 | DEBUG    | __main__:trials:29 - Trial = 7221/30000 | Total reward = 38.55
2022-01-26 14:16:59.504 | DEBUG    | __main__:trials:24 - Trial = 7222/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.506 | DEBUG    | __main__:trials:29 - Trial = 7222/30000 | Total reward = 35.68
2022-01-26 14:16:59.510 | DEBUG    | __main__:trials:24 - Trial = 7223/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.511 | DEBUG    | __main__:trials:29 - Trial = 7223/30000 | Total reward = 43.66
2022-01-26 14:16:59.515 | DEBUG    | __main__:trials:24 - Trial = 7224/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.516 | DEBUG    | __main__:trials:29 - Trial = 7224/30000 | Total reward = 42.74
2022-01-26 14:16:59.520 | DEBUG    | __main__:trials:24 - Trial = 7225/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.521 | DEBUG    | __main__:trials:29 - Trial = 7225/30000 | Total reward = 36.46
2022-01-26 14:16:59.525 | DEBUG    | __main__:trials:24 - Trial = 7226/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.525 | DEBUG    | __main__:trials:29 - Trial = 7226/30000 | Total reward = 47.11
2022-01-26 14:16:59.530 | DEBUG    | __main__:trials:24 - Trial = 7227/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.531 | DEBUG    | __main__:trials:29 - Trial = 7227/30000 | Total reward = 32.19
2022-01-26 14:16:59.535 | DEBUG    | __main__:trials:24 - Trial = 7228/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.536 | DEBUG    | __main__:trials:29 - Trial = 7228/30000 | Total reward = 42.05
2022-01-26 14:16:59.540 | DEBUG    | __main__:trials:24 - Trial = 7229/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.542 | DEBUG    | __main__:trials:29 - Trial = 7229/30000 | Total reward = 39.67
2022-01-26 14:16:59.545 | DEBUG    | __main__:trials:24 - Trial = 7230/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.547 | DEBUG    | __main__:trials:29 - Trial = 7230/30000 | Total reward = 29.93
2022-01-26 14:16:59.551 | DEBUG    | __main__:trials:24 - Trial = 7231/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.552 | DEBUG    | __main__:trials:29 - Trial = 7231/30000 | Total reward = 50.72
2022-01-26 14:16:59.556 | DEBUG    | __main__:trials:24 - Trial = 7232/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.557 | DEBUG    | __main__:trials:29 - Trial = 7232/30000 | Total reward = 50.83
2022-01-26 14:16:59.561 | DEBUG    | __main__:trials:24 - Trial = 7233/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.563 | DEBUG    | __main__:trials:29 - Trial = 7233/30000 | Total reward = 41.78
2022-01-26 14:16:59.566 | DEBUG    | __main__:trials:24 - Trial = 7234/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.568 | DEBUG    | __main__:trials:29 - Trial = 7234/30000 | Total reward = 43.39
2022-01-26 14:16:59.571 | DEBUG    | __main__:trials:24 - Trial = 7235/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.573 | DEBUG    | __main__:trials:29 - Trial = 7235/30000 | Total reward = 41.93
2022-01-26 14:16:59.576 | DEBUG    | __main__:trials:24 - Trial = 7236/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.578 | DEBUG    | __main__:trials:29 - Trial = 7236/30000 | Total reward = 41.78
2022-01-26 14:16:59.582 | DEBUG    | __main__:trials:24 - Trial = 7237/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.582 | DEBUG    | __main__:trials:29 - Trial = 7237/30000 | Total reward = 32.88
2022-01-26 14:16:59.586 | DEBUG    | __main__:trials:24 - Trial = 7238/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.588 | DEBUG    | __main__:trials:29 - Trial = 7238/30000 | Total reward = 40.47
2022-01-26 14:16:59.591 | DEBUG    | __main__:trials:24 - Trial = 7239/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.593 | DEBUG    | __main__:trials:29 - Trial = 7239/30000 | Total reward = 42.74
2022-01-26 14:16:59.596 | DEBUG    | __main__:trials:24 - Trial = 7240/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.597 | DEBUG    | __main__:trials:29 - Trial = 7240/30000 | Total reward = 49.26
2022-01-26 14:16:59.601 | DEBUG    | __main__:trials:24 - Trial = 7241/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.603 | DEBUG    | __main__:trials:29 - Trial = 7241/30000 | Total reward = 48.28
2022-01-26 14:16:59.606 | DEBUG    | __main__:trials:24 - Trial = 7242/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.607 | DEBUG    | __main__:trials:29 - Trial = 7242/30000 | Total reward = 42.77
2022-01-26 14:16:59.611 | DEBUG    | __main__:trials:24 - Trial = 7243/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.613 | DEBUG    | __main__:trials:29 - Trial = 7243/30000 | Total reward = 41.27
2022-01-26 14:16:59.616 | DEBUG    | __main__:trials:24 - Trial = 7244/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.618 | DEBUG    | __main__:trials:29 - Trial = 7244/30000 | Total reward = 35.98
2022-01-26 14:16:59.621 | DEBUG    | __main__:trials:24 - Trial = 7245/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.623 | DEBUG    | __main__:trials:29 - Trial = 7245/30000 | Total reward = 35.39
2022-01-26 14:16:59.626 | DEBUG    | __main__:trials:24 - Trial = 7246/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.628 | DEBUG    | __main__:trials:29 - Trial = 7246/30000 | Total reward = 48.28
2022-01-26 14:16:59.632 | DEBUG    | __main__:trials:24 - Trial = 7247/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.633 | DEBUG    | __main__:trials:29 - Trial = 7247/30000 | Total reward = 45.76
2022-01-26 14:16:59.637 | DEBUG    | __main__:trials:24 - Trial = 7248/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.639 | DEBUG    | __main__:trials:29 - Trial = 7248/30000 | Total reward = 41.61
2022-01-26 14:16:59.642 | DEBUG    | __main__:trials:24 - Trial = 7249/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.643 | DEBUG    | __main__:trials:29 - Trial = 7249/30000 | Total reward = 28.18
2022-01-26 14:16:59.647 | DEBUG    | __main__:trials:24 - Trial = 7250/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.649 | DEBUG    | __main__:trials:29 - Trial = 7250/30000 | Total reward = 30.82
2022-01-26 14:16:59.652 | DEBUG    | __main__:trials:24 - Trial = 7251/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.654 | DEBUG    | __main__:trials:29 - Trial = 7251/30000 | Total reward = 36.41
2022-01-26 14:16:59.658 | DEBUG    | __main__:trials:24 - Trial = 7252/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.660 | DEBUG    | __main__:trials:29 - Trial = 7252/30000 | Total reward = 58.29
2022-01-26 14:16:59.664 | DEBUG    | __main__:trials:24 - Trial = 7253/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.665 | DEBUG    | __main__:trials:29 - Trial = 7253/30000 | Total reward = 39.66
2022-01-26 14:16:59.669 | DEBUG    | __main__:trials:24 - Trial = 7254/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.670 | DEBUG    | __main__:trials:29 - Trial = 7254/30000 | Total reward = 44.18
2022-01-26 14:16:59.673 | DEBUG    | __main__:trials:24 - Trial = 7255/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.676 | DEBUG    | __main__:trials:29 - Trial = 7255/30000 | Total reward = 36.37
2022-01-26 14:16:59.679 | DEBUG    | __main__:trials:24 - Trial = 7256/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.681 | DEBUG    | __main__:trials:29 - Trial = 7256/30000 | Total reward = 42.76
2022-01-26 14:16:59.684 | DEBUG    | __main__:trials:24 - Trial = 7257/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.686 | DEBUG    | __main__:trials:29 - Trial = 7257/30000 | Total reward = 39.60
2022-01-26 14:16:59.689 | DEBUG    | __main__:trials:24 - Trial = 7258/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.690 | DEBUG    | __main__:trials:29 - Trial = 7258/30000 | Total reward = 30.20
2022-01-26 14:16:59.693 | DEBUG    | __main__:trials:26 - Trial = 7259/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.694 | DEBUG    | __main__:trials:29 - Trial = 7259/30000 | Total reward = 22.68
2022-01-26 14:16:59.698 | DEBUG    | __main__:trials:24 - Trial = 7260/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.700 | DEBUG    | __main__:trials:29 - Trial = 7260/30000 | Total reward = 59.30
2022-01-26 14:16:59.703 | DEBUG    | __main__:trials:24 - Trial = 7261/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.705 | DEBUG    | __main__:trials:29 - Trial = 7261/30000 | Total reward = 53.51
2022-01-26 14:16:59.708 | DEBUG    | __main__:trials:24 - Trial = 7262/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.709 | DEBUG    | __main__:trials:29 - Trial = 7262/30000 | Total reward = 35.71
2022-01-26 14:16:59.713 | DEBUG    | __main__:trials:24 - Trial = 7263/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.713 | DEBUG    | __main__:trials:29 - Trial = 7263/30000 | Total reward = 48.52
2022-01-26 14:16:59.717 | DEBUG    | __main__:trials:24 - Trial = 7264/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.719 | DEBUG    | __main__:trials:29 - Trial = 7264/30000 | Total reward = 50.16
2022-01-26 14:16:59.722 | DEBUG    | __main__:trials:24 - Trial = 7265/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.724 | DEBUG    | __main__:trials:29 - Trial = 7265/30000 | Total reward = 54.72
2022-01-26 14:16:59.728 | DEBUG    | __main__:trials:24 - Trial = 7266/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.729 | DEBUG    | __main__:trials:29 - Trial = 7266/30000 | Total reward = 33.40
2022-01-26 14:16:59.732 | DEBUG    | __main__:trials:24 - Trial = 7267/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.734 | DEBUG    | __main__:trials:29 - Trial = 7267/30000 | Total reward = 39.06
2022-01-26 14:16:59.736 | DEBUG    | __main__:trials:26 - Trial = 7268/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.738 | DEBUG    | __main__:trials:29 - Trial = 7268/30000 | Total reward = 22.54
2022-01-26 14:16:59.741 | DEBUG    | __main__:trials:24 - Trial = 7269/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.742 | DEBUG    | __main__:trials:29 - Trial = 7269/30000 | Total reward = 46.22
2022-01-26 14:16:59.746 | DEBUG    | __main__:trials:24 - Trial = 7270/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.748 | DEBUG    | __main__:trials:29 - Trial = 7270/30000 | Total reward = 28.76
2022-01-26 14:16:59.752 | DEBUG    | __main__:trials:24 - Trial = 7271/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.752 | DEBUG    | __main__:trials:29 - Trial = 7271/30000 | Total reward = 28.32
2022-01-26 14:16:59.756 | DEBUG    | __main__:trials:24 - Trial = 7272/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.758 | DEBUG    | __main__:trials:29 - Trial = 7272/30000 | Total reward = 48.93
2022-01-26 14:16:59.761 | DEBUG    | __main__:trials:24 - Trial = 7273/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.763 | DEBUG    | __main__:trials:29 - Trial = 7273/30000 | Total reward = 47.19
2022-01-26 14:16:59.767 | DEBUG    | __main__:trials:24 - Trial = 7274/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.768 | DEBUG    | __main__:trials:29 - Trial = 7274/30000 | Total reward = 45.55
2022-01-26 14:16:59.772 | DEBUG    | __main__:trials:24 - Trial = 7275/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.773 | DEBUG    | __main__:trials:29 - Trial = 7275/30000 | Total reward = 47.07
2022-01-26 14:16:59.776 | DEBUG    | __main__:trials:24 - Trial = 7276/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.778 | DEBUG    | __main__:trials:29 - Trial = 7276/30000 | Total reward = 45.95
2022-01-26 14:16:59.781 | DEBUG    | __main__:trials:24 - Trial = 7277/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.784 | DEBUG    | __main__:trials:29 - Trial = 7277/30000 | Total reward = 47.42
2022-01-26 14:16:59.787 | DEBUG    | __main__:trials:24 - Trial = 7278/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.789 | DEBUG    | __main__:trials:29 - Trial = 7278/30000 | Total reward = 42.59
2022-01-26 14:16:59.792 | DEBUG    | __main__:trials:24 - Trial = 7279/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.793 | DEBUG    | __main__:trials:29 - Trial = 7279/30000 | Total reward = 57.68
2022-01-26 14:16:59.797 | DEBUG    | __main__:trials:24 - Trial = 7280/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.798 | DEBUG    | __main__:trials:29 - Trial = 7280/30000 | Total reward = 47.21
2022-01-26 14:16:59.802 | DEBUG    | __main__:trials:24 - Trial = 7281/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.803 | DEBUG    | __main__:trials:29 - Trial = 7281/30000 | Total reward = 47.77
2022-01-26 14:16:59.806 | DEBUG    | __main__:trials:24 - Trial = 7282/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.808 | DEBUG    | __main__:trials:29 - Trial = 7282/30000 | Total reward = 46.93
2022-01-26 14:16:59.811 | DEBUG    | __main__:trials:24 - Trial = 7283/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.813 | DEBUG    | __main__:trials:29 - Trial = 7283/30000 | Total reward = 47.19
2022-01-26 14:16:59.817 | DEBUG    | __main__:trials:24 - Trial = 7284/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.818 | DEBUG    | __main__:trials:29 - Trial = 7284/30000 | Total reward = 41.57
2022-01-26 14:16:59.822 | DEBUG    | __main__:trials:24 - Trial = 7285/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.824 | DEBUG    | __main__:trials:29 - Trial = 7285/30000 | Total reward = 40.32
2022-01-26 14:16:59.827 | DEBUG    | __main__:trials:24 - Trial = 7286/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.829 | DEBUG    | __main__:trials:29 - Trial = 7286/30000 | Total reward = 49.37
2022-01-26 14:16:59.832 | DEBUG    | __main__:trials:24 - Trial = 7287/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.834 | DEBUG    | __main__:trials:29 - Trial = 7287/30000 | Total reward = 38.04
2022-01-26 14:16:59.838 | DEBUG    | __main__:trials:24 - Trial = 7288/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.839 | DEBUG    | __main__:trials:29 - Trial = 7288/30000 | Total reward = 48.31
2022-01-26 14:16:59.843 | DEBUG    | __main__:trials:24 - Trial = 7289/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.844 | DEBUG    | __main__:trials:29 - Trial = 7289/30000 | Total reward = 51.08
2022-01-26 14:16:59.847 | DEBUG    | __main__:trials:24 - Trial = 7290/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.854 | DEBUG    | __main__:trials:29 - Trial = 7290/30000 | Total reward = 29.41
2022-01-26 14:16:59.857 | DEBUG    | __main__:trials:24 - Trial = 7291/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.859 | DEBUG    | __main__:trials:29 - Trial = 7291/30000 | Total reward = 48.02
2022-01-26 14:16:59.863 | DEBUG    | __main__:trials:24 - Trial = 7292/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.863 | DEBUG    | __main__:trials:29 - Trial = 7292/30000 | Total reward = 34.59
2022-01-26 14:16:59.867 | DEBUG    | __main__:trials:24 - Trial = 7293/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.869 | DEBUG    | __main__:trials:29 - Trial = 7293/30000 | Total reward = 46.07
2022-01-26 14:16:59.873 | DEBUG    | __main__:trials:24 - Trial = 7294/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.874 | DEBUG    | __main__:trials:29 - Trial = 7294/30000 | Total reward = 47.22
2022-01-26 14:16:59.878 | DEBUG    | __main__:trials:24 - Trial = 7295/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.880 | DEBUG    | __main__:trials:29 - Trial = 7295/30000 | Total reward = 43.85
2022-01-26 14:16:59.883 | DEBUG    | __main__:trials:24 - Trial = 7296/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.884 | DEBUG    | __main__:trials:29 - Trial = 7296/30000 | Total reward = 47.27
2022-01-26 14:16:59.888 | DEBUG    | __main__:trials:24 - Trial = 7297/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.890 | DEBUG    | __main__:trials:29 - Trial = 7297/30000 | Total reward = 42.46
2022-01-26 14:16:59.893 | DEBUG    | __main__:trials:24 - Trial = 7298/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.895 | DEBUG    | __main__:trials:29 - Trial = 7298/30000 | Total reward = 49.93
2022-01-26 14:16:59.898 | DEBUG    | __main__:trials:24 - Trial = 7299/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.898 | DEBUG    | __main__:trials:29 - Trial = 7299/30000 | Total reward = 48.23
2022-01-26 14:16:59.902 | DEBUG    | __main__:trials:24 - Trial = 7300/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.904 | DEBUG    | __main__:trials:29 - Trial = 7300/30000 | Total reward = 47.39
2022-01-26 14:16:59.907 | DEBUG    | __main__:trials:24 - Trial = 7301/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.908 | DEBUG    | __main__:trials:29 - Trial = 7301/30000 | Total reward = 36.02
2022-01-26 14:16:59.912 | DEBUG    | __main__:trials:24 - Trial = 7302/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.914 | DEBUG    | __main__:trials:29 - Trial = 7302/30000 | Total reward = 43.34
2022-01-26 14:16:59.917 | DEBUG    | __main__:trials:24 - Trial = 7303/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.919 | DEBUG    | __main__:trials:29 - Trial = 7303/30000 | Total reward = 44.77
2022-01-26 14:16:59.922 | DEBUG    | __main__:trials:24 - Trial = 7304/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.924 | DEBUG    | __main__:trials:29 - Trial = 7304/30000 | Total reward = 47.03
2022-01-26 14:16:59.927 | DEBUG    | __main__:trials:24 - Trial = 7305/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.929 | DEBUG    | __main__:trials:29 - Trial = 7305/30000 | Total reward = 35.84
2022-01-26 14:16:59.932 | DEBUG    | __main__:trials:24 - Trial = 7306/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.934 | DEBUG    | __main__:trials:29 - Trial = 7306/30000 | Total reward = 47.62
2022-01-26 14:16:59.937 | DEBUG    | __main__:trials:24 - Trial = 7307/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.938 | DEBUG    | __main__:trials:29 - Trial = 7307/30000 | Total reward = 47.45
2022-01-26 14:16:59.941 | DEBUG    | __main__:trials:26 - Trial = 7308/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.944 | DEBUG    | __main__:trials:29 - Trial = 7308/30000 | Total reward = 26.05
2022-01-26 14:16:59.947 | DEBUG    | __main__:trials:24 - Trial = 7309/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.949 | DEBUG    | __main__:trials:29 - Trial = 7309/30000 | Total reward = 61.92
2022-01-26 14:16:59.952 | DEBUG    | __main__:trials:24 - Trial = 7310/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.953 | DEBUG    | __main__:trials:29 - Trial = 7310/30000 | Total reward = 47.59
2022-01-26 14:16:59.956 | DEBUG    | __main__:trials:24 - Trial = 7311/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.958 | DEBUG    | __main__:trials:29 - Trial = 7311/30000 | Total reward = 47.03
2022-01-26 14:16:59.961 | DEBUG    | __main__:trials:24 - Trial = 7312/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.963 | DEBUG    | __main__:trials:29 - Trial = 7312/30000 | Total reward = 36.19
2022-01-26 14:16:59.966 | DEBUG    | __main__:trials:26 - Trial = 7313/30000 | Agent went out of bounds, resetting
2022-01-26 14:16:59.967 | DEBUG    | __main__:trials:29 - Trial = 7313/30000 | Total reward = 28.78
2022-01-26 14:16:59.972 | DEBUG    | __main__:trials:24 - Trial = 7314/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.973 | DEBUG    | __main__:trials:29 - Trial = 7314/30000 | Total reward = 32.32
2022-01-26 14:16:59.976 | DEBUG    | __main__:trials:24 - Trial = 7315/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.978 | DEBUG    | __main__:trials:29 - Trial = 7315/30000 | Total reward = 47.35
2022-01-26 14:16:59.981 | DEBUG    | __main__:trials:24 - Trial = 7316/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.983 | DEBUG    | __main__:trials:29 - Trial = 7316/30000 | Total reward = 48.76
2022-01-26 14:16:59.987 | DEBUG    | __main__:trials:24 - Trial = 7317/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.988 | DEBUG    | __main__:trials:29 - Trial = 7317/30000 | Total reward = 50.00
2022-01-26 14:16:59.992 | DEBUG    | __main__:trials:24 - Trial = 7318/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.993 | DEBUG    | __main__:trials:29 - Trial = 7318/30000 | Total reward = 47.39
2022-01-26 14:16:59.997 | DEBUG    | __main__:trials:24 - Trial = 7319/30000 | Max number of steps (20) reached
2022-01-26 14:16:59.998 | DEBUG    | __main__:trials:29 - Trial = 7319/30000 | Total reward = 46.03
2022-01-26 14:17:00.002 | DEBUG    | __main__:trials:24 - Trial = 7320/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.003 | DEBUG    | __main__:trials:29 - Trial = 7320/30000 | Total reward = 37.09
2022-01-26 14:17:00.007 | DEBUG    | __main__:trials:24 - Trial = 7321/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.008 | DEBUG    | __main__:trials:29 - Trial = 7321/30000 | Total reward = 35.71
2022-01-26 14:17:00.011 | DEBUG    | __main__:trials:24 - Trial = 7322/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.013 | DEBUG    | __main__:trials:29 - Trial = 7322/30000 | Total reward = 39.64
2022-01-26 14:17:00.017 | DEBUG    | __main__:trials:24 - Trial = 7323/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.018 | DEBUG    | __main__:trials:29 - Trial = 7323/30000 | Total reward = 43.68
2022-01-26 14:17:00.022 | DEBUG    | __main__:trials:24 - Trial = 7324/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.023 | DEBUG    | __main__:trials:29 - Trial = 7324/30000 | Total reward = 51.83
2022-01-26 14:17:00.026 | DEBUG    | __main__:trials:24 - Trial = 7325/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.028 | DEBUG    | __main__:trials:29 - Trial = 7325/30000 | Total reward = 37.83
2022-01-26 14:17:00.032 | DEBUG    | __main__:trials:24 - Trial = 7326/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.033 | DEBUG    | __main__:trials:29 - Trial = 7326/30000 | Total reward = 56.65
2022-01-26 14:17:00.037 | DEBUG    | __main__:trials:24 - Trial = 7327/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.038 | DEBUG    | __main__:trials:29 - Trial = 7327/30000 | Total reward = 33.20
2022-01-26 14:17:00.042 | DEBUG    | __main__:trials:24 - Trial = 7328/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.043 | DEBUG    | __main__:trials:29 - Trial = 7328/30000 | Total reward = 48.31
2022-01-26 14:17:00.047 | DEBUG    | __main__:trials:24 - Trial = 7329/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.050 | DEBUG    | __main__:trials:29 - Trial = 7329/30000 | Total reward = 51.33
2022-01-26 14:17:00.052 | DEBUG    | __main__:trials:24 - Trial = 7330/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.054 | DEBUG    | __main__:trials:29 - Trial = 7330/30000 | Total reward = 44.54
2022-01-26 14:17:00.057 | DEBUG    | __main__:trials:24 - Trial = 7331/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.059 | DEBUG    | __main__:trials:29 - Trial = 7331/30000 | Total reward = 45.49
2022-01-26 14:17:00.062 | DEBUG    | __main__:trials:24 - Trial = 7332/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.064 | DEBUG    | __main__:trials:29 - Trial = 7332/30000 | Total reward = 28.57
2022-01-26 14:17:00.067 | DEBUG    | __main__:trials:24 - Trial = 7333/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.069 | DEBUG    | __main__:trials:29 - Trial = 7333/30000 | Total reward = 47.21
2022-01-26 14:17:00.072 | DEBUG    | __main__:trials:24 - Trial = 7334/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.073 | DEBUG    | __main__:trials:29 - Trial = 7334/30000 | Total reward = 33.44
2022-01-26 14:17:00.076 | DEBUG    | __main__:trials:24 - Trial = 7335/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.078 | DEBUG    | __main__:trials:29 - Trial = 7335/30000 | Total reward = 34.17
2022-01-26 14:17:00.082 | DEBUG    | __main__:trials:24 - Trial = 7336/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.083 | DEBUG    | __main__:trials:29 - Trial = 7336/30000 | Total reward = 48.23
2022-01-26 14:17:00.087 | DEBUG    | __main__:trials:24 - Trial = 7337/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.089 | DEBUG    | __main__:trials:29 - Trial = 7337/30000 | Total reward = 40.97
2022-01-26 14:17:00.092 | DEBUG    | __main__:trials:24 - Trial = 7338/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.094 | DEBUG    | __main__:trials:29 - Trial = 7338/30000 | Total reward = 35.91
2022-01-26 14:17:00.097 | DEBUG    | __main__:trials:24 - Trial = 7339/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.099 | DEBUG    | __main__:trials:29 - Trial = 7339/30000 | Total reward = 34.43
2022-01-26 14:17:00.102 | DEBUG    | __main__:trials:24 - Trial = 7340/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.104 | DEBUG    | __main__:trials:29 - Trial = 7340/30000 | Total reward = 40.03
2022-01-26 14:17:00.108 | DEBUG    | __main__:trials:24 - Trial = 7341/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.108 | DEBUG    | __main__:trials:29 - Trial = 7341/30000 | Total reward = 46.97
2022-01-26 14:17:00.112 | DEBUG    | __main__:trials:24 - Trial = 7342/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.114 | DEBUG    | __main__:trials:29 - Trial = 7342/30000 | Total reward = 30.86
2022-01-26 14:17:00.117 | DEBUG    | __main__:trials:24 - Trial = 7343/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.119 | DEBUG    | __main__:trials:29 - Trial = 7343/30000 | Total reward = 43.41
2022-01-26 14:17:00.122 | DEBUG    | __main__:trials:24 - Trial = 7344/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.123 | DEBUG    | __main__:trials:29 - Trial = 7344/30000 | Total reward = 49.17
2022-01-26 14:17:00.127 | DEBUG    | __main__:trials:24 - Trial = 7345/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.128 | DEBUG    | __main__:trials:29 - Trial = 7345/30000 | Total reward = 42.50
2022-01-26 14:17:00.132 | DEBUG    | __main__:trials:24 - Trial = 7346/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.133 | DEBUG    | __main__:trials:29 - Trial = 7346/30000 | Total reward = 40.75
2022-01-26 14:17:00.137 | DEBUG    | __main__:trials:24 - Trial = 7347/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.138 | DEBUG    | __main__:trials:29 - Trial = 7347/30000 | Total reward = 48.24
2022-01-26 14:17:00.141 | DEBUG    | __main__:trials:24 - Trial = 7348/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.142 | DEBUG    | __main__:trials:29 - Trial = 7348/30000 | Total reward = 46.69
2022-01-26 14:17:00.145 | DEBUG    | __main__:trials:24 - Trial = 7349/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.146 | DEBUG    | __main__:trials:29 - Trial = 7349/30000 | Total reward = 43.66
2022-01-26 14:17:00.149 | DEBUG    | __main__:trials:24 - Trial = 7350/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.150 | DEBUG    | __main__:trials:29 - Trial = 7350/30000 | Total reward = 44.29
2022-01-26 14:17:00.154 | DEBUG    | __main__:trials:24 - Trial = 7351/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.156 | DEBUG    | __main__:trials:29 - Trial = 7351/30000 | Total reward = 42.06
2022-01-26 14:17:00.159 | DEBUG    | __main__:trials:24 - Trial = 7352/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.161 | DEBUG    | __main__:trials:29 - Trial = 7352/30000 | Total reward = 38.15
2022-01-26 14:17:00.164 | DEBUG    | __main__:trials:24 - Trial = 7353/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.166 | DEBUG    | __main__:trials:29 - Trial = 7353/30000 | Total reward = 50.29
2022-01-26 14:17:00.169 | DEBUG    | __main__:trials:24 - Trial = 7354/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.171 | DEBUG    | __main__:trials:29 - Trial = 7354/30000 | Total reward = 48.15
2022-01-26 14:17:00.175 | DEBUG    | __main__:trials:24 - Trial = 7355/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.176 | DEBUG    | __main__:trials:29 - Trial = 7355/30000 | Total reward = 54.17
2022-01-26 14:17:00.180 | DEBUG    | __main__:trials:24 - Trial = 7356/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.181 | DEBUG    | __main__:trials:29 - Trial = 7356/30000 | Total reward = 38.85
2022-01-26 14:17:00.185 | DEBUG    | __main__:trials:24 - Trial = 7357/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.187 | DEBUG    | __main__:trials:29 - Trial = 7357/30000 | Total reward = 38.28
2022-01-26 14:17:00.191 | DEBUG    | __main__:trials:24 - Trial = 7358/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.192 | DEBUG    | __main__:trials:29 - Trial = 7358/30000 | Total reward = 47.04
2022-01-26 14:17:00.196 | DEBUG    | __main__:trials:24 - Trial = 7359/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.197 | DEBUG    | __main__:trials:29 - Trial = 7359/30000 | Total reward = 40.27
2022-01-26 14:17:00.200 | DEBUG    | __main__:trials:24 - Trial = 7360/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.202 | DEBUG    | __main__:trials:29 - Trial = 7360/30000 | Total reward = 48.07
2022-01-26 14:17:00.206 | DEBUG    | __main__:trials:24 - Trial = 7361/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.207 | DEBUG    | __main__:trials:29 - Trial = 7361/30000 | Total reward = 41.38
2022-01-26 14:17:00.211 | DEBUG    | __main__:trials:24 - Trial = 7362/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.212 | DEBUG    | __main__:trials:29 - Trial = 7362/30000 | Total reward = 44.92
2022-01-26 14:17:00.216 | DEBUG    | __main__:trials:24 - Trial = 7363/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.217 | DEBUG    | __main__:trials:29 - Trial = 7363/30000 | Total reward = 36.15
2022-01-26 14:17:00.221 | DEBUG    | __main__:trials:24 - Trial = 7364/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.222 | DEBUG    | __main__:trials:29 - Trial = 7364/30000 | Total reward = 40.69
2022-01-26 14:17:00.226 | DEBUG    | __main__:trials:24 - Trial = 7365/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.228 | DEBUG    | __main__:trials:29 - Trial = 7365/30000 | Total reward = 45.73
2022-01-26 14:17:00.231 | DEBUG    | __main__:trials:24 - Trial = 7366/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.232 | DEBUG    | __main__:trials:29 - Trial = 7366/30000 | Total reward = 42.09
2022-01-26 14:17:00.236 | DEBUG    | __main__:trials:24 - Trial = 7367/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.238 | DEBUG    | __main__:trials:29 - Trial = 7367/30000 | Total reward = 43.28
2022-01-26 14:17:00.241 | DEBUG    | __main__:trials:24 - Trial = 7368/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.242 | DEBUG    | __main__:trials:29 - Trial = 7368/30000 | Total reward = 40.54
2022-01-26 14:17:00.246 | DEBUG    | __main__:trials:24 - Trial = 7369/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.248 | DEBUG    | __main__:trials:29 - Trial = 7369/30000 | Total reward = 35.31
2022-01-26 14:17:00.251 | DEBUG    | __main__:trials:24 - Trial = 7370/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.253 | DEBUG    | __main__:trials:29 - Trial = 7370/30000 | Total reward = 38.66
2022-01-26 14:17:00.256 | DEBUG    | __main__:trials:24 - Trial = 7371/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.257 | DEBUG    | __main__:trials:29 - Trial = 7371/30000 | Total reward = 38.50
2022-01-26 14:17:00.260 | DEBUG    | __main__:trials:26 - Trial = 7372/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:00.261 | DEBUG    | __main__:trials:29 - Trial = 7372/30000 | Total reward = 21.59
2022-01-26 14:17:00.265 | DEBUG    | __main__:trials:24 - Trial = 7373/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.266 | DEBUG    | __main__:trials:29 - Trial = 7373/30000 | Total reward = 37.00
2022-01-26 14:17:00.270 | DEBUG    | __main__:trials:24 - Trial = 7374/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.272 | DEBUG    | __main__:trials:29 - Trial = 7374/30000 | Total reward = 44.49
2022-01-26 14:17:00.275 | DEBUG    | __main__:trials:24 - Trial = 7375/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.277 | DEBUG    | __main__:trials:29 - Trial = 7375/30000 | Total reward = 42.05
2022-01-26 14:17:00.281 | DEBUG    | __main__:trials:24 - Trial = 7376/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.282 | DEBUG    | __main__:trials:29 - Trial = 7376/30000 | Total reward = 40.75
2022-01-26 14:17:00.285 | DEBUG    | __main__:trials:24 - Trial = 7377/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.286 | DEBUG    | __main__:trials:29 - Trial = 7377/30000 | Total reward = 45.22
2022-01-26 14:17:00.289 | DEBUG    | __main__:trials:24 - Trial = 7378/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.290 | DEBUG    | __main__:trials:29 - Trial = 7378/30000 | Total reward = 40.31
2022-01-26 14:17:00.293 | DEBUG    | __main__:trials:24 - Trial = 7379/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.294 | DEBUG    | __main__:trials:29 - Trial = 7379/30000 | Total reward = 39.10
2022-01-26 14:17:00.297 | DEBUG    | __main__:trials:24 - Trial = 7380/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.299 | DEBUG    | __main__:trials:29 - Trial = 7380/30000 | Total reward = 39.58
2022-01-26 14:17:00.302 | DEBUG    | __main__:trials:24 - Trial = 7381/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.303 | DEBUG    | __main__:trials:29 - Trial = 7381/30000 | Total reward = 59.17
2022-01-26 14:17:00.306 | DEBUG    | __main__:trials:24 - Trial = 7382/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.307 | DEBUG    | __main__:trials:29 - Trial = 7382/30000 | Total reward = 52.32
2022-01-26 14:17:00.310 | DEBUG    | __main__:trials:26 - Trial = 7383/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:00.311 | DEBUG    | __main__:trials:29 - Trial = 7383/30000 | Total reward = 29.87
2022-01-26 14:17:00.314 | DEBUG    | __main__:trials:24 - Trial = 7384/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.316 | DEBUG    | __main__:trials:29 - Trial = 7384/30000 | Total reward = 41.94
2022-01-26 14:17:00.320 | DEBUG    | __main__:trials:24 - Trial = 7385/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.322 | DEBUG    | __main__:trials:29 - Trial = 7385/30000 | Total reward = 43.97
2022-01-26 14:17:00.325 | DEBUG    | __main__:trials:24 - Trial = 7386/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.327 | DEBUG    | __main__:trials:29 - Trial = 7386/30000 | Total reward = 43.04
2022-01-26 14:17:00.330 | DEBUG    | __main__:trials:24 - Trial = 7387/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.331 | DEBUG    | __main__:trials:29 - Trial = 7387/30000 | Total reward = 48.87
2022-01-26 14:17:00.335 | DEBUG    | __main__:trials:24 - Trial = 7388/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.337 | DEBUG    | __main__:trials:29 - Trial = 7388/30000 | Total reward = 40.54
2022-01-26 14:17:00.340 | DEBUG    | __main__:trials:24 - Trial = 7389/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.342 | DEBUG    | __main__:trials:29 - Trial = 7389/30000 | Total reward = 40.66
2022-01-26 14:17:00.346 | DEBUG    | __main__:trials:24 - Trial = 7390/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.347 | DEBUG    | __main__:trials:29 - Trial = 7390/30000 | Total reward = 40.63
2022-01-26 14:17:00.351 | DEBUG    | __main__:trials:24 - Trial = 7391/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.353 | DEBUG    | __main__:trials:29 - Trial = 7391/30000 | Total reward = 36.70
2022-01-26 14:17:00.356 | DEBUG    | __main__:trials:24 - Trial = 7392/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.358 | DEBUG    | __main__:trials:29 - Trial = 7392/30000 | Total reward = 48.29
2022-01-26 14:17:00.362 | DEBUG    | __main__:trials:24 - Trial = 7393/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.363 | DEBUG    | __main__:trials:29 - Trial = 7393/30000 | Total reward = 51.01
2022-01-26 14:17:00.367 | DEBUG    | __main__:trials:24 - Trial = 7394/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.368 | DEBUG    | __main__:trials:29 - Trial = 7394/30000 | Total reward = 43.51
2022-01-26 14:17:00.372 | DEBUG    | __main__:trials:24 - Trial = 7395/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.373 | DEBUG    | __main__:trials:29 - Trial = 7395/30000 | Total reward = 40.62
2022-01-26 14:17:00.377 | DEBUG    | __main__:trials:24 - Trial = 7396/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.379 | DEBUG    | __main__:trials:29 - Trial = 7396/30000 | Total reward = 34.09
2022-01-26 14:17:00.383 | DEBUG    | __main__:trials:24 - Trial = 7397/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.384 | DEBUG    | __main__:trials:29 - Trial = 7397/30000 | Total reward = 41.49
2022-01-26 14:17:00.387 | DEBUG    | __main__:trials:26 - Trial = 7398/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:00.389 | DEBUG    | __main__:trials:29 - Trial = 7398/30000 | Total reward = 19.31
2022-01-26 14:17:00.392 | DEBUG    | __main__:trials:24 - Trial = 7399/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.394 | DEBUG    | __main__:trials:29 - Trial = 7399/30000 | Total reward = 49.75
2022-01-26 14:17:00.398 | DEBUG    | __main__:trials:24 - Trial = 7400/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.399 | DEBUG    | __main__:trials:29 - Trial = 7400/30000 | Total reward = 46.63
2022-01-26 14:17:00.403 | DEBUG    | __main__:trials:24 - Trial = 7401/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.404 | DEBUG    | __main__:trials:29 - Trial = 7401/30000 | Total reward = 38.85
2022-01-26 14:17:00.408 | DEBUG    | __main__:trials:24 - Trial = 7402/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.410 | DEBUG    | __main__:trials:29 - Trial = 7402/30000 | Total reward = 50.96
2022-01-26 14:17:00.414 | DEBUG    | __main__:trials:24 - Trial = 7403/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.415 | DEBUG    | __main__:trials:29 - Trial = 7403/30000 | Total reward = 34.85
2022-01-26 14:17:00.419 | DEBUG    | __main__:trials:24 - Trial = 7404/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.420 | DEBUG    | __main__:trials:29 - Trial = 7404/30000 | Total reward = 32.41
2022-01-26 14:17:00.423 | DEBUG    | __main__:trials:24 - Trial = 7405/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.425 | DEBUG    | __main__:trials:29 - Trial = 7405/30000 | Total reward = 48.68
2022-01-26 14:17:00.428 | DEBUG    | __main__:trials:24 - Trial = 7406/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.430 | DEBUG    | __main__:trials:29 - Trial = 7406/30000 | Total reward = 38.29
2022-01-26 14:17:00.433 | DEBUG    | __main__:trials:24 - Trial = 7407/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.434 | DEBUG    | __main__:trials:29 - Trial = 7407/30000 | Total reward = 56.04
2022-01-26 14:17:00.437 | DEBUG    | __main__:trials:24 - Trial = 7408/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.438 | DEBUG    | __main__:trials:29 - Trial = 7408/30000 | Total reward = 37.32
2022-01-26 14:17:00.441 | DEBUG    | __main__:trials:24 - Trial = 7409/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.442 | DEBUG    | __main__:trials:29 - Trial = 7409/30000 | Total reward = 37.18
2022-01-26 14:17:00.445 | DEBUG    | __main__:trials:24 - Trial = 7410/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.447 | DEBUG    | __main__:trials:29 - Trial = 7410/30000 | Total reward = 60.04
2022-01-26 14:17:00.451 | DEBUG    | __main__:trials:24 - Trial = 7411/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.452 | DEBUG    | __main__:trials:29 - Trial = 7411/30000 | Total reward = 45.77
2022-01-26 14:17:00.456 | DEBUG    | __main__:trials:24 - Trial = 7412/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.457 | DEBUG    | __main__:trials:29 - Trial = 7412/30000 | Total reward = 42.72
2022-01-26 14:17:00.460 | DEBUG    | __main__:trials:24 - Trial = 7413/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.462 | DEBUG    | __main__:trials:29 - Trial = 7413/30000 | Total reward = 42.13
2022-01-26 14:17:00.465 | DEBUG    | __main__:trials:24 - Trial = 7414/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.467 | DEBUG    | __main__:trials:29 - Trial = 7414/30000 | Total reward = 47.96
2022-01-26 14:17:00.471 | DEBUG    | __main__:trials:24 - Trial = 7415/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.472 | DEBUG    | __main__:trials:29 - Trial = 7415/30000 | Total reward = 37.46
2022-01-26 14:17:00.476 | DEBUG    | __main__:trials:24 - Trial = 7416/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.477 | DEBUG    | __main__:trials:29 - Trial = 7416/30000 | Total reward = 45.71
2022-01-26 14:17:00.481 | DEBUG    | __main__:trials:24 - Trial = 7417/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.482 | DEBUG    | __main__:trials:29 - Trial = 7417/30000 | Total reward = 36.84
2022-01-26 14:17:00.487 | DEBUG    | __main__:trials:24 - Trial = 7418/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.487 | DEBUG    | __main__:trials:29 - Trial = 7418/30000 | Total reward = 51.14
2022-01-26 14:17:00.491 | DEBUG    | __main__:trials:24 - Trial = 7419/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.493 | DEBUG    | __main__:trials:29 - Trial = 7419/30000 | Total reward = 51.52
2022-01-26 14:17:00.496 | DEBUG    | __main__:trials:24 - Trial = 7420/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.497 | DEBUG    | __main__:trials:29 - Trial = 7420/30000 | Total reward = 42.02
2022-01-26 14:17:00.502 | DEBUG    | __main__:trials:24 - Trial = 7421/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.502 | DEBUG    | __main__:trials:29 - Trial = 7421/30000 | Total reward = 41.51
2022-01-26 14:17:00.506 | DEBUG    | __main__:trials:24 - Trial = 7422/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.508 | DEBUG    | __main__:trials:29 - Trial = 7422/30000 | Total reward = 37.91
2022-01-26 14:17:00.512 | DEBUG    | __main__:trials:24 - Trial = 7423/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.513 | DEBUG    | __main__:trials:29 - Trial = 7423/30000 | Total reward = 56.23
2022-01-26 14:17:00.516 | DEBUG    | __main__:trials:24 - Trial = 7424/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.518 | DEBUG    | __main__:trials:29 - Trial = 7424/30000 | Total reward = 36.88
2022-01-26 14:17:00.521 | DEBUG    | __main__:trials:24 - Trial = 7425/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.523 | DEBUG    | __main__:trials:29 - Trial = 7425/30000 | Total reward = 34.39
2022-01-26 14:17:00.527 | DEBUG    | __main__:trials:24 - Trial = 7426/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.527 | DEBUG    | __main__:trials:29 - Trial = 7426/30000 | Total reward = 56.09
2022-01-26 14:17:00.532 | DEBUG    | __main__:trials:24 - Trial = 7427/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.533 | DEBUG    | __main__:trials:29 - Trial = 7427/30000 | Total reward = 35.38
2022-01-26 14:17:00.537 | DEBUG    | __main__:trials:24 - Trial = 7428/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.538 | DEBUG    | __main__:trials:29 - Trial = 7428/30000 | Total reward = 35.35
2022-01-26 14:17:00.541 | DEBUG    | __main__:trials:24 - Trial = 7429/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.542 | DEBUG    | __main__:trials:29 - Trial = 7429/30000 | Total reward = 35.23
2022-01-26 14:17:00.546 | DEBUG    | __main__:trials:24 - Trial = 7430/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.547 | DEBUG    | __main__:trials:29 - Trial = 7430/30000 | Total reward = 27.58
2022-01-26 14:17:00.551 | DEBUG    | __main__:trials:24 - Trial = 7431/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.551 | DEBUG    | __main__:trials:29 - Trial = 7431/30000 | Total reward = 35.15
2022-01-26 14:17:00.556 | DEBUG    | __main__:trials:24 - Trial = 7432/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.558 | DEBUG    | __main__:trials:29 - Trial = 7432/30000 | Total reward = 32.22
2022-01-26 14:17:00.561 | DEBUG    | __main__:trials:24 - Trial = 7433/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.562 | DEBUG    | __main__:trials:29 - Trial = 7433/30000 | Total reward = 44.37
2022-01-26 14:17:00.566 | DEBUG    | __main__:trials:24 - Trial = 7434/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.567 | DEBUG    | __main__:trials:29 - Trial = 7434/30000 | Total reward = 62.02
2022-01-26 14:17:00.571 | DEBUG    | __main__:trials:24 - Trial = 7435/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.573 | DEBUG    | __main__:trials:29 - Trial = 7435/30000 | Total reward = 31.32
2022-01-26 14:17:00.576 | DEBUG    | __main__:trials:24 - Trial = 7436/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.577 | DEBUG    | __main__:trials:29 - Trial = 7436/30000 | Total reward = 55.28
2022-01-26 14:17:00.581 | DEBUG    | __main__:trials:24 - Trial = 7437/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.582 | DEBUG    | __main__:trials:29 - Trial = 7437/30000 | Total reward = 42.04
2022-01-26 14:17:00.585 | DEBUG    | __main__:trials:24 - Trial = 7438/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.586 | DEBUG    | __main__:trials:29 - Trial = 7438/30000 | Total reward = 42.94
2022-01-26 14:17:00.589 | DEBUG    | __main__:trials:24 - Trial = 7439/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.590 | DEBUG    | __main__:trials:29 - Trial = 7439/30000 | Total reward = 34.84
2022-01-26 14:17:00.594 | DEBUG    | __main__:trials:24 - Trial = 7440/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.594 | DEBUG    | __main__:trials:29 - Trial = 7440/30000 | Total reward = 38.86
2022-01-26 14:17:00.598 | DEBUG    | __main__:trials:24 - Trial = 7441/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.600 | DEBUG    | __main__:trials:29 - Trial = 7441/30000 | Total reward = 30.92
2022-01-26 14:17:00.603 | DEBUG    | __main__:trials:24 - Trial = 7442/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.604 | DEBUG    | __main__:trials:29 - Trial = 7442/30000 | Total reward = 44.47
2022-01-26 14:17:00.608 | DEBUG    | __main__:trials:24 - Trial = 7443/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.609 | DEBUG    | __main__:trials:29 - Trial = 7443/30000 | Total reward = 35.23
2022-01-26 14:17:00.612 | DEBUG    | __main__:trials:24 - Trial = 7444/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.614 | DEBUG    | __main__:trials:29 - Trial = 7444/30000 | Total reward = 50.42
2022-01-26 14:17:00.618 | DEBUG    | __main__:trials:24 - Trial = 7445/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.619 | DEBUG    | __main__:trials:29 - Trial = 7445/30000 | Total reward = 48.27
2022-01-26 14:17:00.624 | DEBUG    | __main__:trials:24 - Trial = 7446/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.625 | DEBUG    | __main__:trials:29 - Trial = 7446/30000 | Total reward = 44.53
2022-01-26 14:17:00.629 | DEBUG    | __main__:trials:24 - Trial = 7447/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.630 | DEBUG    | __main__:trials:29 - Trial = 7447/30000 | Total reward = 34.54
2022-01-26 14:17:00.634 | DEBUG    | __main__:trials:24 - Trial = 7448/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.636 | DEBUG    | __main__:trials:29 - Trial = 7448/30000 | Total reward = 35.03
2022-01-26 14:17:00.639 | DEBUG    | __main__:trials:24 - Trial = 7449/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.641 | DEBUG    | __main__:trials:29 - Trial = 7449/30000 | Total reward = 44.92
2022-01-26 14:17:00.644 | DEBUG    | __main__:trials:24 - Trial = 7450/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.646 | DEBUG    | __main__:trials:29 - Trial = 7450/30000 | Total reward = 34.30
2022-01-26 14:17:00.650 | DEBUG    | __main__:trials:24 - Trial = 7451/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.650 | DEBUG    | __main__:trials:29 - Trial = 7451/30000 | Total reward = 47.03
2022-01-26 14:17:00.655 | DEBUG    | __main__:trials:24 - Trial = 7452/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.656 | DEBUG    | __main__:trials:29 - Trial = 7452/30000 | Total reward = 28.89
2022-01-26 14:17:00.660 | DEBUG    | __main__:trials:24 - Trial = 7453/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.662 | DEBUG    | __main__:trials:29 - Trial = 7453/30000 | Total reward = 28.91
2022-01-26 14:17:00.665 | DEBUG    | __main__:trials:24 - Trial = 7454/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.666 | DEBUG    | __main__:trials:29 - Trial = 7454/30000 | Total reward = 40.49
2022-01-26 14:17:00.671 | DEBUG    | __main__:trials:24 - Trial = 7455/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.672 | DEBUG    | __main__:trials:29 - Trial = 7455/30000 | Total reward = 43.03
2022-01-26 14:17:00.677 | DEBUG    | __main__:trials:24 - Trial = 7456/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.678 | DEBUG    | __main__:trials:29 - Trial = 7456/30000 | Total reward = 47.50
2022-01-26 14:17:00.682 | DEBUG    | __main__:trials:24 - Trial = 7457/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.684 | DEBUG    | __main__:trials:29 - Trial = 7457/30000 | Total reward = 38.91
2022-01-26 14:17:00.688 | DEBUG    | __main__:trials:24 - Trial = 7458/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.689 | DEBUG    | __main__:trials:29 - Trial = 7458/30000 | Total reward = 42.39
2022-01-26 14:17:00.693 | DEBUG    | __main__:trials:24 - Trial = 7459/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.694 | DEBUG    | __main__:trials:29 - Trial = 7459/30000 | Total reward = 41.49
2022-01-26 14:17:00.697 | DEBUG    | __main__:trials:24 - Trial = 7460/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.698 | DEBUG    | __main__:trials:29 - Trial = 7460/30000 | Total reward = 39.08
2022-01-26 14:17:00.703 | DEBUG    | __main__:trials:24 - Trial = 7461/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.705 | DEBUG    | __main__:trials:29 - Trial = 7461/30000 | Total reward = 41.65
2022-01-26 14:17:00.708 | DEBUG    | __main__:trials:24 - Trial = 7462/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.709 | DEBUG    | __main__:trials:29 - Trial = 7462/30000 | Total reward = 37.83
2022-01-26 14:17:00.713 | DEBUG    | __main__:trials:24 - Trial = 7463/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.715 | DEBUG    | __main__:trials:29 - Trial = 7463/30000 | Total reward = 43.36
2022-01-26 14:17:00.719 | DEBUG    | __main__:trials:24 - Trial = 7464/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.720 | DEBUG    | __main__:trials:29 - Trial = 7464/30000 | Total reward = 40.51
2022-01-26 14:17:00.726 | DEBUG    | __main__:trials:24 - Trial = 7465/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.727 | DEBUG    | __main__:trials:29 - Trial = 7465/30000 | Total reward = 39.03
2022-01-26 14:17:00.732 | DEBUG    | __main__:trials:24 - Trial = 7466/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.733 | DEBUG    | __main__:trials:29 - Trial = 7466/30000 | Total reward = 34.42
2022-01-26 14:17:00.737 | DEBUG    | __main__:trials:24 - Trial = 7467/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.738 | DEBUG    | __main__:trials:29 - Trial = 7467/30000 | Total reward = 45.25
2022-01-26 14:17:00.742 | DEBUG    | __main__:trials:24 - Trial = 7468/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.744 | DEBUG    | __main__:trials:29 - Trial = 7468/30000 | Total reward = 55.62
2022-01-26 14:17:00.747 | DEBUG    | __main__:trials:26 - Trial = 7469/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:00.748 | DEBUG    | __main__:trials:29 - Trial = 7469/30000 | Total reward = 28.70
2022-01-26 14:17:00.751 | DEBUG    | __main__:trials:24 - Trial = 7470/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.753 | DEBUG    | __main__:trials:29 - Trial = 7470/30000 | Total reward = 35.23
2022-01-26 14:17:00.757 | DEBUG    | __main__:trials:24 - Trial = 7471/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.758 | DEBUG    | __main__:trials:29 - Trial = 7471/30000 | Total reward = 37.80
2022-01-26 14:17:00.761 | DEBUG    | __main__:trials:24 - Trial = 7472/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.761 | DEBUG    | __main__:trials:29 - Trial = 7472/30000 | Total reward = 42.50
2022-01-26 14:17:00.766 | DEBUG    | __main__:trials:24 - Trial = 7473/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.768 | DEBUG    | __main__:trials:29 - Trial = 7473/30000 | Total reward = 37.50
2022-01-26 14:17:00.771 | DEBUG    | __main__:trials:24 - Trial = 7474/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.772 | DEBUG    | __main__:trials:29 - Trial = 7474/30000 | Total reward = 35.23
2022-01-26 14:17:00.776 | DEBUG    | __main__:trials:24 - Trial = 7475/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.777 | DEBUG    | __main__:trials:29 - Trial = 7475/30000 | Total reward = 35.23
2022-01-26 14:17:00.781 | DEBUG    | __main__:trials:24 - Trial = 7476/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.783 | DEBUG    | __main__:trials:29 - Trial = 7476/30000 | Total reward = 32.98
2022-01-26 14:17:00.786 | DEBUG    | __main__:trials:24 - Trial = 7477/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.787 | DEBUG    | __main__:trials:29 - Trial = 7477/30000 | Total reward = 43.83
2022-01-26 14:17:00.791 | DEBUG    | __main__:trials:24 - Trial = 7478/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.793 | DEBUG    | __main__:trials:29 - Trial = 7478/30000 | Total reward = 51.86
2022-01-26 14:17:00.796 | DEBUG    | __main__:trials:24 - Trial = 7479/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.798 | DEBUG    | __main__:trials:29 - Trial = 7479/30000 | Total reward = 38.43
2022-01-26 14:17:00.802 | DEBUG    | __main__:trials:24 - Trial = 7480/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.803 | DEBUG    | __main__:trials:29 - Trial = 7480/30000 | Total reward = 35.35
2022-01-26 14:17:00.807 | DEBUG    | __main__:trials:24 - Trial = 7481/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.808 | DEBUG    | __main__:trials:29 - Trial = 7481/30000 | Total reward = 39.42
2022-01-26 14:17:00.812 | DEBUG    | __main__:trials:24 - Trial = 7482/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.813 | DEBUG    | __main__:trials:29 - Trial = 7482/30000 | Total reward = 48.35
2022-01-26 14:17:00.816 | DEBUG    | __main__:trials:24 - Trial = 7483/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.818 | DEBUG    | __main__:trials:29 - Trial = 7483/30000 | Total reward = 39.94
2022-01-26 14:17:00.822 | DEBUG    | __main__:trials:24 - Trial = 7484/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.823 | DEBUG    | __main__:trials:29 - Trial = 7484/30000 | Total reward = 54.73
2022-01-26 14:17:00.827 | DEBUG    | __main__:trials:24 - Trial = 7485/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.829 | DEBUG    | __main__:trials:29 - Trial = 7485/30000 | Total reward = 44.73
2022-01-26 14:17:00.832 | DEBUG    | __main__:trials:24 - Trial = 7486/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.833 | DEBUG    | __main__:trials:29 - Trial = 7486/30000 | Total reward = 43.54
2022-01-26 14:17:00.837 | DEBUG    | __main__:trials:24 - Trial = 7487/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.838 | DEBUG    | __main__:trials:29 - Trial = 7487/30000 | Total reward = 38.71
2022-01-26 14:17:00.841 | DEBUG    | __main__:trials:24 - Trial = 7488/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.842 | DEBUG    | __main__:trials:29 - Trial = 7488/30000 | Total reward = 31.02
2022-01-26 14:17:00.845 | DEBUG    | __main__:trials:24 - Trial = 7489/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.847 | DEBUG    | __main__:trials:29 - Trial = 7489/30000 | Total reward = 44.60
2022-01-26 14:17:00.850 | DEBUG    | __main__:trials:24 - Trial = 7490/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.852 | DEBUG    | __main__:trials:29 - Trial = 7490/30000 | Total reward = 35.15
2022-01-26 14:17:00.855 | DEBUG    | __main__:trials:24 - Trial = 7491/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.858 | DEBUG    | __main__:trials:29 - Trial = 7491/30000 | Total reward = 34.31
2022-01-26 14:17:00.860 | DEBUG    | __main__:trials:24 - Trial = 7492/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.861 | DEBUG    | __main__:trials:29 - Trial = 7492/30000 | Total reward = 40.22
2022-01-26 14:17:00.864 | DEBUG    | __main__:trials:24 - Trial = 7493/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.865 | DEBUG    | __main__:trials:29 - Trial = 7493/30000 | Total reward = 34.01
2022-01-26 14:17:00.868 | DEBUG    | __main__:trials:24 - Trial = 7494/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.870 | DEBUG    | __main__:trials:29 - Trial = 7494/30000 | Total reward = 47.61
2022-01-26 14:17:00.873 | DEBUG    | __main__:trials:24 - Trial = 7495/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.875 | DEBUG    | __main__:trials:29 - Trial = 7495/30000 | Total reward = 34.39
2022-01-26 14:17:00.879 | DEBUG    | __main__:trials:24 - Trial = 7496/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.879 | DEBUG    | __main__:trials:29 - Trial = 7496/30000 | Total reward = 44.30
2022-01-26 14:17:00.884 | DEBUG    | __main__:trials:24 - Trial = 7497/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.885 | DEBUG    | __main__:trials:29 - Trial = 7497/30000 | Total reward = 32.14
2022-01-26 14:17:00.889 | DEBUG    | __main__:trials:24 - Trial = 7498/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.891 | DEBUG    | __main__:trials:29 - Trial = 7498/30000 | Total reward = 53.24
2022-01-26 14:17:00.894 | DEBUG    | __main__:trials:24 - Trial = 7499/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.896 | DEBUG    | __main__:trials:29 - Trial = 7499/30000 | Total reward = 47.39
2022-01-26 14:17:00.899 | DEBUG    | __main__:trials:24 - Trial = 7500/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.900 | DEBUG    | __main__:trials:29 - Trial = 7500/30000 | Total reward = 35.91
2022-01-26 14:17:00.904 | DEBUG    | __main__:trials:24 - Trial = 7501/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.905 | DEBUG    | __main__:trials:29 - Trial = 7501/30000 | Total reward = 48.87
2022-01-26 14:17:00.908 | DEBUG    | __main__:trials:24 - Trial = 7502/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.910 | DEBUG    | __main__:trials:29 - Trial = 7502/30000 | Total reward = 62.59
2022-01-26 14:17:00.913 | DEBUG    | __main__:trials:24 - Trial = 7503/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.914 | DEBUG    | __main__:trials:29 - Trial = 7503/30000 | Total reward = 43.34
2022-01-26 14:17:00.918 | DEBUG    | __main__:trials:24 - Trial = 7504/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.920 | DEBUG    | __main__:trials:29 - Trial = 7504/30000 | Total reward = 31.93
2022-01-26 14:17:00.923 | DEBUG    | __main__:trials:24 - Trial = 7505/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.924 | DEBUG    | __main__:trials:29 - Trial = 7505/30000 | Total reward = 41.84
2022-01-26 14:17:00.927 | DEBUG    | __main__:trials:24 - Trial = 7506/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.929 | DEBUG    | __main__:trials:29 - Trial = 7506/30000 | Total reward = 32.90
2022-01-26 14:17:00.932 | DEBUG    | __main__:trials:24 - Trial = 7507/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.934 | DEBUG    | __main__:trials:29 - Trial = 7507/30000 | Total reward = 42.80
2022-01-26 14:17:00.937 | DEBUG    | __main__:trials:24 - Trial = 7508/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.939 | DEBUG    | __main__:trials:29 - Trial = 7508/30000 | Total reward = 36.10
2022-01-26 14:17:00.942 | DEBUG    | __main__:trials:24 - Trial = 7509/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.944 | DEBUG    | __main__:trials:29 - Trial = 7509/30000 | Total reward = 49.34
2022-01-26 14:17:00.947 | DEBUG    | __main__:trials:24 - Trial = 7510/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.949 | DEBUG    | __main__:trials:29 - Trial = 7510/30000 | Total reward = 41.82
2022-01-26 14:17:00.952 | DEBUG    | __main__:trials:24 - Trial = 7511/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.954 | DEBUG    | __main__:trials:29 - Trial = 7511/30000 | Total reward = 31.51
2022-01-26 14:17:00.958 | DEBUG    | __main__:trials:24 - Trial = 7512/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.960 | DEBUG    | __main__:trials:29 - Trial = 7512/30000 | Total reward = 46.31
2022-01-26 14:17:00.963 | DEBUG    | __main__:trials:24 - Trial = 7513/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.964 | DEBUG    | __main__:trials:29 - Trial = 7513/30000 | Total reward = 39.62
2022-01-26 14:17:00.968 | DEBUG    | __main__:trials:24 - Trial = 7514/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.969 | DEBUG    | __main__:trials:29 - Trial = 7514/30000 | Total reward = 35.23
2022-01-26 14:17:00.974 | DEBUG    | __main__:trials:24 - Trial = 7515/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.975 | DEBUG    | __main__:trials:29 - Trial = 7515/30000 | Total reward = 35.73
2022-01-26 14:17:00.979 | DEBUG    | __main__:trials:24 - Trial = 7516/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.981 | DEBUG    | __main__:trials:29 - Trial = 7516/30000 | Total reward = 49.42
2022-01-26 14:17:00.984 | DEBUG    | __main__:trials:24 - Trial = 7517/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.986 | DEBUG    | __main__:trials:29 - Trial = 7517/30000 | Total reward = 56.07
2022-01-26 14:17:00.989 | DEBUG    | __main__:trials:24 - Trial = 7518/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.990 | DEBUG    | __main__:trials:29 - Trial = 7518/30000 | Total reward = 50.00
2022-01-26 14:17:00.994 | DEBUG    | __main__:trials:24 - Trial = 7519/30000 | Max number of steps (20) reached
2022-01-26 14:17:00.996 | DEBUG    | __main__:trials:29 - Trial = 7519/30000 | Total reward = 40.25
2022-01-26 14:17:01.000 | DEBUG    | __main__:trials:24 - Trial = 7520/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.000 | DEBUG    | __main__:trials:29 - Trial = 7520/30000 | Total reward = 35.15
2022-01-26 14:17:01.004 | DEBUG    | __main__:trials:24 - Trial = 7521/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.006 | DEBUG    | __main__:trials:29 - Trial = 7521/30000 | Total reward = 55.68
2022-01-26 14:17:01.009 | DEBUG    | __main__:trials:24 - Trial = 7522/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.010 | DEBUG    | __main__:trials:29 - Trial = 7522/30000 | Total reward = 43.32
2022-01-26 14:17:01.013 | DEBUG    | __main__:trials:24 - Trial = 7523/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.015 | DEBUG    | __main__:trials:29 - Trial = 7523/30000 | Total reward = 28.81
2022-01-26 14:17:01.018 | DEBUG    | __main__:trials:24 - Trial = 7524/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.018 | DEBUG    | __main__:trials:29 - Trial = 7524/30000 | Total reward = 27.08
2022-01-26 14:17:01.022 | DEBUG    | __main__:trials:24 - Trial = 7525/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.022 | DEBUG    | __main__:trials:29 - Trial = 7525/30000 | Total reward = 35.35
2022-01-26 14:17:01.026 | DEBUG    | __main__:trials:24 - Trial = 7526/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.028 | DEBUG    | __main__:trials:29 - Trial = 7526/30000 | Total reward = 35.23
2022-01-26 14:17:01.030 | DEBUG    | __main__:trials:24 - Trial = 7527/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.032 | DEBUG    | __main__:trials:29 - Trial = 7527/30000 | Total reward = 34.27
2022-01-26 14:17:01.035 | DEBUG    | __main__:trials:24 - Trial = 7528/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.037 | DEBUG    | __main__:trials:29 - Trial = 7528/30000 | Total reward = 40.69
2022-01-26 14:17:01.041 | DEBUG    | __main__:trials:24 - Trial = 7529/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.041 | DEBUG    | __main__:trials:29 - Trial = 7529/30000 | Total reward = 31.40
2022-01-26 14:17:01.046 | DEBUG    | __main__:trials:24 - Trial = 7530/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.046 | DEBUG    | __main__:trials:29 - Trial = 7530/30000 | Total reward = 35.54
2022-01-26 14:17:01.050 | DEBUG    | __main__:trials:24 - Trial = 7531/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.051 | DEBUG    | __main__:trials:29 - Trial = 7531/30000 | Total reward = 36.39
2022-01-26 14:17:01.055 | DEBUG    | __main__:trials:24 - Trial = 7532/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.056 | DEBUG    | __main__:trials:29 - Trial = 7532/30000 | Total reward = 35.15
2022-01-26 14:17:01.060 | DEBUG    | __main__:trials:24 - Trial = 7533/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.061 | DEBUG    | __main__:trials:29 - Trial = 7533/30000 | Total reward = 51.15
2022-01-26 14:17:01.066 | DEBUG    | __main__:trials:24 - Trial = 7534/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.067 | DEBUG    | __main__:trials:29 - Trial = 7534/30000 | Total reward = 37.66
2022-01-26 14:17:01.071 | DEBUG    | __main__:trials:24 - Trial = 7535/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.073 | DEBUG    | __main__:trials:29 - Trial = 7535/30000 | Total reward = 32.06
2022-01-26 14:17:01.076 | DEBUG    | __main__:trials:24 - Trial = 7536/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.077 | DEBUG    | __main__:trials:29 - Trial = 7536/30000 | Total reward = 55.32
2022-01-26 14:17:01.081 | DEBUG    | __main__:trials:24 - Trial = 7537/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.082 | DEBUG    | __main__:trials:29 - Trial = 7537/30000 | Total reward = 42.92
2022-01-26 14:17:01.085 | DEBUG    | __main__:trials:24 - Trial = 7538/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.086 | DEBUG    | __main__:trials:29 - Trial = 7538/30000 | Total reward = 35.35
2022-01-26 14:17:01.089 | DEBUG    | __main__:trials:24 - Trial = 7539/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.091 | DEBUG    | __main__:trials:29 - Trial = 7539/30000 | Total reward = 35.93
2022-01-26 14:17:01.094 | DEBUG    | __main__:trials:24 - Trial = 7540/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.095 | DEBUG    | __main__:trials:29 - Trial = 7540/30000 | Total reward = 32.22
2022-01-26 14:17:01.099 | DEBUG    | __main__:trials:24 - Trial = 7541/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.101 | DEBUG    | __main__:trials:29 - Trial = 7541/30000 | Total reward = 42.05
2022-01-26 14:17:01.104 | DEBUG    | __main__:trials:24 - Trial = 7542/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.106 | DEBUG    | __main__:trials:29 - Trial = 7542/30000 | Total reward = 47.21
2022-01-26 14:17:01.110 | DEBUG    | __main__:trials:24 - Trial = 7543/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.111 | DEBUG    | __main__:trials:29 - Trial = 7543/30000 | Total reward = 42.39
2022-01-26 14:17:01.115 | DEBUG    | __main__:trials:24 - Trial = 7544/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.116 | DEBUG    | __main__:trials:29 - Trial = 7544/30000 | Total reward = 54.97
2022-01-26 14:17:01.120 | DEBUG    | __main__:trials:24 - Trial = 7545/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.122 | DEBUG    | __main__:trials:29 - Trial = 7545/30000 | Total reward = 39.59
2022-01-26 14:17:01.125 | DEBUG    | __main__:trials:24 - Trial = 7546/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.126 | DEBUG    | __main__:trials:29 - Trial = 7546/30000 | Total reward = 51.48
2022-01-26 14:17:01.130 | DEBUG    | __main__:trials:24 - Trial = 7547/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.131 | DEBUG    | __main__:trials:29 - Trial = 7547/30000 | Total reward = 45.67
2022-01-26 14:17:01.135 | DEBUG    | __main__:trials:24 - Trial = 7548/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.137 | DEBUG    | __main__:trials:29 - Trial = 7548/30000 | Total reward = 51.24
2022-01-26 14:17:01.140 | DEBUG    | __main__:trials:24 - Trial = 7549/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.141 | DEBUG    | __main__:trials:29 - Trial = 7549/30000 | Total reward = 43.07
2022-01-26 14:17:01.146 | DEBUG    | __main__:trials:24 - Trial = 7550/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.147 | DEBUG    | __main__:trials:29 - Trial = 7550/30000 | Total reward = 43.22
2022-01-26 14:17:01.150 | DEBUG    | __main__:trials:24 - Trial = 7551/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.152 | DEBUG    | __main__:trials:29 - Trial = 7551/30000 | Total reward = 48.83
2022-01-26 14:17:01.155 | DEBUG    | __main__:trials:24 - Trial = 7552/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.157 | DEBUG    | __main__:trials:29 - Trial = 7552/30000 | Total reward = 35.79
2022-01-26 14:17:01.160 | DEBUG    | __main__:trials:24 - Trial = 7553/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.161 | DEBUG    | __main__:trials:29 - Trial = 7553/30000 | Total reward = 44.34
2022-01-26 14:17:01.164 | DEBUG    | __main__:trials:24 - Trial = 7554/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.166 | DEBUG    | __main__:trials:29 - Trial = 7554/30000 | Total reward = 34.04
2022-01-26 14:17:01.169 | DEBUG    | __main__:trials:24 - Trial = 7555/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.170 | DEBUG    | __main__:trials:29 - Trial = 7555/30000 | Total reward = 40.31
2022-01-26 14:17:01.173 | DEBUG    | __main__:trials:24 - Trial = 7556/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.174 | DEBUG    | __main__:trials:29 - Trial = 7556/30000 | Total reward = 37.91
2022-01-26 14:17:01.177 | DEBUG    | __main__:trials:24 - Trial = 7557/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.178 | DEBUG    | __main__:trials:29 - Trial = 7557/30000 | Total reward = 47.68
2022-01-26 14:17:01.181 | DEBUG    | __main__:trials:24 - Trial = 7558/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.182 | DEBUG    | __main__:trials:29 - Trial = 7558/30000 | Total reward = 35.11
2022-01-26 14:17:01.185 | DEBUG    | __main__:trials:24 - Trial = 7559/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.186 | DEBUG    | __main__:trials:29 - Trial = 7559/30000 | Total reward = 48.74
2022-01-26 14:17:01.189 | DEBUG    | __main__:trials:24 - Trial = 7560/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.191 | DEBUG    | __main__:trials:29 - Trial = 7560/30000 | Total reward = 41.43
2022-01-26 14:17:01.194 | DEBUG    | __main__:trials:24 - Trial = 7561/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.194 | DEBUG    | __main__:trials:29 - Trial = 7561/30000 | Total reward = 44.29
2022-01-26 14:17:01.197 | DEBUG    | __main__:trials:24 - Trial = 7562/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.198 | DEBUG    | __main__:trials:29 - Trial = 7562/30000 | Total reward = 40.38
2022-01-26 14:17:01.201 | DEBUG    | __main__:trials:24 - Trial = 7563/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.202 | DEBUG    | __main__:trials:29 - Trial = 7563/30000 | Total reward = 41.94
2022-01-26 14:17:01.205 | DEBUG    | __main__:trials:24 - Trial = 7564/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.205 | DEBUG    | __main__:trials:29 - Trial = 7564/30000 | Total reward = 31.40
2022-01-26 14:17:01.209 | DEBUG    | __main__:trials:24 - Trial = 7565/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.210 | DEBUG    | __main__:trials:29 - Trial = 7565/30000 | Total reward = 37.76
2022-01-26 14:17:01.213 | DEBUG    | __main__:trials:24 - Trial = 7566/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.215 | DEBUG    | __main__:trials:29 - Trial = 7566/30000 | Total reward = 60.62
2022-01-26 14:17:01.218 | DEBUG    | __main__:trials:24 - Trial = 7567/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.220 | DEBUG    | __main__:trials:29 - Trial = 7567/30000 | Total reward = 43.24
2022-01-26 14:17:01.223 | DEBUG    | __main__:trials:24 - Trial = 7568/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.224 | DEBUG    | __main__:trials:29 - Trial = 7568/30000 | Total reward = 62.01
2022-01-26 14:17:01.227 | DEBUG    | __main__:trials:24 - Trial = 7569/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.229 | DEBUG    | __main__:trials:29 - Trial = 7569/30000 | Total reward = 40.69
2022-01-26 14:17:01.232 | DEBUG    | __main__:trials:24 - Trial = 7570/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.233 | DEBUG    | __main__:trials:29 - Trial = 7570/30000 | Total reward = 41.51
2022-01-26 14:17:01.236 | DEBUG    | __main__:trials:24 - Trial = 7571/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.238 | DEBUG    | __main__:trials:29 - Trial = 7571/30000 | Total reward = 42.16
2022-01-26 14:17:01.241 | DEBUG    | __main__:trials:24 - Trial = 7572/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.242 | DEBUG    | __main__:trials:29 - Trial = 7572/30000 | Total reward = 41.46
2022-01-26 14:17:01.245 | DEBUG    | __main__:trials:24 - Trial = 7573/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.246 | DEBUG    | __main__:trials:29 - Trial = 7573/30000 | Total reward = 35.35
2022-01-26 14:17:01.249 | DEBUG    | __main__:trials:24 - Trial = 7574/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.251 | DEBUG    | __main__:trials:29 - Trial = 7574/30000 | Total reward = 50.61
2022-01-26 14:17:01.255 | DEBUG    | __main__:trials:24 - Trial = 7575/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.256 | DEBUG    | __main__:trials:29 - Trial = 7575/30000 | Total reward = 38.47
2022-01-26 14:17:01.259 | DEBUG    | __main__:trials:24 - Trial = 7576/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.261 | DEBUG    | __main__:trials:29 - Trial = 7576/30000 | Total reward = 35.35
2022-01-26 14:17:01.264 | DEBUG    | __main__:trials:24 - Trial = 7577/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.266 | DEBUG    | __main__:trials:29 - Trial = 7577/30000 | Total reward = 36.78
2022-01-26 14:17:01.268 | DEBUG    | __main__:trials:26 - Trial = 7578/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:01.270 | DEBUG    | __main__:trials:29 - Trial = 7578/30000 | Total reward = 25.36
2022-01-26 14:17:01.273 | DEBUG    | __main__:trials:24 - Trial = 7579/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.275 | DEBUG    | __main__:trials:29 - Trial = 7579/30000 | Total reward = 43.61
2022-01-26 14:17:01.278 | DEBUG    | __main__:trials:24 - Trial = 7580/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.278 | DEBUG    | __main__:trials:29 - Trial = 7580/30000 | Total reward = 43.50
2022-01-26 14:17:01.282 | DEBUG    | __main__:trials:24 - Trial = 7581/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.282 | DEBUG    | __main__:trials:29 - Trial = 7581/30000 | Total reward = 44.09
2022-01-26 14:17:01.286 | DEBUG    | __main__:trials:24 - Trial = 7582/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.287 | DEBUG    | __main__:trials:29 - Trial = 7582/30000 | Total reward = 42.55
2022-01-26 14:17:01.290 | DEBUG    | __main__:trials:24 - Trial = 7583/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.292 | DEBUG    | __main__:trials:29 - Trial = 7583/30000 | Total reward = 25.34
2022-01-26 14:17:01.296 | DEBUG    | __main__:trials:24 - Trial = 7584/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.298 | DEBUG    | __main__:trials:29 - Trial = 7584/30000 | Total reward = 48.76
2022-01-26 14:17:01.301 | DEBUG    | __main__:trials:24 - Trial = 7585/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.301 | DEBUG    | __main__:trials:29 - Trial = 7585/30000 | Total reward = 42.39
2022-01-26 14:17:01.305 | DEBUG    | __main__:trials:24 - Trial = 7586/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.306 | DEBUG    | __main__:trials:29 - Trial = 7586/30000 | Total reward = 42.07
2022-01-26 14:17:01.309 | DEBUG    | __main__:trials:24 - Trial = 7587/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.310 | DEBUG    | __main__:trials:29 - Trial = 7587/30000 | Total reward = 43.28
2022-01-26 14:17:01.313 | DEBUG    | __main__:trials:24 - Trial = 7588/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.314 | DEBUG    | __main__:trials:29 - Trial = 7588/30000 | Total reward = 38.02
2022-01-26 14:17:01.317 | DEBUG    | __main__:trials:24 - Trial = 7589/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.318 | DEBUG    | __main__:trials:29 - Trial = 7589/30000 | Total reward = 28.73
2022-01-26 14:17:01.321 | DEBUG    | __main__:trials:24 - Trial = 7590/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.323 | DEBUG    | __main__:trials:29 - Trial = 7590/30000 | Total reward = 42.39
2022-01-26 14:17:01.326 | DEBUG    | __main__:trials:24 - Trial = 7591/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.327 | DEBUG    | __main__:trials:29 - Trial = 7591/30000 | Total reward = 41.12
2022-01-26 14:17:01.330 | DEBUG    | __main__:trials:24 - Trial = 7592/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.331 | DEBUG    | __main__:trials:29 - Trial = 7592/30000 | Total reward = 45.48
2022-01-26 14:17:01.334 | DEBUG    | __main__:trials:24 - Trial = 7593/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.336 | DEBUG    | __main__:trials:29 - Trial = 7593/30000 | Total reward = 49.86
2022-01-26 14:17:01.339 | DEBUG    | __main__:trials:24 - Trial = 7594/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.340 | DEBUG    | __main__:trials:29 - Trial = 7594/30000 | Total reward = 44.20
2022-01-26 14:17:01.344 | DEBUG    | __main__:trials:24 - Trial = 7595/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.344 | DEBUG    | __main__:trials:29 - Trial = 7595/30000 | Total reward = 46.65
2022-01-26 14:17:01.348 | DEBUG    | __main__:trials:24 - Trial = 7596/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.349 | DEBUG    | __main__:trials:29 - Trial = 7596/30000 | Total reward = 44.46
2022-01-26 14:17:01.353 | DEBUG    | __main__:trials:24 - Trial = 7597/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.353 | DEBUG    | __main__:trials:29 - Trial = 7597/30000 | Total reward = 44.88
2022-01-26 14:17:01.357 | DEBUG    | __main__:trials:24 - Trial = 7598/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.357 | DEBUG    | __main__:trials:29 - Trial = 7598/30000 | Total reward = 31.69
2022-01-26 14:17:01.361 | DEBUG    | __main__:trials:24 - Trial = 7599/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.362 | DEBUG    | __main__:trials:29 - Trial = 7599/30000 | Total reward = 38.98
2022-01-26 14:17:01.367 | DEBUG    | __main__:trials:24 - Trial = 7600/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.367 | DEBUG    | __main__:trials:29 - Trial = 7600/30000 | Total reward = 45.11
2022-01-26 14:17:01.373 | DEBUG    | __main__:trials:24 - Trial = 7601/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.374 | DEBUG    | __main__:trials:29 - Trial = 7601/30000 | Total reward = 34.21
2022-01-26 14:17:01.377 | DEBUG    | __main__:trials:24 - Trial = 7602/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.379 | DEBUG    | __main__:trials:29 - Trial = 7602/30000 | Total reward = 43.84
2022-01-26 14:17:01.382 | DEBUG    | __main__:trials:24 - Trial = 7603/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.385 | DEBUG    | __main__:trials:29 - Trial = 7603/30000 | Total reward = 44.46
2022-01-26 14:17:01.389 | DEBUG    | __main__:trials:24 - Trial = 7604/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.390 | DEBUG    | __main__:trials:29 - Trial = 7604/30000 | Total reward = 45.92
2022-01-26 14:17:01.393 | DEBUG    | __main__:trials:24 - Trial = 7605/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.394 | DEBUG    | __main__:trials:29 - Trial = 7605/30000 | Total reward = 53.17
2022-01-26 14:17:01.398 | DEBUG    | __main__:trials:24 - Trial = 7606/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.399 | DEBUG    | __main__:trials:29 - Trial = 7606/30000 | Total reward = 51.10
2022-01-26 14:17:01.403 | DEBUG    | __main__:trials:24 - Trial = 7607/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.404 | DEBUG    | __main__:trials:29 - Trial = 7607/30000 | Total reward = 42.61
2022-01-26 14:17:01.408 | DEBUG    | __main__:trials:24 - Trial = 7608/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.410 | DEBUG    | __main__:trials:29 - Trial = 7608/30000 | Total reward = 36.13
2022-01-26 14:17:01.413 | DEBUG    | __main__:trials:24 - Trial = 7609/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.415 | DEBUG    | __main__:trials:29 - Trial = 7609/30000 | Total reward = 49.52
2022-01-26 14:17:01.419 | DEBUG    | __main__:trials:24 - Trial = 7610/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.420 | DEBUG    | __main__:trials:29 - Trial = 7610/30000 | Total reward = 44.86
2022-01-26 14:17:01.424 | DEBUG    | __main__:trials:24 - Trial = 7611/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.425 | DEBUG    | __main__:trials:29 - Trial = 7611/30000 | Total reward = 40.98
2022-01-26 14:17:01.429 | DEBUG    | __main__:trials:24 - Trial = 7612/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.431 | DEBUG    | __main__:trials:29 - Trial = 7612/30000 | Total reward = 47.80
2022-01-26 14:17:01.589 | DEBUG    | __main__:trials:24 - Trial = 7613/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.590 | DEBUG    | __main__:trials:29 - Trial = 7613/30000 | Total reward = 41.59
2022-01-26 14:17:01.593 | DEBUG    | __main__:trials:24 - Trial = 7614/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.596 | DEBUG    | __main__:trials:29 - Trial = 7614/30000 | Total reward = 47.80
2022-01-26 14:17:01.600 | DEBUG    | __main__:trials:24 - Trial = 7615/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.602 | DEBUG    | __main__:trials:29 - Trial = 7615/30000 | Total reward = 49.53
2022-01-26 14:17:01.606 | DEBUG    | __main__:trials:24 - Trial = 7616/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.607 | DEBUG    | __main__:trials:29 - Trial = 7616/30000 | Total reward = 46.89
2022-01-26 14:17:01.611 | DEBUG    | __main__:trials:24 - Trial = 7617/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.613 | DEBUG    | __main__:trials:29 - Trial = 7617/30000 | Total reward = 46.78
2022-01-26 14:17:01.617 | DEBUG    | __main__:trials:24 - Trial = 7618/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.619 | DEBUG    | __main__:trials:29 - Trial = 7618/30000 | Total reward = 47.03
2022-01-26 14:17:01.622 | DEBUG    | __main__:trials:24 - Trial = 7619/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.623 | DEBUG    | __main__:trials:29 - Trial = 7619/30000 | Total reward = 41.92
2022-01-26 14:17:01.627 | DEBUG    | __main__:trials:24 - Trial = 7620/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.629 | DEBUG    | __main__:trials:29 - Trial = 7620/30000 | Total reward = 42.39
2022-01-26 14:17:01.632 | DEBUG    | __main__:trials:24 - Trial = 7621/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.634 | DEBUG    | __main__:trials:29 - Trial = 7621/30000 | Total reward = 44.08
2022-01-26 14:17:01.637 | DEBUG    | __main__:trials:24 - Trial = 7622/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.639 | DEBUG    | __main__:trials:29 - Trial = 7622/30000 | Total reward = 46.77
2022-01-26 14:17:01.643 | DEBUG    | __main__:trials:24 - Trial = 7623/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.645 | DEBUG    | __main__:trials:29 - Trial = 7623/30000 | Total reward = 44.19
2022-01-26 14:17:01.649 | DEBUG    | __main__:trials:24 - Trial = 7624/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.650 | DEBUG    | __main__:trials:29 - Trial = 7624/30000 | Total reward = 37.69
2022-01-26 14:17:01.654 | DEBUG    | __main__:trials:24 - Trial = 7625/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.654 | DEBUG    | __main__:trials:29 - Trial = 7625/30000 | Total reward = 36.35
2022-01-26 14:17:01.658 | DEBUG    | __main__:trials:24 - Trial = 7626/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.660 | DEBUG    | __main__:trials:29 - Trial = 7626/30000 | Total reward = 41.81
2022-01-26 14:17:01.663 | DEBUG    | __main__:trials:24 - Trial = 7627/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.665 | DEBUG    | __main__:trials:29 - Trial = 7627/30000 | Total reward = 41.81
2022-01-26 14:17:01.668 | DEBUG    | __main__:trials:24 - Trial = 7628/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.670 | DEBUG    | __main__:trials:29 - Trial = 7628/30000 | Total reward = 33.28
2022-01-26 14:17:01.674 | DEBUG    | __main__:trials:24 - Trial = 7629/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.676 | DEBUG    | __main__:trials:29 - Trial = 7629/30000 | Total reward = 44.91
2022-01-26 14:17:01.679 | DEBUG    | __main__:trials:24 - Trial = 7630/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.680 | DEBUG    | __main__:trials:29 - Trial = 7630/30000 | Total reward = 38.11
2022-01-26 14:17:01.684 | DEBUG    | __main__:trials:24 - Trial = 7631/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.686 | DEBUG    | __main__:trials:29 - Trial = 7631/30000 | Total reward = 35.93
2022-01-26 14:17:01.689 | DEBUG    | __main__:trials:24 - Trial = 7632/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.691 | DEBUG    | __main__:trials:29 - Trial = 7632/30000 | Total reward = 47.79
2022-01-26 14:17:01.694 | DEBUG    | __main__:trials:24 - Trial = 7633/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.696 | DEBUG    | __main__:trials:29 - Trial = 7633/30000 | Total reward = 51.92
2022-01-26 14:17:01.700 | DEBUG    | __main__:trials:24 - Trial = 7634/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.701 | DEBUG    | __main__:trials:29 - Trial = 7634/30000 | Total reward = 53.56
2022-01-26 14:17:01.705 | DEBUG    | __main__:trials:24 - Trial = 7635/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.706 | DEBUG    | __main__:trials:29 - Trial = 7635/30000 | Total reward = 29.08
2022-01-26 14:17:01.710 | DEBUG    | __main__:trials:24 - Trial = 7636/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.712 | DEBUG    | __main__:trials:29 - Trial = 7636/30000 | Total reward = 55.23
2022-01-26 14:17:01.715 | DEBUG    | __main__:trials:24 - Trial = 7637/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.717 | DEBUG    | __main__:trials:29 - Trial = 7637/30000 | Total reward = 42.76
2022-01-26 14:17:01.720 | DEBUG    | __main__:trials:24 - Trial = 7638/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.722 | DEBUG    | __main__:trials:29 - Trial = 7638/30000 | Total reward = 40.54
2022-01-26 14:17:01.725 | DEBUG    | __main__:trials:24 - Trial = 7639/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.726 | DEBUG    | __main__:trials:29 - Trial = 7639/30000 | Total reward = 31.86
2022-01-26 14:17:01.730 | DEBUG    | __main__:trials:24 - Trial = 7640/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.732 | DEBUG    | __main__:trials:29 - Trial = 7640/30000 | Total reward = 52.90
2022-01-26 14:17:01.736 | DEBUG    | __main__:trials:24 - Trial = 7641/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.737 | DEBUG    | __main__:trials:29 - Trial = 7641/30000 | Total reward = 44.13
2022-01-26 14:17:01.741 | DEBUG    | __main__:trials:24 - Trial = 7642/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.742 | DEBUG    | __main__:trials:29 - Trial = 7642/30000 | Total reward = 37.95
2022-01-26 14:17:01.746 | DEBUG    | __main__:trials:24 - Trial = 7643/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.747 | DEBUG    | __main__:trials:29 - Trial = 7643/30000 | Total reward = 48.15
2022-01-26 14:17:01.751 | DEBUG    | __main__:trials:24 - Trial = 7644/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.753 | DEBUG    | __main__:trials:29 - Trial = 7644/30000 | Total reward = 40.24
2022-01-26 14:17:01.757 | DEBUG    | __main__:trials:24 - Trial = 7645/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.758 | DEBUG    | __main__:trials:29 - Trial = 7645/30000 | Total reward = 64.15
2022-01-26 14:17:01.762 | DEBUG    | __main__:trials:24 - Trial = 7646/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.764 | DEBUG    | __main__:trials:29 - Trial = 7646/30000 | Total reward = 48.69
2022-01-26 14:17:01.766 | DEBUG    | __main__:trials:24 - Trial = 7647/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.768 | DEBUG    | __main__:trials:29 - Trial = 7647/30000 | Total reward = 51.36
2022-01-26 14:17:01.772 | DEBUG    | __main__:trials:24 - Trial = 7648/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.773 | DEBUG    | __main__:trials:29 - Trial = 7648/30000 | Total reward = 45.57
2022-01-26 14:17:01.777 | DEBUG    | __main__:trials:24 - Trial = 7649/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.779 | DEBUG    | __main__:trials:29 - Trial = 7649/30000 | Total reward = 42.74
2022-01-26 14:17:01.783 | DEBUG    | __main__:trials:24 - Trial = 7650/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.784 | DEBUG    | __main__:trials:29 - Trial = 7650/30000 | Total reward = 52.43
2022-01-26 14:17:01.788 | DEBUG    | __main__:trials:24 - Trial = 7651/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.790 | DEBUG    | __main__:trials:29 - Trial = 7651/30000 | Total reward = 42.39
2022-01-26 14:17:01.794 | DEBUG    | __main__:trials:24 - Trial = 7652/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.795 | DEBUG    | __main__:trials:29 - Trial = 7652/30000 | Total reward = 50.16
2022-01-26 14:17:01.799 | DEBUG    | __main__:trials:24 - Trial = 7653/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.800 | DEBUG    | __main__:trials:29 - Trial = 7653/30000 | Total reward = 50.81
2022-01-26 14:17:01.804 | DEBUG    | __main__:trials:24 - Trial = 7654/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.806 | DEBUG    | __main__:trials:29 - Trial = 7654/30000 | Total reward = 42.72
2022-01-26 14:17:01.810 | DEBUG    | __main__:trials:24 - Trial = 7655/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.811 | DEBUG    | __main__:trials:29 - Trial = 7655/30000 | Total reward = 42.19
2022-01-26 14:17:01.815 | DEBUG    | __main__:trials:24 - Trial = 7656/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.817 | DEBUG    | __main__:trials:29 - Trial = 7656/30000 | Total reward = 40.27
2022-01-26 14:17:01.820 | DEBUG    | __main__:trials:24 - Trial = 7657/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.822 | DEBUG    | __main__:trials:29 - Trial = 7657/30000 | Total reward = 38.86
2022-01-26 14:17:01.825 | DEBUG    | __main__:trials:24 - Trial = 7658/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.826 | DEBUG    | __main__:trials:29 - Trial = 7658/30000 | Total reward = 35.48
2022-01-26 14:17:01.829 | DEBUG    | __main__:trials:24 - Trial = 7659/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.830 | DEBUG    | __main__:trials:29 - Trial = 7659/30000 | Total reward = 36.59
2022-01-26 14:17:01.834 | DEBUG    | __main__:trials:24 - Trial = 7660/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.835 | DEBUG    | __main__:trials:29 - Trial = 7660/30000 | Total reward = 39.50
2022-01-26 14:17:01.839 | DEBUG    | __main__:trials:24 - Trial = 7661/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.840 | DEBUG    | __main__:trials:29 - Trial = 7661/30000 | Total reward = 41.29
2022-01-26 14:17:01.844 | DEBUG    | __main__:trials:24 - Trial = 7662/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.845 | DEBUG    | __main__:trials:29 - Trial = 7662/30000 | Total reward = 42.12
2022-01-26 14:17:01.849 | DEBUG    | __main__:trials:24 - Trial = 7663/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.851 | DEBUG    | __main__:trials:29 - Trial = 7663/30000 | Total reward = 49.96
2022-01-26 14:17:01.854 | DEBUG    | __main__:trials:24 - Trial = 7664/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.856 | DEBUG    | __main__:trials:29 - Trial = 7664/30000 | Total reward = 60.26
2022-01-26 14:17:01.860 | DEBUG    | __main__:trials:24 - Trial = 7665/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.862 | DEBUG    | __main__:trials:29 - Trial = 7665/30000 | Total reward = 41.49
2022-01-26 14:17:01.865 | DEBUG    | __main__:trials:24 - Trial = 7666/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.867 | DEBUG    | __main__:trials:29 - Trial = 7666/30000 | Total reward = 39.90
2022-01-26 14:17:01.871 | DEBUG    | __main__:trials:24 - Trial = 7667/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.872 | DEBUG    | __main__:trials:29 - Trial = 7667/30000 | Total reward = 34.97
2022-01-26 14:17:01.875 | DEBUG    | __main__:trials:24 - Trial = 7668/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.877 | DEBUG    | __main__:trials:29 - Trial = 7668/30000 | Total reward = 34.43
2022-01-26 14:17:01.880 | DEBUG    | __main__:trials:24 - Trial = 7669/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.881 | DEBUG    | __main__:trials:29 - Trial = 7669/30000 | Total reward = 52.50
2022-01-26 14:17:01.885 | DEBUG    | __main__:trials:24 - Trial = 7670/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.887 | DEBUG    | __main__:trials:29 - Trial = 7670/30000 | Total reward = 39.30
2022-01-26 14:17:01.891 | DEBUG    | __main__:trials:24 - Trial = 7671/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.892 | DEBUG    | __main__:trials:29 - Trial = 7671/30000 | Total reward = 54.72
2022-01-26 14:17:01.896 | DEBUG    | __main__:trials:24 - Trial = 7672/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.897 | DEBUG    | __main__:trials:29 - Trial = 7672/30000 | Total reward = 47.19
2022-01-26 14:17:01.901 | DEBUG    | __main__:trials:24 - Trial = 7673/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.903 | DEBUG    | __main__:trials:29 - Trial = 7673/30000 | Total reward = 46.95
2022-01-26 14:17:01.907 | DEBUG    | __main__:trials:24 - Trial = 7674/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.908 | DEBUG    | __main__:trials:29 - Trial = 7674/30000 | Total reward = 39.63
2022-01-26 14:17:01.912 | DEBUG    | __main__:trials:24 - Trial = 7675/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.914 | DEBUG    | __main__:trials:29 - Trial = 7675/30000 | Total reward = 35.56
2022-01-26 14:17:01.918 | DEBUG    | __main__:trials:24 - Trial = 7676/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.919 | DEBUG    | __main__:trials:29 - Trial = 7676/30000 | Total reward = 62.21
2022-01-26 14:17:01.923 | DEBUG    | __main__:trials:24 - Trial = 7677/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.925 | DEBUG    | __main__:trials:29 - Trial = 7677/30000 | Total reward = 51.34
2022-01-26 14:17:01.929 | DEBUG    | __main__:trials:24 - Trial = 7678/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.931 | DEBUG    | __main__:trials:29 - Trial = 7678/30000 | Total reward = 53.71
2022-01-26 14:17:01.934 | DEBUG    | __main__:trials:24 - Trial = 7679/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.936 | DEBUG    | __main__:trials:29 - Trial = 7679/30000 | Total reward = 45.77
2022-01-26 14:17:01.939 | DEBUG    | __main__:trials:24 - Trial = 7680/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.941 | DEBUG    | __main__:trials:29 - Trial = 7680/30000 | Total reward = 33.52
2022-01-26 14:17:01.945 | DEBUG    | __main__:trials:24 - Trial = 7681/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.945 | DEBUG    | __main__:trials:29 - Trial = 7681/30000 | Total reward = 55.42
2022-01-26 14:17:01.948 | DEBUG    | __main__:trials:26 - Trial = 7682/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:01.950 | DEBUG    | __main__:trials:29 - Trial = 7682/30000 | Total reward = 8.16
2022-01-26 14:17:01.953 | DEBUG    | __main__:trials:24 - Trial = 7683/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.954 | DEBUG    | __main__:trials:29 - Trial = 7683/30000 | Total reward = 56.03
2022-01-26 14:17:01.958 | DEBUG    | __main__:trials:24 - Trial = 7684/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.960 | DEBUG    | __main__:trials:29 - Trial = 7684/30000 | Total reward = 46.57
2022-01-26 14:17:01.963 | DEBUG    | __main__:trials:24 - Trial = 7685/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.965 | DEBUG    | __main__:trials:29 - Trial = 7685/30000 | Total reward = 40.94
2022-01-26 14:17:01.969 | DEBUG    | __main__:trials:24 - Trial = 7686/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.970 | DEBUG    | __main__:trials:29 - Trial = 7686/30000 | Total reward = 34.29
2022-01-26 14:17:01.973 | DEBUG    | __main__:trials:24 - Trial = 7687/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.974 | DEBUG    | __main__:trials:29 - Trial = 7687/30000 | Total reward = 33.95
2022-01-26 14:17:01.977 | DEBUG    | __main__:trials:26 - Trial = 7688/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:01.978 | DEBUG    | __main__:trials:29 - Trial = 7688/30000 | Total reward = 20.34
2022-01-26 14:17:01.983 | DEBUG    | __main__:trials:24 - Trial = 7689/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.983 | DEBUG    | __main__:trials:29 - Trial = 7689/30000 | Total reward = 31.09
2022-01-26 14:17:01.988 | DEBUG    | __main__:trials:24 - Trial = 7690/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.989 | DEBUG    | __main__:trials:29 - Trial = 7690/30000 | Total reward = 44.46
2022-01-26 14:17:01.993 | DEBUG    | __main__:trials:24 - Trial = 7691/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.994 | DEBUG    | __main__:trials:29 - Trial = 7691/30000 | Total reward = 44.46
2022-01-26 14:17:01.997 | DEBUG    | __main__:trials:24 - Trial = 7692/30000 | Max number of steps (20) reached
2022-01-26 14:17:01.998 | DEBUG    | __main__:trials:29 - Trial = 7692/30000 | Total reward = 42.66
2022-01-26 14:17:02.001 | DEBUG    | __main__:trials:24 - Trial = 7693/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.002 | DEBUG    | __main__:trials:29 - Trial = 7693/30000 | Total reward = 33.47
2022-01-26 14:17:02.006 | DEBUG    | __main__:trials:24 - Trial = 7694/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.008 | DEBUG    | __main__:trials:29 - Trial = 7694/30000 | Total reward = 26.97
2022-01-26 14:17:02.011 | DEBUG    | __main__:trials:24 - Trial = 7695/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.013 | DEBUG    | __main__:trials:29 - Trial = 7695/30000 | Total reward = 19.86
2022-01-26 14:17:02.016 | DEBUG    | __main__:trials:24 - Trial = 7696/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.018 | DEBUG    | __main__:trials:29 - Trial = 7696/30000 | Total reward = 24.81
2022-01-26 14:17:02.021 | DEBUG    | __main__:trials:24 - Trial = 7697/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.023 | DEBUG    | __main__:trials:29 - Trial = 7697/30000 | Total reward = 47.03
2022-01-26 14:17:02.026 | DEBUG    | __main__:trials:24 - Trial = 7698/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.028 | DEBUG    | __main__:trials:29 - Trial = 7698/30000 | Total reward = 46.82
2022-01-26 14:17:02.032 | DEBUG    | __main__:trials:24 - Trial = 7699/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.033 | DEBUG    | __main__:trials:29 - Trial = 7699/30000 | Total reward = 39.94
2022-01-26 14:17:02.037 | DEBUG    | __main__:trials:24 - Trial = 7700/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.039 | DEBUG    | __main__:trials:29 - Trial = 7700/30000 | Total reward = 35.25
2022-01-26 14:17:02.043 | DEBUG    | __main__:trials:24 - Trial = 7701/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.044 | DEBUG    | __main__:trials:29 - Trial = 7701/30000 | Total reward = 46.34
2022-01-26 14:17:02.048 | DEBUG    | __main__:trials:26 - Trial = 7702/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.049 | DEBUG    | __main__:trials:29 - Trial = 7702/30000 | Total reward = 18.38
2022-01-26 14:17:02.053 | DEBUG    | __main__:trials:24 - Trial = 7703/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.054 | DEBUG    | __main__:trials:29 - Trial = 7703/30000 | Total reward = 36.35
2022-01-26 14:17:02.057 | DEBUG    | __main__:trials:24 - Trial = 7704/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.058 | DEBUG    | __main__:trials:29 - Trial = 7704/30000 | Total reward = 52.74
2022-01-26 14:17:02.061 | DEBUG    | __main__:trials:24 - Trial = 7705/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.062 | DEBUG    | __main__:trials:29 - Trial = 7705/30000 | Total reward = 55.38
2022-01-26 14:17:02.066 | DEBUG    | __main__:trials:24 - Trial = 7706/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.068 | DEBUG    | __main__:trials:29 - Trial = 7706/30000 | Total reward = 46.65
2022-01-26 14:17:02.072 | DEBUG    | __main__:trials:24 - Trial = 7707/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.072 | DEBUG    | __main__:trials:29 - Trial = 7707/30000 | Total reward = 47.01
2022-01-26 14:17:02.077 | DEBUG    | __main__:trials:24 - Trial = 7708/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.078 | DEBUG    | __main__:trials:29 - Trial = 7708/30000 | Total reward = 37.45
2022-01-26 14:17:02.081 | DEBUG    | __main__:trials:26 - Trial = 7709/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.083 | DEBUG    | __main__:trials:29 - Trial = 7709/30000 | Total reward = 36.13
2022-01-26 14:17:02.086 | DEBUG    | __main__:trials:24 - Trial = 7710/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.086 | DEBUG    | __main__:trials:29 - Trial = 7710/30000 | Total reward = 41.37
2022-01-26 14:17:02.090 | DEBUG    | __main__:trials:24 - Trial = 7711/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.092 | DEBUG    | __main__:trials:29 - Trial = 7711/30000 | Total reward = 39.58
2022-01-26 14:17:02.096 | DEBUG    | __main__:trials:24 - Trial = 7712/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.097 | DEBUG    | __main__:trials:29 - Trial = 7712/30000 | Total reward = 46.77
2022-01-26 14:17:02.101 | DEBUG    | __main__:trials:24 - Trial = 7713/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.103 | DEBUG    | __main__:trials:29 - Trial = 7713/30000 | Total reward = 41.93
2022-01-26 14:17:02.107 | DEBUG    | __main__:trials:24 - Trial = 7714/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.108 | DEBUG    | __main__:trials:29 - Trial = 7714/30000 | Total reward = 46.96
2022-01-26 14:17:02.112 | DEBUG    | __main__:trials:24 - Trial = 7715/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.113 | DEBUG    | __main__:trials:29 - Trial = 7715/30000 | Total reward = 44.23
2022-01-26 14:17:02.117 | DEBUG    | __main__:trials:24 - Trial = 7716/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.118 | DEBUG    | __main__:trials:29 - Trial = 7716/30000 | Total reward = 31.78
2022-01-26 14:17:02.122 | DEBUG    | __main__:trials:24 - Trial = 7717/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.124 | DEBUG    | __main__:trials:29 - Trial = 7717/30000 | Total reward = 38.98
2022-01-26 14:17:02.128 | DEBUG    | __main__:trials:24 - Trial = 7718/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.129 | DEBUG    | __main__:trials:29 - Trial = 7718/30000 | Total reward = 62.90
2022-01-26 14:17:02.133 | DEBUG    | __main__:trials:24 - Trial = 7719/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.135 | DEBUG    | __main__:trials:29 - Trial = 7719/30000 | Total reward = 47.95
2022-01-26 14:17:02.139 | DEBUG    | __main__:trials:24 - Trial = 7720/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.140 | DEBUG    | __main__:trials:29 - Trial = 7720/30000 | Total reward = 41.71
2022-01-26 14:17:02.144 | DEBUG    | __main__:trials:24 - Trial = 7721/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.145 | DEBUG    | __main__:trials:29 - Trial = 7721/30000 | Total reward = 41.82
2022-01-26 14:17:02.149 | DEBUG    | __main__:trials:24 - Trial = 7722/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.150 | DEBUG    | __main__:trials:29 - Trial = 7722/30000 | Total reward = 39.76
2022-01-26 14:17:02.154 | DEBUG    | __main__:trials:24 - Trial = 7723/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.156 | DEBUG    | __main__:trials:29 - Trial = 7723/30000 | Total reward = 37.72
2022-01-26 14:17:02.160 | DEBUG    | __main__:trials:24 - Trial = 7724/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.161 | DEBUG    | __main__:trials:29 - Trial = 7724/30000 | Total reward = 41.91
2022-01-26 14:17:02.165 | DEBUG    | __main__:trials:24 - Trial = 7725/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.166 | DEBUG    | __main__:trials:29 - Trial = 7725/30000 | Total reward = 53.71
2022-01-26 14:17:02.170 | DEBUG    | __main__:trials:24 - Trial = 7726/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.172 | DEBUG    | __main__:trials:29 - Trial = 7726/30000 | Total reward = 46.69
2022-01-26 14:17:02.176 | DEBUG    | __main__:trials:24 - Trial = 7727/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.176 | DEBUG    | __main__:trials:29 - Trial = 7727/30000 | Total reward = 41.11
2022-01-26 14:17:02.181 | DEBUG    | __main__:trials:24 - Trial = 7728/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.181 | DEBUG    | __main__:trials:29 - Trial = 7728/30000 | Total reward = 56.69
2022-01-26 14:17:02.186 | DEBUG    | __main__:trials:24 - Trial = 7729/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.188 | DEBUG    | __main__:trials:29 - Trial = 7729/30000 | Total reward = 43.47
2022-01-26 14:17:02.191 | DEBUG    | __main__:trials:24 - Trial = 7730/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.193 | DEBUG    | __main__:trials:29 - Trial = 7730/30000 | Total reward = 52.85
2022-01-26 14:17:02.196 | DEBUG    | __main__:trials:24 - Trial = 7731/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.198 | DEBUG    | __main__:trials:29 - Trial = 7731/30000 | Total reward = 47.01
2022-01-26 14:17:02.202 | DEBUG    | __main__:trials:24 - Trial = 7732/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.204 | DEBUG    | __main__:trials:29 - Trial = 7732/30000 | Total reward = 46.20
2022-01-26 14:17:02.208 | DEBUG    | __main__:trials:24 - Trial = 7733/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.209 | DEBUG    | __main__:trials:29 - Trial = 7733/30000 | Total reward = 41.17
2022-01-26 14:17:02.213 | DEBUG    | __main__:trials:24 - Trial = 7734/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.215 | DEBUG    | __main__:trials:29 - Trial = 7734/30000 | Total reward = 34.09
2022-01-26 14:17:02.218 | DEBUG    | __main__:trials:24 - Trial = 7735/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.220 | DEBUG    | __main__:trials:29 - Trial = 7735/30000 | Total reward = 40.51
2022-01-26 14:17:02.224 | DEBUG    | __main__:trials:24 - Trial = 7736/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.225 | DEBUG    | __main__:trials:29 - Trial = 7736/30000 | Total reward = 45.55
2022-01-26 14:17:02.229 | DEBUG    | __main__:trials:24 - Trial = 7737/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.231 | DEBUG    | __main__:trials:29 - Trial = 7737/30000 | Total reward = 37.30
2022-01-26 14:17:02.234 | DEBUG    | __main__:trials:24 - Trial = 7738/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.236 | DEBUG    | __main__:trials:29 - Trial = 7738/30000 | Total reward = 41.70
2022-01-26 14:17:02.240 | DEBUG    | __main__:trials:24 - Trial = 7739/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.242 | DEBUG    | __main__:trials:29 - Trial = 7739/30000 | Total reward = 43.36
2022-01-26 14:17:02.246 | DEBUG    | __main__:trials:24 - Trial = 7740/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.247 | DEBUG    | __main__:trials:29 - Trial = 7740/30000 | Total reward = 47.21
2022-01-26 14:17:02.251 | DEBUG    | __main__:trials:26 - Trial = 7741/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.253 | DEBUG    | __main__:trials:29 - Trial = 7741/30000 | Total reward = 31.47
2022-01-26 14:17:02.256 | DEBUG    | __main__:trials:24 - Trial = 7742/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.258 | DEBUG    | __main__:trials:29 - Trial = 7742/30000 | Total reward = 32.98
2022-01-26 14:17:02.262 | DEBUG    | __main__:trials:24 - Trial = 7743/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.264 | DEBUG    | __main__:trials:29 - Trial = 7743/30000 | Total reward = 52.61
2022-01-26 14:17:02.267 | DEBUG    | __main__:trials:24 - Trial = 7744/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.268 | DEBUG    | __main__:trials:29 - Trial = 7744/30000 | Total reward = 29.34
2022-01-26 14:17:02.272 | DEBUG    | __main__:trials:24 - Trial = 7745/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.274 | DEBUG    | __main__:trials:29 - Trial = 7745/30000 | Total reward = 42.19
2022-01-26 14:17:02.278 | DEBUG    | __main__:trials:24 - Trial = 7746/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.278 | DEBUG    | __main__:trials:29 - Trial = 7746/30000 | Total reward = 34.29
2022-01-26 14:17:02.282 | DEBUG    | __main__:trials:24 - Trial = 7747/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.284 | DEBUG    | __main__:trials:29 - Trial = 7747/30000 | Total reward = 35.53
2022-01-26 14:17:02.288 | DEBUG    | __main__:trials:24 - Trial = 7748/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.289 | DEBUG    | __main__:trials:29 - Trial = 7748/30000 | Total reward = 47.72
2022-01-26 14:17:02.293 | DEBUG    | __main__:trials:24 - Trial = 7749/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.294 | DEBUG    | __main__:trials:29 - Trial = 7749/30000 | Total reward = 31.09
2022-01-26 14:17:02.298 | DEBUG    | __main__:trials:24 - Trial = 7750/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.300 | DEBUG    | __main__:trials:29 - Trial = 7750/30000 | Total reward = 19.64
2022-01-26 14:17:02.303 | DEBUG    | __main__:trials:24 - Trial = 7751/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.305 | DEBUG    | __main__:trials:29 - Trial = 7751/30000 | Total reward = 34.29
2022-01-26 14:17:02.309 | DEBUG    | __main__:trials:24 - Trial = 7752/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.311 | DEBUG    | __main__:trials:29 - Trial = 7752/30000 | Total reward = 54.13
2022-01-26 14:17:02.315 | DEBUG    | __main__:trials:24 - Trial = 7753/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.316 | DEBUG    | __main__:trials:29 - Trial = 7753/30000 | Total reward = 29.40
2022-01-26 14:17:02.320 | DEBUG    | __main__:trials:24 - Trial = 7754/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.322 | DEBUG    | __main__:trials:29 - Trial = 7754/30000 | Total reward = 50.95
2022-01-26 14:17:02.326 | DEBUG    | __main__:trials:24 - Trial = 7755/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.327 | DEBUG    | __main__:trials:29 - Trial = 7755/30000 | Total reward = 58.92
2022-01-26 14:17:02.330 | DEBUG    | __main__:trials:26 - Trial = 7756/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.332 | DEBUG    | __main__:trials:29 - Trial = 7756/30000 | Total reward = 16.11
2022-01-26 14:17:02.335 | DEBUG    | __main__:trials:24 - Trial = 7757/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.337 | DEBUG    | __main__:trials:29 - Trial = 7757/30000 | Total reward = 51.03
2022-01-26 14:17:02.340 | DEBUG    | __main__:trials:26 - Trial = 7758/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.341 | DEBUG    | __main__:trials:29 - Trial = 7758/30000 | Total reward = 34.84
2022-01-26 14:17:02.345 | DEBUG    | __main__:trials:24 - Trial = 7759/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.346 | DEBUG    | __main__:trials:29 - Trial = 7759/30000 | Total reward = 47.44
2022-01-26 14:17:02.349 | DEBUG    | __main__:trials:26 - Trial = 7760/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.351 | DEBUG    | __main__:trials:29 - Trial = 7760/30000 | Total reward = 21.47
2022-01-26 14:17:02.354 | DEBUG    | __main__:trials:24 - Trial = 7761/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.356 | DEBUG    | __main__:trials:29 - Trial = 7761/30000 | Total reward = 53.44
2022-01-26 14:17:02.360 | DEBUG    | __main__:trials:24 - Trial = 7762/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.361 | DEBUG    | __main__:trials:29 - Trial = 7762/30000 | Total reward = 47.03
2022-01-26 14:17:02.365 | DEBUG    | __main__:trials:24 - Trial = 7763/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.367 | DEBUG    | __main__:trials:29 - Trial = 7763/30000 | Total reward = 49.55
2022-01-26 14:17:02.371 | DEBUG    | __main__:trials:24 - Trial = 7764/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.372 | DEBUG    | __main__:trials:29 - Trial = 7764/30000 | Total reward = 46.71
2022-01-26 14:17:02.376 | DEBUG    | __main__:trials:24 - Trial = 7765/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.377 | DEBUG    | __main__:trials:29 - Trial = 7765/30000 | Total reward = 43.83
2022-01-26 14:17:02.381 | DEBUG    | __main__:trials:24 - Trial = 7766/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.382 | DEBUG    | __main__:trials:29 - Trial = 7766/30000 | Total reward = 41.09
2022-01-26 14:17:02.386 | DEBUG    | __main__:trials:24 - Trial = 7767/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.387 | DEBUG    | __main__:trials:29 - Trial = 7767/30000 | Total reward = 43.37
2022-01-26 14:17:02.391 | DEBUG    | __main__:trials:24 - Trial = 7768/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.393 | DEBUG    | __main__:trials:29 - Trial = 7768/30000 | Total reward = 52.81
2022-01-26 14:17:02.397 | DEBUG    | __main__:trials:24 - Trial = 7769/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.399 | DEBUG    | __main__:trials:29 - Trial = 7769/30000 | Total reward = 50.31
2022-01-26 14:17:02.402 | DEBUG    | __main__:trials:24 - Trial = 7770/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.402 | DEBUG    | __main__:trials:29 - Trial = 7770/30000 | Total reward = 51.65
2022-01-26 14:17:02.406 | DEBUG    | __main__:trials:24 - Trial = 7771/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.408 | DEBUG    | __main__:trials:29 - Trial = 7771/30000 | Total reward = 49.88
2022-01-26 14:17:02.412 | DEBUG    | __main__:trials:24 - Trial = 7772/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.414 | DEBUG    | __main__:trials:29 - Trial = 7772/30000 | Total reward = 43.47
2022-01-26 14:17:02.417 | DEBUG    | __main__:trials:24 - Trial = 7773/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.419 | DEBUG    | __main__:trials:29 - Trial = 7773/30000 | Total reward = 42.05
2022-01-26 14:17:02.423 | DEBUG    | __main__:trials:24 - Trial = 7774/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.425 | DEBUG    | __main__:trials:29 - Trial = 7774/30000 | Total reward = 56.30
2022-01-26 14:17:02.428 | DEBUG    | __main__:trials:24 - Trial = 7775/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.430 | DEBUG    | __main__:trials:29 - Trial = 7775/30000 | Total reward = 28.92
2022-01-26 14:17:02.434 | DEBUG    | __main__:trials:24 - Trial = 7776/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.435 | DEBUG    | __main__:trials:29 - Trial = 7776/30000 | Total reward = 41.39
2022-01-26 14:17:02.439 | DEBUG    | __main__:trials:24 - Trial = 7777/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.440 | DEBUG    | __main__:trials:29 - Trial = 7777/30000 | Total reward = 38.50
2022-01-26 14:17:02.444 | DEBUG    | __main__:trials:24 - Trial = 7778/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.446 | DEBUG    | __main__:trials:29 - Trial = 7778/30000 | Total reward = 33.14
2022-01-26 14:17:02.449 | DEBUG    | __main__:trials:24 - Trial = 7779/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.451 | DEBUG    | __main__:trials:29 - Trial = 7779/30000 | Total reward = 53.85
2022-01-26 14:17:02.454 | DEBUG    | __main__:trials:24 - Trial = 7780/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.456 | DEBUG    | __main__:trials:29 - Trial = 7780/30000 | Total reward = 49.92
2022-01-26 14:17:02.459 | DEBUG    | __main__:trials:24 - Trial = 7781/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.461 | DEBUG    | __main__:trials:29 - Trial = 7781/30000 | Total reward = 51.37
2022-01-26 14:17:02.465 | DEBUG    | __main__:trials:24 - Trial = 7782/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.466 | DEBUG    | __main__:trials:29 - Trial = 7782/30000 | Total reward = 35.46
2022-01-26 14:17:02.469 | DEBUG    | __main__:trials:24 - Trial = 7783/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.470 | DEBUG    | __main__:trials:29 - Trial = 7783/30000 | Total reward = 42.17
2022-01-26 14:17:02.473 | DEBUG    | __main__:trials:24 - Trial = 7784/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.474 | DEBUG    | __main__:trials:29 - Trial = 7784/30000 | Total reward = 42.12
2022-01-26 14:17:02.478 | DEBUG    | __main__:trials:24 - Trial = 7785/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.479 | DEBUG    | __main__:trials:29 - Trial = 7785/30000 | Total reward = 47.54
2022-01-26 14:17:02.483 | DEBUG    | __main__:trials:24 - Trial = 7786/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.485 | DEBUG    | __main__:trials:29 - Trial = 7786/30000 | Total reward = 37.50
2022-01-26 14:17:02.488 | DEBUG    | __main__:trials:24 - Trial = 7787/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.490 | DEBUG    | __main__:trials:29 - Trial = 7787/30000 | Total reward = 43.33
2022-01-26 14:17:02.494 | DEBUG    | __main__:trials:26 - Trial = 7788/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.495 | DEBUG    | __main__:trials:29 - Trial = 7788/30000 | Total reward = 30.63
2022-01-26 14:17:02.498 | DEBUG    | __main__:trials:24 - Trial = 7789/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.500 | DEBUG    | __main__:trials:29 - Trial = 7789/30000 | Total reward = 37.84
2022-01-26 14:17:02.504 | DEBUG    | __main__:trials:24 - Trial = 7790/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.505 | DEBUG    | __main__:trials:29 - Trial = 7790/30000 | Total reward = 44.77
2022-01-26 14:17:02.509 | DEBUG    | __main__:trials:24 - Trial = 7791/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.511 | DEBUG    | __main__:trials:29 - Trial = 7791/30000 | Total reward = 44.03
2022-01-26 14:17:02.515 | DEBUG    | __main__:trials:24 - Trial = 7792/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.516 | DEBUG    | __main__:trials:29 - Trial = 7792/30000 | Total reward = 50.83
2022-01-26 14:17:02.520 | DEBUG    | __main__:trials:24 - Trial = 7793/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.522 | DEBUG    | __main__:trials:29 - Trial = 7793/30000 | Total reward = 35.87
2022-01-26 14:17:02.525 | DEBUG    | __main__:trials:24 - Trial = 7794/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.526 | DEBUG    | __main__:trials:29 - Trial = 7794/30000 | Total reward = 41.54
2022-01-26 14:17:02.529 | DEBUG    | __main__:trials:24 - Trial = 7795/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.531 | DEBUG    | __main__:trials:29 - Trial = 7795/30000 | Total reward = 43.91
2022-01-26 14:17:02.535 | DEBUG    | __main__:trials:24 - Trial = 7796/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.536 | DEBUG    | __main__:trials:29 - Trial = 7796/30000 | Total reward = 42.10
2022-01-26 14:17:02.540 | DEBUG    | __main__:trials:24 - Trial = 7797/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.542 | DEBUG    | __main__:trials:29 - Trial = 7797/30000 | Total reward = 41.30
2022-01-26 14:17:02.545 | DEBUG    | __main__:trials:24 - Trial = 7798/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.547 | DEBUG    | __main__:trials:29 - Trial = 7798/30000 | Total reward = 50.84
2022-01-26 14:17:02.551 | DEBUG    | __main__:trials:24 - Trial = 7799/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.552 | DEBUG    | __main__:trials:29 - Trial = 7799/30000 | Total reward = 47.03
2022-01-26 14:17:02.556 | DEBUG    | __main__:trials:24 - Trial = 7800/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.557 | DEBUG    | __main__:trials:29 - Trial = 7800/30000 | Total reward = 48.57
2022-01-26 14:17:02.561 | DEBUG    | __main__:trials:24 - Trial = 7801/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.563 | DEBUG    | __main__:trials:29 - Trial = 7801/30000 | Total reward = 40.52
2022-01-26 14:17:02.567 | DEBUG    | __main__:trials:24 - Trial = 7802/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.568 | DEBUG    | __main__:trials:29 - Trial = 7802/30000 | Total reward = 59.99
2022-01-26 14:17:02.572 | DEBUG    | __main__:trials:24 - Trial = 7803/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.574 | DEBUG    | __main__:trials:29 - Trial = 7803/30000 | Total reward = 47.00
2022-01-26 14:17:02.578 | DEBUG    | __main__:trials:24 - Trial = 7804/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.580 | DEBUG    | __main__:trials:29 - Trial = 7804/30000 | Total reward = 48.55
2022-01-26 14:17:02.583 | DEBUG    | __main__:trials:24 - Trial = 7805/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.585 | DEBUG    | __main__:trials:29 - Trial = 7805/30000 | Total reward = 38.98
2022-01-26 14:17:02.589 | DEBUG    | __main__:trials:24 - Trial = 7806/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.590 | DEBUG    | __main__:trials:29 - Trial = 7806/30000 | Total reward = 61.26
2022-01-26 14:17:02.593 | DEBUG    | __main__:trials:24 - Trial = 7807/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.594 | DEBUG    | __main__:trials:29 - Trial = 7807/30000 | Total reward = 47.22
2022-01-26 14:17:02.598 | DEBUG    | __main__:trials:24 - Trial = 7808/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.598 | DEBUG    | __main__:trials:29 - Trial = 7808/30000 | Total reward = 46.70
2022-01-26 14:17:02.602 | DEBUG    | __main__:trials:24 - Trial = 7809/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.603 | DEBUG    | __main__:trials:29 - Trial = 7809/30000 | Total reward = 47.61
2022-01-26 14:17:02.607 | DEBUG    | __main__:trials:24 - Trial = 7810/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.609 | DEBUG    | __main__:trials:29 - Trial = 7810/30000 | Total reward = 47.29
2022-01-26 14:17:02.612 | DEBUG    | __main__:trials:24 - Trial = 7811/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.614 | DEBUG    | __main__:trials:29 - Trial = 7811/30000 | Total reward = 36.11
2022-01-26 14:17:02.618 | DEBUG    | __main__:trials:24 - Trial = 7812/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.619 | DEBUG    | __main__:trials:29 - Trial = 7812/30000 | Total reward = 35.09
2022-01-26 14:17:02.623 | DEBUG    | __main__:trials:24 - Trial = 7813/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.625 | DEBUG    | __main__:trials:29 - Trial = 7813/30000 | Total reward = 55.76
2022-01-26 14:17:02.629 | DEBUG    | __main__:trials:24 - Trial = 7814/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.630 | DEBUG    | __main__:trials:29 - Trial = 7814/30000 | Total reward = 43.60
2022-01-26 14:17:02.634 | DEBUG    | __main__:trials:24 - Trial = 7815/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.635 | DEBUG    | __main__:trials:29 - Trial = 7815/30000 | Total reward = 37.11
2022-01-26 14:17:02.639 | DEBUG    | __main__:trials:24 - Trial = 7816/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.640 | DEBUG    | __main__:trials:29 - Trial = 7816/30000 | Total reward = 31.97
2022-01-26 14:17:02.644 | DEBUG    | __main__:trials:24 - Trial = 7817/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.646 | DEBUG    | __main__:trials:29 - Trial = 7817/30000 | Total reward = 58.12
2022-01-26 14:17:02.647 | DEBUG    | __main__:trials:26 - Trial = 7818/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.649 | DEBUG    | __main__:trials:29 - Trial = 7818/30000 | Total reward = 10.37
2022-01-26 14:17:02.653 | DEBUG    | __main__:trials:24 - Trial = 7819/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.655 | DEBUG    | __main__:trials:29 - Trial = 7819/30000 | Total reward = 45.83
2022-01-26 14:17:02.658 | DEBUG    | __main__:trials:24 - Trial = 7820/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.660 | DEBUG    | __main__:trials:29 - Trial = 7820/30000 | Total reward = 45.57
2022-01-26 14:17:02.663 | DEBUG    | __main__:trials:24 - Trial = 7821/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.665 | DEBUG    | __main__:trials:29 - Trial = 7821/30000 | Total reward = 50.16
2022-01-26 14:17:02.668 | DEBUG    | __main__:trials:24 - Trial = 7822/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.670 | DEBUG    | __main__:trials:29 - Trial = 7822/30000 | Total reward = 50.55
2022-01-26 14:17:02.674 | DEBUG    | __main__:trials:24 - Trial = 7823/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.675 | DEBUG    | __main__:trials:29 - Trial = 7823/30000 | Total reward = 31.52
2022-01-26 14:17:02.679 | DEBUG    | __main__:trials:24 - Trial = 7824/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.681 | DEBUG    | __main__:trials:29 - Trial = 7824/30000 | Total reward = 32.22
2022-01-26 14:17:02.685 | DEBUG    | __main__:trials:24 - Trial = 7825/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.685 | DEBUG    | __main__:trials:29 - Trial = 7825/30000 | Total reward = 31.19
2022-01-26 14:17:02.690 | DEBUG    | __main__:trials:24 - Trial = 7826/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.692 | DEBUG    | __main__:trials:29 - Trial = 7826/30000 | Total reward = 63.51
2022-01-26 14:17:02.695 | DEBUG    | __main__:trials:24 - Trial = 7827/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.696 | DEBUG    | __main__:trials:29 - Trial = 7827/30000 | Total reward = 48.70
2022-01-26 14:17:02.700 | DEBUG    | __main__:trials:24 - Trial = 7828/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.702 | DEBUG    | __main__:trials:29 - Trial = 7828/30000 | Total reward = 45.70
2022-01-26 14:17:02.705 | DEBUG    | __main__:trials:24 - Trial = 7829/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.707 | DEBUG    | __main__:trials:29 - Trial = 7829/30000 | Total reward = 40.39
2022-01-26 14:17:02.710 | DEBUG    | __main__:trials:24 - Trial = 7830/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.712 | DEBUG    | __main__:trials:29 - Trial = 7830/30000 | Total reward = 41.27
2022-01-26 14:17:02.716 | DEBUG    | __main__:trials:24 - Trial = 7831/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.717 | DEBUG    | __main__:trials:29 - Trial = 7831/30000 | Total reward = 46.45
2022-01-26 14:17:02.721 | DEBUG    | __main__:trials:24 - Trial = 7832/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.722 | DEBUG    | __main__:trials:29 - Trial = 7832/30000 | Total reward = 48.98
2022-01-26 14:17:02.725 | DEBUG    | __main__:trials:24 - Trial = 7833/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.726 | DEBUG    | __main__:trials:29 - Trial = 7833/30000 | Total reward = 34.30
2022-01-26 14:17:02.730 | DEBUG    | __main__:trials:24 - Trial = 7834/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.731 | DEBUG    | __main__:trials:29 - Trial = 7834/30000 | Total reward = 51.16
2022-01-26 14:17:02.734 | DEBUG    | __main__:trials:26 - Trial = 7835/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.735 | DEBUG    | __main__:trials:29 - Trial = 7835/30000 | Total reward = 24.63
2022-01-26 14:17:02.739 | DEBUG    | __main__:trials:24 - Trial = 7836/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.740 | DEBUG    | __main__:trials:29 - Trial = 7836/30000 | Total reward = 45.67
2022-01-26 14:17:02.744 | DEBUG    | __main__:trials:24 - Trial = 7837/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.745 | DEBUG    | __main__:trials:29 - Trial = 7837/30000 | Total reward = 31.26
2022-01-26 14:17:02.748 | DEBUG    | __main__:trials:24 - Trial = 7838/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.749 | DEBUG    | __main__:trials:29 - Trial = 7838/30000 | Total reward = 32.07
2022-01-26 14:17:02.753 | DEBUG    | __main__:trials:24 - Trial = 7839/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.754 | DEBUG    | __main__:trials:29 - Trial = 7839/30000 | Total reward = 36.08
2022-01-26 14:17:02.758 | DEBUG    | __main__:trials:24 - Trial = 7840/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.759 | DEBUG    | __main__:trials:29 - Trial = 7840/30000 | Total reward = 48.30
2022-01-26 14:17:02.762 | DEBUG    | __main__:trials:24 - Trial = 7841/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.763 | DEBUG    | __main__:trials:29 - Trial = 7841/30000 | Total reward = 52.06
2022-01-26 14:17:02.767 | DEBUG    | __main__:trials:24 - Trial = 7842/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.769 | DEBUG    | __main__:trials:29 - Trial = 7842/30000 | Total reward = 40.02
2022-01-26 14:17:02.771 | DEBUG    | __main__:trials:26 - Trial = 7843/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.773 | DEBUG    | __main__:trials:29 - Trial = 7843/30000 | Total reward = 5.57
2022-01-26 14:17:02.777 | DEBUG    | __main__:trials:24 - Trial = 7844/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.777 | DEBUG    | __main__:trials:29 - Trial = 7844/30000 | Total reward = 45.49
2022-01-26 14:17:02.781 | DEBUG    | __main__:trials:24 - Trial = 7845/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.783 | DEBUG    | __main__:trials:29 - Trial = 7845/30000 | Total reward = 48.50
2022-01-26 14:17:02.787 | DEBUG    | __main__:trials:24 - Trial = 7846/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.789 | DEBUG    | __main__:trials:29 - Trial = 7846/30000 | Total reward = 40.16
2022-01-26 14:17:02.793 | DEBUG    | __main__:trials:24 - Trial = 7847/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.794 | DEBUG    | __main__:trials:29 - Trial = 7847/30000 | Total reward = 41.82
2022-01-26 14:17:02.798 | DEBUG    | __main__:trials:24 - Trial = 7848/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.799 | DEBUG    | __main__:trials:29 - Trial = 7848/30000 | Total reward = 46.74
2022-01-26 14:17:02.803 | DEBUG    | __main__:trials:24 - Trial = 7849/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.805 | DEBUG    | __main__:trials:29 - Trial = 7849/30000 | Total reward = 41.82
2022-01-26 14:17:02.808 | DEBUG    | __main__:trials:24 - Trial = 7850/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.811 | DEBUG    | __main__:trials:29 - Trial = 7850/30000 | Total reward = 40.04
2022-01-26 14:17:02.815 | DEBUG    | __main__:trials:24 - Trial = 7851/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.817 | DEBUG    | __main__:trials:29 - Trial = 7851/30000 | Total reward = 39.65
2022-01-26 14:17:02.821 | DEBUG    | __main__:trials:24 - Trial = 7852/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.821 | DEBUG    | __main__:trials:29 - Trial = 7852/30000 | Total reward = 38.97
2022-01-26 14:17:02.826 | DEBUG    | __main__:trials:24 - Trial = 7853/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.827 | DEBUG    | __main__:trials:29 - Trial = 7853/30000 | Total reward = 37.86
2022-01-26 14:17:02.832 | DEBUG    | __main__:trials:24 - Trial = 7854/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.833 | DEBUG    | __main__:trials:29 - Trial = 7854/30000 | Total reward = 38.93
2022-01-26 14:17:02.837 | DEBUG    | __main__:trials:24 - Trial = 7855/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.839 | DEBUG    | __main__:trials:29 - Trial = 7855/30000 | Total reward = 36.81
2022-01-26 14:17:02.843 | DEBUG    | __main__:trials:24 - Trial = 7856/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.844 | DEBUG    | __main__:trials:29 - Trial = 7856/30000 | Total reward = 45.48
2022-01-26 14:17:02.848 | DEBUG    | __main__:trials:24 - Trial = 7857/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.849 | DEBUG    | __main__:trials:29 - Trial = 7857/30000 | Total reward = 36.46
2022-01-26 14:17:02.853 | DEBUG    | __main__:trials:26 - Trial = 7858/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.854 | DEBUG    | __main__:trials:29 - Trial = 7858/30000 | Total reward = 28.23
2022-01-26 14:17:02.857 | DEBUG    | __main__:trials:24 - Trial = 7859/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.858 | DEBUG    | __main__:trials:29 - Trial = 7859/30000 | Total reward = 45.54
2022-01-26 14:17:02.862 | DEBUG    | __main__:trials:24 - Trial = 7860/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.862 | DEBUG    | __main__:trials:29 - Trial = 7860/30000 | Total reward = 33.70
2022-01-26 14:17:02.866 | DEBUG    | __main__:trials:24 - Trial = 7861/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.867 | DEBUG    | __main__:trials:29 - Trial = 7861/30000 | Total reward = 53.94
2022-01-26 14:17:02.871 | DEBUG    | __main__:trials:24 - Trial = 7862/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.872 | DEBUG    | __main__:trials:29 - Trial = 7862/30000 | Total reward = 27.78
2022-01-26 14:17:02.876 | DEBUG    | __main__:trials:24 - Trial = 7863/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.877 | DEBUG    | __main__:trials:29 - Trial = 7863/30000 | Total reward = 35.33
2022-01-26 14:17:02.880 | DEBUG    | __main__:trials:24 - Trial = 7864/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.882 | DEBUG    | __main__:trials:29 - Trial = 7864/30000 | Total reward = 39.37
2022-01-26 14:17:02.886 | DEBUG    | __main__:trials:24 - Trial = 7865/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.887 | DEBUG    | __main__:trials:29 - Trial = 7865/30000 | Total reward = 32.31
2022-01-26 14:17:02.890 | DEBUG    | __main__:trials:26 - Trial = 7866/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.891 | DEBUG    | __main__:trials:29 - Trial = 7866/30000 | Total reward = 11.37
2022-01-26 14:17:02.895 | DEBUG    | __main__:trials:24 - Trial = 7867/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.897 | DEBUG    | __main__:trials:29 - Trial = 7867/30000 | Total reward = 39.26
2022-01-26 14:17:02.900 | DEBUG    | __main__:trials:24 - Trial = 7868/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.901 | DEBUG    | __main__:trials:29 - Trial = 7868/30000 | Total reward = 48.25
2022-01-26 14:17:02.905 | DEBUG    | __main__:trials:24 - Trial = 7869/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.905 | DEBUG    | __main__:trials:29 - Trial = 7869/30000 | Total reward = 44.77
2022-01-26 14:17:02.910 | DEBUG    | __main__:trials:24 - Trial = 7870/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.912 | DEBUG    | __main__:trials:29 - Trial = 7870/30000 | Total reward = 44.62
2022-01-26 14:17:02.915 | DEBUG    | __main__:trials:24 - Trial = 7871/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.916 | DEBUG    | __main__:trials:29 - Trial = 7871/30000 | Total reward = 19.71
2022-01-26 14:17:02.920 | DEBUG    | __main__:trials:24 - Trial = 7872/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.921 | DEBUG    | __main__:trials:29 - Trial = 7872/30000 | Total reward = 47.35
2022-01-26 14:17:02.925 | DEBUG    | __main__:trials:24 - Trial = 7873/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.926 | DEBUG    | __main__:trials:29 - Trial = 7873/30000 | Total reward = 36.31
2022-01-26 14:17:02.930 | DEBUG    | __main__:trials:24 - Trial = 7874/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.932 | DEBUG    | __main__:trials:29 - Trial = 7874/30000 | Total reward = 32.42
2022-01-26 14:17:02.936 | DEBUG    | __main__:trials:24 - Trial = 7875/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.937 | DEBUG    | __main__:trials:29 - Trial = 7875/30000 | Total reward = 43.47
2022-01-26 14:17:02.940 | DEBUG    | __main__:trials:24 - Trial = 7876/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.942 | DEBUG    | __main__:trials:29 - Trial = 7876/30000 | Total reward = 36.43
2022-01-26 14:17:02.945 | DEBUG    | __main__:trials:26 - Trial = 7877/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:02.947 | DEBUG    | __main__:trials:29 - Trial = 7877/30000 | Total reward = 13.57
2022-01-26 14:17:02.950 | DEBUG    | __main__:trials:24 - Trial = 7878/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.952 | DEBUG    | __main__:trials:29 - Trial = 7878/30000 | Total reward = 33.04
2022-01-26 14:17:02.955 | DEBUG    | __main__:trials:24 - Trial = 7879/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.957 | DEBUG    | __main__:trials:29 - Trial = 7879/30000 | Total reward = 39.25
2022-01-26 14:17:02.960 | DEBUG    | __main__:trials:24 - Trial = 7880/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.962 | DEBUG    | __main__:trials:29 - Trial = 7880/30000 | Total reward = 43.42
2022-01-26 14:17:02.965 | DEBUG    | __main__:trials:24 - Trial = 7881/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.967 | DEBUG    | __main__:trials:29 - Trial = 7881/30000 | Total reward = 28.59
2022-01-26 14:17:02.971 | DEBUG    | __main__:trials:24 - Trial = 7882/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.973 | DEBUG    | __main__:trials:29 - Trial = 7882/30000 | Total reward = 41.45
2022-01-26 14:17:02.976 | DEBUG    | __main__:trials:24 - Trial = 7883/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.977 | DEBUG    | __main__:trials:29 - Trial = 7883/30000 | Total reward = 32.24
2022-01-26 14:17:02.980 | DEBUG    | __main__:trials:24 - Trial = 7884/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.983 | DEBUG    | __main__:trials:29 - Trial = 7884/30000 | Total reward = 48.01
2022-01-26 14:17:02.986 | DEBUG    | __main__:trials:24 - Trial = 7885/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.988 | DEBUG    | __main__:trials:29 - Trial = 7885/30000 | Total reward = 31.70
2022-01-26 14:17:02.992 | DEBUG    | __main__:trials:24 - Trial = 7886/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.993 | DEBUG    | __main__:trials:29 - Trial = 7886/30000 | Total reward = 44.03
2022-01-26 14:17:02.997 | DEBUG    | __main__:trials:24 - Trial = 7887/30000 | Max number of steps (20) reached
2022-01-26 14:17:02.999 | DEBUG    | __main__:trials:29 - Trial = 7887/30000 | Total reward = 31.75
2022-01-26 14:17:03.002 | DEBUG    | __main__:trials:24 - Trial = 7888/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.004 | DEBUG    | __main__:trials:29 - Trial = 7888/30000 | Total reward = 42.81
2022-01-26 14:17:03.006 | DEBUG    | __main__:trials:26 - Trial = 7889/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.007 | DEBUG    | __main__:trials:29 - Trial = 7889/30000 | Total reward = 15.31
2022-01-26 14:17:03.010 | DEBUG    | __main__:trials:24 - Trial = 7890/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.010 | DEBUG    | __main__:trials:29 - Trial = 7890/30000 | Total reward = 38.00
2022-01-26 14:17:03.014 | DEBUG    | __main__:trials:24 - Trial = 7891/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.014 | DEBUG    | __main__:trials:29 - Trial = 7891/30000 | Total reward = 28.57
2022-01-26 14:17:03.018 | DEBUG    | __main__:trials:24 - Trial = 7892/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.019 | DEBUG    | __main__:trials:29 - Trial = 7892/30000 | Total reward = 32.33
2022-01-26 14:17:03.022 | DEBUG    | __main__:trials:24 - Trial = 7893/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.024 | DEBUG    | __main__:trials:29 - Trial = 7893/30000 | Total reward = 23.85
2022-01-26 14:17:03.027 | DEBUG    | __main__:trials:24 - Trial = 7894/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.029 | DEBUG    | __main__:trials:29 - Trial = 7894/30000 | Total reward = 30.41
2022-01-26 14:17:03.033 | DEBUG    | __main__:trials:24 - Trial = 7895/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.033 | DEBUG    | __main__:trials:29 - Trial = 7895/30000 | Total reward = 24.60
2022-01-26 14:17:03.037 | DEBUG    | __main__:trials:24 - Trial = 7896/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.037 | DEBUG    | __main__:trials:29 - Trial = 7896/30000 | Total reward = 37.97
2022-01-26 14:17:03.041 | DEBUG    | __main__:trials:24 - Trial = 7897/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.042 | DEBUG    | __main__:trials:29 - Trial = 7897/30000 | Total reward = 39.47
2022-01-26 14:17:03.046 | DEBUG    | __main__:trials:24 - Trial = 7898/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.048 | DEBUG    | __main__:trials:29 - Trial = 7898/30000 | Total reward = 39.22
2022-01-26 14:17:03.052 | DEBUG    | __main__:trials:24 - Trial = 7899/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.052 | DEBUG    | __main__:trials:29 - Trial = 7899/30000 | Total reward = 38.81
2022-01-26 14:17:03.057 | DEBUG    | __main__:trials:24 - Trial = 7900/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.057 | DEBUG    | __main__:trials:29 - Trial = 7900/30000 | Total reward = 45.41
2022-01-26 14:17:03.061 | DEBUG    | __main__:trials:24 - Trial = 7901/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.062 | DEBUG    | __main__:trials:29 - Trial = 7901/30000 | Total reward = 50.04
2022-01-26 14:17:03.065 | DEBUG    | __main__:trials:24 - Trial = 7902/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.067 | DEBUG    | __main__:trials:29 - Trial = 7902/30000 | Total reward = 48.45
2022-01-26 14:17:03.071 | DEBUG    | __main__:trials:24 - Trial = 7903/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.072 | DEBUG    | __main__:trials:29 - Trial = 7903/30000 | Total reward = 47.62
2022-01-26 14:17:03.075 | DEBUG    | __main__:trials:26 - Trial = 7904/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.076 | DEBUG    | __main__:trials:29 - Trial = 7904/30000 | Total reward = 15.04
2022-01-26 14:17:03.080 | DEBUG    | __main__:trials:24 - Trial = 7905/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.081 | DEBUG    | __main__:trials:29 - Trial = 7905/30000 | Total reward = 55.36
2022-01-26 14:17:03.085 | DEBUG    | __main__:trials:24 - Trial = 7906/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.087 | DEBUG    | __main__:trials:29 - Trial = 7906/30000 | Total reward = 43.98
2022-01-26 14:17:03.091 | DEBUG    | __main__:trials:24 - Trial = 7907/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.093 | DEBUG    | __main__:trials:29 - Trial = 7907/30000 | Total reward = 37.09
2022-01-26 14:17:03.095 | DEBUG    | __main__:trials:26 - Trial = 7908/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.097 | DEBUG    | __main__:trials:29 - Trial = 7908/30000 | Total reward = 12.50
2022-01-26 14:17:03.101 | DEBUG    | __main__:trials:24 - Trial = 7909/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.103 | DEBUG    | __main__:trials:29 - Trial = 7909/30000 | Total reward = 51.02
2022-01-26 14:17:03.107 | DEBUG    | __main__:trials:24 - Trial = 7910/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.107 | DEBUG    | __main__:trials:29 - Trial = 7910/30000 | Total reward = 44.99
2022-01-26 14:17:03.112 | DEBUG    | __main__:trials:24 - Trial = 7911/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.114 | DEBUG    | __main__:trials:29 - Trial = 7911/30000 | Total reward = 24.17
2022-01-26 14:17:03.118 | DEBUG    | __main__:trials:24 - Trial = 7912/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.121 | DEBUG    | __main__:trials:29 - Trial = 7912/30000 | Total reward = 30.41
2022-01-26 14:17:03.124 | DEBUG    | __main__:trials:26 - Trial = 7913/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.127 | DEBUG    | __main__:trials:29 - Trial = 7913/30000 | Total reward = 26.42
2022-01-26 14:17:03.130 | DEBUG    | __main__:trials:24 - Trial = 7914/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.133 | DEBUG    | __main__:trials:29 - Trial = 7914/30000 | Total reward = 49.84
2022-01-26 14:17:03.137 | DEBUG    | __main__:trials:24 - Trial = 7915/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.138 | DEBUG    | __main__:trials:29 - Trial = 7915/30000 | Total reward = 37.09
2022-01-26 14:17:03.141 | DEBUG    | __main__:trials:26 - Trial = 7916/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.142 | DEBUG    | __main__:trials:29 - Trial = 7916/30000 | Total reward = 24.82
2022-01-26 14:17:03.145 | DEBUG    | __main__:trials:24 - Trial = 7917/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.147 | DEBUG    | __main__:trials:29 - Trial = 7917/30000 | Total reward = 31.19
2022-01-26 14:17:03.151 | DEBUG    | __main__:trials:24 - Trial = 7918/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.153 | DEBUG    | __main__:trials:29 - Trial = 7918/30000 | Total reward = 26.26
2022-01-26 14:17:03.156 | DEBUG    | __main__:trials:24 - Trial = 7919/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.158 | DEBUG    | __main__:trials:29 - Trial = 7919/30000 | Total reward = 44.82
2022-01-26 14:17:03.162 | DEBUG    | __main__:trials:24 - Trial = 7920/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.163 | DEBUG    | __main__:trials:29 - Trial = 7920/30000 | Total reward = 34.26
2022-01-26 14:17:03.167 | DEBUG    | __main__:trials:24 - Trial = 7921/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.169 | DEBUG    | __main__:trials:29 - Trial = 7921/30000 | Total reward = 31.99
2022-01-26 14:17:03.171 | DEBUG    | __main__:trials:24 - Trial = 7922/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.173 | DEBUG    | __main__:trials:29 - Trial = 7922/30000 | Total reward = 35.97
2022-01-26 14:17:03.177 | DEBUG    | __main__:trials:24 - Trial = 7923/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.179 | DEBUG    | __main__:trials:29 - Trial = 7923/30000 | Total reward = 50.98
2022-01-26 14:17:03.182 | DEBUG    | __main__:trials:24 - Trial = 7924/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.184 | DEBUG    | __main__:trials:29 - Trial = 7924/30000 | Total reward = 47.57
2022-01-26 14:17:03.188 | DEBUG    | __main__:trials:24 - Trial = 7925/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.189 | DEBUG    | __main__:trials:29 - Trial = 7925/30000 | Total reward = 32.03
2022-01-26 14:17:03.193 | DEBUG    | __main__:trials:24 - Trial = 7926/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.194 | DEBUG    | __main__:trials:29 - Trial = 7926/30000 | Total reward = 32.42
2022-01-26 14:17:03.197 | DEBUG    | __main__:trials:24 - Trial = 7927/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.199 | DEBUG    | __main__:trials:29 - Trial = 7927/30000 | Total reward = 33.02
2022-01-26 14:17:03.203 | DEBUG    | __main__:trials:24 - Trial = 7928/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.205 | DEBUG    | __main__:trials:29 - Trial = 7928/30000 | Total reward = 50.70
2022-01-26 14:17:03.209 | DEBUG    | __main__:trials:24 - Trial = 7929/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.210 | DEBUG    | __main__:trials:29 - Trial = 7929/30000 | Total reward = 33.86
2022-01-26 14:17:03.214 | DEBUG    | __main__:trials:24 - Trial = 7930/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.215 | DEBUG    | __main__:trials:29 - Trial = 7930/30000 | Total reward = 41.15
2022-01-26 14:17:03.219 | DEBUG    | __main__:trials:24 - Trial = 7931/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.219 | DEBUG    | __main__:trials:29 - Trial = 7931/30000 | Total reward = 23.00
2022-01-26 14:17:03.223 | DEBUG    | __main__:trials:24 - Trial = 7932/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.224 | DEBUG    | __main__:trials:29 - Trial = 7932/30000 | Total reward = 49.39
2022-01-26 14:17:03.228 | DEBUG    | __main__:trials:26 - Trial = 7933/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.228 | DEBUG    | __main__:trials:29 - Trial = 7933/30000 | Total reward = 24.22
2022-01-26 14:17:03.232 | DEBUG    | __main__:trials:24 - Trial = 7934/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.232 | DEBUG    | __main__:trials:29 - Trial = 7934/30000 | Total reward = 46.63
2022-01-26 14:17:03.236 | DEBUG    | __main__:trials:24 - Trial = 7935/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.238 | DEBUG    | __main__:trials:29 - Trial = 7935/30000 | Total reward = 50.83
2022-01-26 14:17:03.241 | DEBUG    | __main__:trials:24 - Trial = 7936/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.243 | DEBUG    | __main__:trials:29 - Trial = 7936/30000 | Total reward = 42.39
2022-01-26 14:17:03.247 | DEBUG    | __main__:trials:24 - Trial = 7937/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.249 | DEBUG    | __main__:trials:29 - Trial = 7937/30000 | Total reward = 33.21
2022-01-26 14:17:03.252 | DEBUG    | __main__:trials:24 - Trial = 7938/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.254 | DEBUG    | __main__:trials:29 - Trial = 7938/30000 | Total reward = 40.34
2022-01-26 14:17:03.257 | DEBUG    | __main__:trials:24 - Trial = 7939/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.259 | DEBUG    | __main__:trials:29 - Trial = 7939/30000 | Total reward = 38.82
2022-01-26 14:17:03.263 | DEBUG    | __main__:trials:24 - Trial = 7940/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.263 | DEBUG    | __main__:trials:29 - Trial = 7940/30000 | Total reward = 46.45
2022-01-26 14:17:03.268 | DEBUG    | __main__:trials:24 - Trial = 7941/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.269 | DEBUG    | __main__:trials:29 - Trial = 7941/30000 | Total reward = 46.63
2022-01-26 14:17:03.272 | DEBUG    | __main__:trials:24 - Trial = 7942/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.275 | DEBUG    | __main__:trials:29 - Trial = 7942/30000 | Total reward = 41.93
2022-01-26 14:17:03.278 | DEBUG    | __main__:trials:24 - Trial = 7943/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.280 | DEBUG    | __main__:trials:29 - Trial = 7943/30000 | Total reward = 41.42
2022-01-26 14:17:03.284 | DEBUG    | __main__:trials:24 - Trial = 7944/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.285 | DEBUG    | __main__:trials:29 - Trial = 7944/30000 | Total reward = 46.63
2022-01-26 14:17:03.289 | DEBUG    | __main__:trials:24 - Trial = 7945/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.291 | DEBUG    | __main__:trials:29 - Trial = 7945/30000 | Total reward = 36.50
2022-01-26 14:17:03.295 | DEBUG    | __main__:trials:24 - Trial = 7946/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.297 | DEBUG    | __main__:trials:29 - Trial = 7946/30000 | Total reward = 49.12
2022-01-26 14:17:03.301 | DEBUG    | __main__:trials:24 - Trial = 7947/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.303 | DEBUG    | __main__:trials:29 - Trial = 7947/30000 | Total reward = 45.23
2022-01-26 14:17:03.306 | DEBUG    | __main__:trials:24 - Trial = 7948/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.308 | DEBUG    | __main__:trials:29 - Trial = 7948/30000 | Total reward = 44.49
2022-01-26 14:17:03.311 | DEBUG    | __main__:trials:24 - Trial = 7949/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.313 | DEBUG    | __main__:trials:29 - Trial = 7949/30000 | Total reward = 39.30
2022-01-26 14:17:03.316 | DEBUG    | __main__:trials:24 - Trial = 7950/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.318 | DEBUG    | __main__:trials:29 - Trial = 7950/30000 | Total reward = 59.15
2022-01-26 14:17:03.321 | DEBUG    | __main__:trials:24 - Trial = 7951/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.323 | DEBUG    | __main__:trials:29 - Trial = 7951/30000 | Total reward = 42.89
2022-01-26 14:17:03.326 | DEBUG    | __main__:trials:24 - Trial = 7952/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.327 | DEBUG    | __main__:trials:29 - Trial = 7952/30000 | Total reward = 46.63
2022-01-26 14:17:03.331 | DEBUG    | __main__:trials:24 - Trial = 7953/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.333 | DEBUG    | __main__:trials:29 - Trial = 7953/30000 | Total reward = 30.38
2022-01-26 14:17:03.337 | DEBUG    | __main__:trials:24 - Trial = 7954/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.339 | DEBUG    | __main__:trials:29 - Trial = 7954/30000 | Total reward = 29.65
2022-01-26 14:17:03.342 | DEBUG    | __main__:trials:24 - Trial = 7955/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.344 | DEBUG    | __main__:trials:29 - Trial = 7955/30000 | Total reward = 47.80
2022-01-26 14:17:03.348 | DEBUG    | __main__:trials:24 - Trial = 7956/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.349 | DEBUG    | __main__:trials:29 - Trial = 7956/30000 | Total reward = 46.83
2022-01-26 14:17:03.353 | DEBUG    | __main__:trials:24 - Trial = 7957/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.355 | DEBUG    | __main__:trials:29 - Trial = 7957/30000 | Total reward = 55.82
2022-01-26 14:17:03.358 | DEBUG    | __main__:trials:24 - Trial = 7958/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.360 | DEBUG    | __main__:trials:29 - Trial = 7958/30000 | Total reward = 52.38
2022-01-26 14:17:03.363 | DEBUG    | __main__:trials:24 - Trial = 7959/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.365 | DEBUG    | __main__:trials:29 - Trial = 7959/30000 | Total reward = 55.27
2022-01-26 14:17:03.368 | DEBUG    | __main__:trials:24 - Trial = 7960/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.370 | DEBUG    | __main__:trials:29 - Trial = 7960/30000 | Total reward = 38.47
2022-01-26 14:17:03.374 | DEBUG    | __main__:trials:24 - Trial = 7961/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.376 | DEBUG    | __main__:trials:29 - Trial = 7961/30000 | Total reward = 60.39
2022-01-26 14:17:03.379 | DEBUG    | __main__:trials:24 - Trial = 7962/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.381 | DEBUG    | __main__:trials:29 - Trial = 7962/30000 | Total reward = 50.83
2022-01-26 14:17:03.385 | DEBUG    | __main__:trials:24 - Trial = 7963/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.386 | DEBUG    | __main__:trials:29 - Trial = 7963/30000 | Total reward = 49.16
2022-01-26 14:17:03.390 | DEBUG    | __main__:trials:24 - Trial = 7964/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.392 | DEBUG    | __main__:trials:29 - Trial = 7964/30000 | Total reward = 51.13
2022-01-26 14:17:03.396 | DEBUG    | __main__:trials:24 - Trial = 7965/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.397 | DEBUG    | __main__:trials:29 - Trial = 7965/30000 | Total reward = 51.65
2022-01-26 14:17:03.401 | DEBUG    | __main__:trials:24 - Trial = 7966/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.402 | DEBUG    | __main__:trials:29 - Trial = 7966/30000 | Total reward = 52.56
2022-01-26 14:17:03.405 | DEBUG    | __main__:trials:24 - Trial = 7967/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.407 | DEBUG    | __main__:trials:29 - Trial = 7967/30000 | Total reward = 60.87
2022-01-26 14:17:03.411 | DEBUG    | __main__:trials:24 - Trial = 7968/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.412 | DEBUG    | __main__:trials:29 - Trial = 7968/30000 | Total reward = 47.79
2022-01-26 14:17:03.415 | DEBUG    | __main__:trials:24 - Trial = 7969/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.418 | DEBUG    | __main__:trials:29 - Trial = 7969/30000 | Total reward = 51.71
2022-01-26 14:17:03.421 | DEBUG    | __main__:trials:24 - Trial = 7970/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.423 | DEBUG    | __main__:trials:29 - Trial = 7970/30000 | Total reward = 38.40
2022-01-26 14:17:03.427 | DEBUG    | __main__:trials:24 - Trial = 7971/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.429 | DEBUG    | __main__:trials:29 - Trial = 7971/30000 | Total reward = 50.38
2022-01-26 14:17:03.432 | DEBUG    | __main__:trials:24 - Trial = 7972/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.434 | DEBUG    | __main__:trials:29 - Trial = 7972/30000 | Total reward = 38.65
2022-01-26 14:17:03.437 | DEBUG    | __main__:trials:24 - Trial = 7973/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.439 | DEBUG    | __main__:trials:29 - Trial = 7973/30000 | Total reward = 45.33
2022-01-26 14:17:03.443 | DEBUG    | __main__:trials:24 - Trial = 7974/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.444 | DEBUG    | __main__:trials:29 - Trial = 7974/30000 | Total reward = 52.88
2022-01-26 14:17:03.448 | DEBUG    | __main__:trials:24 - Trial = 7975/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.449 | DEBUG    | __main__:trials:29 - Trial = 7975/30000 | Total reward = 45.03
2022-01-26 14:17:03.453 | DEBUG    | __main__:trials:24 - Trial = 7976/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.455 | DEBUG    | __main__:trials:29 - Trial = 7976/30000 | Total reward = 47.31
2022-01-26 14:17:03.458 | DEBUG    | __main__:trials:24 - Trial = 7977/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.460 | DEBUG    | __main__:trials:29 - Trial = 7977/30000 | Total reward = 52.77
2022-01-26 14:17:03.463 | DEBUG    | __main__:trials:24 - Trial = 7978/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.465 | DEBUG    | __main__:trials:29 - Trial = 7978/30000 | Total reward = 43.46
2022-01-26 14:17:03.468 | DEBUG    | __main__:trials:24 - Trial = 7979/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.469 | DEBUG    | __main__:trials:29 - Trial = 7979/30000 | Total reward = 47.23
2022-01-26 14:17:03.473 | DEBUG    | __main__:trials:24 - Trial = 7980/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.474 | DEBUG    | __main__:trials:29 - Trial = 7980/30000 | Total reward = 53.58
2022-01-26 14:17:03.477 | DEBUG    | __main__:trials:24 - Trial = 7981/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.478 | DEBUG    | __main__:trials:29 - Trial = 7981/30000 | Total reward = 34.92
2022-01-26 14:17:03.481 | DEBUG    | __main__:trials:24 - Trial = 7982/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.482 | DEBUG    | __main__:trials:29 - Trial = 7982/30000 | Total reward = 40.36
2022-01-26 14:17:03.486 | DEBUG    | __main__:trials:24 - Trial = 7983/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.488 | DEBUG    | __main__:trials:29 - Trial = 7983/30000 | Total reward = 59.63
2022-01-26 14:17:03.491 | DEBUG    | __main__:trials:24 - Trial = 7984/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.493 | DEBUG    | __main__:trials:29 - Trial = 7984/30000 | Total reward = 51.20
2022-01-26 14:17:03.497 | DEBUG    | __main__:trials:24 - Trial = 7985/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.498 | DEBUG    | __main__:trials:29 - Trial = 7985/30000 | Total reward = 42.14
2022-01-26 14:17:03.501 | DEBUG    | __main__:trials:24 - Trial = 7986/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.503 | DEBUG    | __main__:trials:29 - Trial = 7986/30000 | Total reward = 44.04
2022-01-26 14:17:03.505 | DEBUG    | __main__:trials:26 - Trial = 7987/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.507 | DEBUG    | __main__:trials:29 - Trial = 7987/30000 | Total reward = 15.05
2022-01-26 14:17:03.510 | DEBUG    | __main__:trials:24 - Trial = 7988/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.511 | DEBUG    | __main__:trials:29 - Trial = 7988/30000 | Total reward = 38.75
2022-01-26 14:17:03.515 | DEBUG    | __main__:trials:24 - Trial = 7989/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.516 | DEBUG    | __main__:trials:29 - Trial = 7989/30000 | Total reward = 44.50
2022-01-26 14:17:03.520 | DEBUG    | __main__:trials:24 - Trial = 7990/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.521 | DEBUG    | __main__:trials:29 - Trial = 7990/30000 | Total reward = 42.20
2022-01-26 14:17:03.525 | DEBUG    | __main__:trials:24 - Trial = 7991/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.527 | DEBUG    | __main__:trials:29 - Trial = 7991/30000 | Total reward = 24.17
2022-01-26 14:17:03.531 | DEBUG    | __main__:trials:24 - Trial = 7992/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.532 | DEBUG    | __main__:trials:29 - Trial = 7992/30000 | Total reward = 34.08
2022-01-26 14:17:03.536 | DEBUG    | __main__:trials:24 - Trial = 7993/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.538 | DEBUG    | __main__:trials:29 - Trial = 7993/30000 | Total reward = 51.14
2022-01-26 14:17:03.541 | DEBUG    | __main__:trials:24 - Trial = 7994/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.543 | DEBUG    | __main__:trials:29 - Trial = 7994/30000 | Total reward = 35.88
2022-01-26 14:17:03.547 | DEBUG    | __main__:trials:24 - Trial = 7995/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.548 | DEBUG    | __main__:trials:29 - Trial = 7995/30000 | Total reward = 50.30
2022-01-26 14:17:03.552 | DEBUG    | __main__:trials:26 - Trial = 7996/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:03.552 | DEBUG    | __main__:trials:29 - Trial = 7996/30000 | Total reward = 23.21
2022-01-26 14:17:03.557 | DEBUG    | __main__:trials:24 - Trial = 7997/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.557 | DEBUG    | __main__:trials:29 - Trial = 7997/30000 | Total reward = 47.50
2022-01-26 14:17:03.561 | DEBUG    | __main__:trials:24 - Trial = 7998/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.561 | DEBUG    | __main__:trials:29 - Trial = 7998/30000 | Total reward = 18.85
2022-01-26 14:17:03.566 | DEBUG    | __main__:trials:24 - Trial = 7999/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.567 | DEBUG    | __main__:trials:29 - Trial = 7999/30000 | Total reward = 45.76
2022-01-26 14:17:03.571 | DEBUG    | __main__:trials:24 - Trial = 8000/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.573 | DEBUG    | __main__:trials:29 - Trial = 8000/30000 | Total reward = 45.01
2022-01-26 14:17:03.577 | DEBUG    | __main__:trials:24 - Trial = 8001/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.578 | DEBUG    | __main__:trials:29 - Trial = 8001/30000 | Total reward = 49.17
2022-01-26 14:17:03.582 | DEBUG    | __main__:trials:24 - Trial = 8002/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.583 | DEBUG    | __main__:trials:29 - Trial = 8002/30000 | Total reward = 47.21
2022-01-26 14:17:03.586 | DEBUG    | __main__:trials:24 - Trial = 8003/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.588 | DEBUG    | __main__:trials:29 - Trial = 8003/30000 | Total reward = 38.72
2022-01-26 14:17:03.592 | DEBUG    | __main__:trials:24 - Trial = 8004/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.594 | DEBUG    | __main__:trials:29 - Trial = 8004/30000 | Total reward = 45.87
2022-01-26 14:17:03.598 | DEBUG    | __main__:trials:24 - Trial = 8005/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.599 | DEBUG    | __main__:trials:29 - Trial = 8005/30000 | Total reward = 51.19
2022-01-26 14:17:03.602 | DEBUG    | __main__:trials:24 - Trial = 8006/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.604 | DEBUG    | __main__:trials:29 - Trial = 8006/30000 | Total reward = 50.73
2022-01-26 14:17:03.608 | DEBUG    | __main__:trials:24 - Trial = 8007/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.610 | DEBUG    | __main__:trials:29 - Trial = 8007/30000 | Total reward = 48.40
2022-01-26 14:17:03.614 | DEBUG    | __main__:trials:24 - Trial = 8008/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.615 | DEBUG    | __main__:trials:29 - Trial = 8008/30000 | Total reward = 51.75
2022-01-26 14:17:03.619 | DEBUG    | __main__:trials:24 - Trial = 8009/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.619 | DEBUG    | __main__:trials:29 - Trial = 8009/30000 | Total reward = 53.15
2022-01-26 14:17:03.624 | DEBUG    | __main__:trials:24 - Trial = 8010/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.625 | DEBUG    | __main__:trials:29 - Trial = 8010/30000 | Total reward = 51.65
2022-01-26 14:17:03.628 | DEBUG    | __main__:trials:24 - Trial = 8011/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.630 | DEBUG    | __main__:trials:29 - Trial = 8011/30000 | Total reward = 51.65
2022-01-26 14:17:03.633 | DEBUG    | __main__:trials:24 - Trial = 8012/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.634 | DEBUG    | __main__:trials:29 - Trial = 8012/30000 | Total reward = 53.21
2022-01-26 14:17:03.638 | DEBUG    | __main__:trials:24 - Trial = 8013/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.640 | DEBUG    | __main__:trials:29 - Trial = 8013/30000 | Total reward = 52.12
2022-01-26 14:17:03.644 | DEBUG    | __main__:trials:24 - Trial = 8014/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.645 | DEBUG    | __main__:trials:29 - Trial = 8014/30000 | Total reward = 36.31
2022-01-26 14:17:03.648 | DEBUG    | __main__:trials:24 - Trial = 8015/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.649 | DEBUG    | __main__:trials:29 - Trial = 8015/30000 | Total reward = 36.69
2022-01-26 14:17:03.652 | DEBUG    | __main__:trials:24 - Trial = 8016/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.653 | DEBUG    | __main__:trials:29 - Trial = 8016/30000 | Total reward = 28.81
2022-01-26 14:17:03.657 | DEBUG    | __main__:trials:24 - Trial = 8017/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.658 | DEBUG    | __main__:trials:29 - Trial = 8017/30000 | Total reward = 38.99
2022-01-26 14:17:03.662 | DEBUG    | __main__:trials:24 - Trial = 8018/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.664 | DEBUG    | __main__:trials:29 - Trial = 8018/30000 | Total reward = 42.45
2022-01-26 14:17:03.667 | DEBUG    | __main__:trials:24 - Trial = 8019/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.669 | DEBUG    | __main__:trials:29 - Trial = 8019/30000 | Total reward = 51.75
2022-01-26 14:17:03.672 | DEBUG    | __main__:trials:24 - Trial = 8020/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.674 | DEBUG    | __main__:trials:29 - Trial = 8020/30000 | Total reward = 50.32
2022-01-26 14:17:03.678 | DEBUG    | __main__:trials:24 - Trial = 8021/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.680 | DEBUG    | __main__:trials:29 - Trial = 8021/30000 | Total reward = 51.34
2022-01-26 14:17:03.684 | DEBUG    | __main__:trials:24 - Trial = 8022/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.686 | DEBUG    | __main__:trials:29 - Trial = 8022/30000 | Total reward = 38.40
2022-01-26 14:17:03.690 | DEBUG    | __main__:trials:24 - Trial = 8023/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.691 | DEBUG    | __main__:trials:29 - Trial = 8023/30000 | Total reward = 55.89
2022-01-26 14:17:03.695 | DEBUG    | __main__:trials:24 - Trial = 8024/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.696 | DEBUG    | __main__:trials:29 - Trial = 8024/30000 | Total reward = 50.29
2022-01-26 14:17:03.699 | DEBUG    | __main__:trials:24 - Trial = 8025/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.701 | DEBUG    | __main__:trials:29 - Trial = 8025/30000 | Total reward = 52.39
2022-01-26 14:17:03.705 | DEBUG    | __main__:trials:24 - Trial = 8026/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.707 | DEBUG    | __main__:trials:29 - Trial = 8026/30000 | Total reward = 51.65
2022-01-26 14:17:03.710 | DEBUG    | __main__:trials:24 - Trial = 8027/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.712 | DEBUG    | __main__:trials:29 - Trial = 8027/30000 | Total reward = 45.55
2022-01-26 14:17:03.715 | DEBUG    | __main__:trials:24 - Trial = 8028/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.717 | DEBUG    | __main__:trials:29 - Trial = 8028/30000 | Total reward = 47.94
2022-01-26 14:17:03.721 | DEBUG    | __main__:trials:24 - Trial = 8029/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.722 | DEBUG    | __main__:trials:29 - Trial = 8029/30000 | Total reward = 53.31
2022-01-26 14:17:03.725 | DEBUG    | __main__:trials:24 - Trial = 8030/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.727 | DEBUG    | __main__:trials:29 - Trial = 8030/30000 | Total reward = 51.24
2022-01-26 14:17:03.731 | DEBUG    | __main__:trials:24 - Trial = 8031/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.732 | DEBUG    | __main__:trials:29 - Trial = 8031/30000 | Total reward = 51.62
2022-01-26 14:17:03.736 | DEBUG    | __main__:trials:24 - Trial = 8032/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.737 | DEBUG    | __main__:trials:29 - Trial = 8032/30000 | Total reward = 58.98
2022-01-26 14:17:03.741 | DEBUG    | __main__:trials:24 - Trial = 8033/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.742 | DEBUG    | __main__:trials:29 - Trial = 8033/30000 | Total reward = 51.78
2022-01-26 14:17:03.746 | DEBUG    | __main__:trials:24 - Trial = 8034/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.747 | DEBUG    | __main__:trials:29 - Trial = 8034/30000 | Total reward = 56.88
2022-01-26 14:17:03.750 | DEBUG    | __main__:trials:24 - Trial = 8035/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.753 | DEBUG    | __main__:trials:29 - Trial = 8035/30000 | Total reward = 58.02
2022-01-26 14:17:03.756 | DEBUG    | __main__:trials:24 - Trial = 8036/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.758 | DEBUG    | __main__:trials:29 - Trial = 8036/30000 | Total reward = 40.38
2022-01-26 14:17:03.762 | DEBUG    | __main__:trials:24 - Trial = 8037/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.763 | DEBUG    | __main__:trials:29 - Trial = 8037/30000 | Total reward = 37.40
2022-01-26 14:17:03.766 | DEBUG    | __main__:trials:24 - Trial = 8038/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.768 | DEBUG    | __main__:trials:29 - Trial = 8038/30000 | Total reward = 40.25
2022-01-26 14:17:03.772 | DEBUG    | __main__:trials:24 - Trial = 8039/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.774 | DEBUG    | __main__:trials:29 - Trial = 8039/30000 | Total reward = 50.61
2022-01-26 14:17:03.777 | DEBUG    | __main__:trials:24 - Trial = 8040/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.779 | DEBUG    | __main__:trials:29 - Trial = 8040/30000 | Total reward = 63.93
2022-01-26 14:17:03.782 | DEBUG    | __main__:trials:24 - Trial = 8041/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.784 | DEBUG    | __main__:trials:29 - Trial = 8041/30000 | Total reward = 51.19
2022-01-26 14:17:03.788 | DEBUG    | __main__:trials:24 - Trial = 8042/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.789 | DEBUG    | __main__:trials:29 - Trial = 8042/30000 | Total reward = 51.24
2022-01-26 14:17:03.793 | DEBUG    | __main__:trials:24 - Trial = 8043/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.795 | DEBUG    | __main__:trials:29 - Trial = 8043/30000 | Total reward = 38.72
2022-01-26 14:17:03.798 | DEBUG    | __main__:trials:24 - Trial = 8044/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.800 | DEBUG    | __main__:trials:29 - Trial = 8044/30000 | Total reward = 40.69
2022-01-26 14:17:03.804 | DEBUG    | __main__:trials:24 - Trial = 8045/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.805 | DEBUG    | __main__:trials:29 - Trial = 8045/30000 | Total reward = 52.52
2022-01-26 14:17:03.809 | DEBUG    | __main__:trials:24 - Trial = 8046/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.811 | DEBUG    | __main__:trials:29 - Trial = 8046/30000 | Total reward = 49.32
2022-01-26 14:17:03.814 | DEBUG    | __main__:trials:24 - Trial = 8047/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.816 | DEBUG    | __main__:trials:29 - Trial = 8047/30000 | Total reward = 46.98
2022-01-26 14:17:03.820 | DEBUG    | __main__:trials:24 - Trial = 8048/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.822 | DEBUG    | __main__:trials:29 - Trial = 8048/30000 | Total reward = 49.00
2022-01-26 14:17:03.825 | DEBUG    | __main__:trials:24 - Trial = 8049/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.827 | DEBUG    | __main__:trials:29 - Trial = 8049/30000 | Total reward = 46.54
2022-01-26 14:17:03.830 | DEBUG    | __main__:trials:24 - Trial = 8050/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.832 | DEBUG    | __main__:trials:29 - Trial = 8050/30000 | Total reward = 44.73
2022-01-26 14:17:03.835 | DEBUG    | __main__:trials:24 - Trial = 8051/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.837 | DEBUG    | __main__:trials:29 - Trial = 8051/30000 | Total reward = 27.92
2022-01-26 14:17:03.840 | DEBUG    | __main__:trials:24 - Trial = 8052/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.841 | DEBUG    | __main__:trials:29 - Trial = 8052/30000 | Total reward = 44.98
2022-01-26 14:17:03.844 | DEBUG    | __main__:trials:24 - Trial = 8053/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.846 | DEBUG    | __main__:trials:29 - Trial = 8053/30000 | Total reward = 46.78
2022-01-26 14:17:03.850 | DEBUG    | __main__:trials:24 - Trial = 8054/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.852 | DEBUG    | __main__:trials:29 - Trial = 8054/30000 | Total reward = 44.04
2022-01-26 14:17:03.856 | DEBUG    | __main__:trials:24 - Trial = 8055/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.857 | DEBUG    | __main__:trials:29 - Trial = 8055/30000 | Total reward = 47.48
2022-01-26 14:17:03.860 | DEBUG    | __main__:trials:24 - Trial = 8056/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.861 | DEBUG    | __main__:trials:29 - Trial = 8056/30000 | Total reward = 40.51
2022-01-26 14:17:03.865 | DEBUG    | __main__:trials:24 - Trial = 8057/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.867 | DEBUG    | __main__:trials:29 - Trial = 8057/30000 | Total reward = 36.73
2022-01-26 14:17:03.870 | DEBUG    | __main__:trials:24 - Trial = 8058/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.872 | DEBUG    | __main__:trials:29 - Trial = 8058/30000 | Total reward = 42.53
2022-01-26 14:17:03.876 | DEBUG    | __main__:trials:24 - Trial = 8059/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.876 | DEBUG    | __main__:trials:29 - Trial = 8059/30000 | Total reward = 51.65
2022-01-26 14:17:03.880 | DEBUG    | __main__:trials:24 - Trial = 8060/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.881 | DEBUG    | __main__:trials:29 - Trial = 8060/30000 | Total reward = 36.20
2022-01-26 14:17:03.885 | DEBUG    | __main__:trials:24 - Trial = 8061/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.886 | DEBUG    | __main__:trials:29 - Trial = 8061/30000 | Total reward = 57.66
2022-01-26 14:17:03.889 | DEBUG    | __main__:trials:24 - Trial = 8062/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.891 | DEBUG    | __main__:trials:29 - Trial = 8062/30000 | Total reward = 42.40
2022-01-26 14:17:03.894 | DEBUG    | __main__:trials:24 - Trial = 8063/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.895 | DEBUG    | __main__:trials:29 - Trial = 8063/30000 | Total reward = 52.29
2022-01-26 14:17:03.899 | DEBUG    | __main__:trials:24 - Trial = 8064/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.901 | DEBUG    | __main__:trials:29 - Trial = 8064/30000 | Total reward = 55.43
2022-01-26 14:17:03.904 | DEBUG    | __main__:trials:24 - Trial = 8065/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.906 | DEBUG    | __main__:trials:29 - Trial = 8065/30000 | Total reward = 34.29
2022-01-26 14:17:03.909 | DEBUG    | __main__:trials:24 - Trial = 8066/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.911 | DEBUG    | __main__:trials:29 - Trial = 8066/30000 | Total reward = 38.81
2022-01-26 14:17:03.915 | DEBUG    | __main__:trials:24 - Trial = 8067/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.917 | DEBUG    | __main__:trials:29 - Trial = 8067/30000 | Total reward = 46.31
2022-01-26 14:17:03.920 | DEBUG    | __main__:trials:24 - Trial = 8068/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.921 | DEBUG    | __main__:trials:29 - Trial = 8068/30000 | Total reward = 51.28
2022-01-26 14:17:03.925 | DEBUG    | __main__:trials:24 - Trial = 8069/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.927 | DEBUG    | __main__:trials:29 - Trial = 8069/30000 | Total reward = 39.04
2022-01-26 14:17:03.930 | DEBUG    | __main__:trials:24 - Trial = 8070/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.931 | DEBUG    | __main__:trials:29 - Trial = 8070/30000 | Total reward = 48.95
2022-01-26 14:17:03.935 | DEBUG    | __main__:trials:24 - Trial = 8071/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.937 | DEBUG    | __main__:trials:29 - Trial = 8071/30000 | Total reward = 43.19
2022-01-26 14:17:03.940 | DEBUG    | __main__:trials:24 - Trial = 8072/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.942 | DEBUG    | __main__:trials:29 - Trial = 8072/30000 | Total reward = 40.50
2022-01-26 14:17:03.945 | DEBUG    | __main__:trials:24 - Trial = 8073/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.947 | DEBUG    | __main__:trials:29 - Trial = 8073/30000 | Total reward = 39.02
2022-01-26 14:17:03.951 | DEBUG    | __main__:trials:24 - Trial = 8074/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.952 | DEBUG    | __main__:trials:29 - Trial = 8074/30000 | Total reward = 42.74
2022-01-26 14:17:03.956 | DEBUG    | __main__:trials:24 - Trial = 8075/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.957 | DEBUG    | __main__:trials:29 - Trial = 8075/30000 | Total reward = 43.16
2022-01-26 14:17:03.961 | DEBUG    | __main__:trials:24 - Trial = 8076/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.963 | DEBUG    | __main__:trials:29 - Trial = 8076/30000 | Total reward = 41.68
2022-01-26 14:17:03.966 | DEBUG    | __main__:trials:24 - Trial = 8077/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.968 | DEBUG    | __main__:trials:29 - Trial = 8077/30000 | Total reward = 52.98
2022-01-26 14:17:03.972 | DEBUG    | __main__:trials:24 - Trial = 8078/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.973 | DEBUG    | __main__:trials:29 - Trial = 8078/30000 | Total reward = 46.56
2022-01-26 14:17:03.977 | DEBUG    | __main__:trials:24 - Trial = 8079/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.979 | DEBUG    | __main__:trials:29 - Trial = 8079/30000 | Total reward = 52.29
2022-01-26 14:17:03.983 | DEBUG    | __main__:trials:24 - Trial = 8080/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.984 | DEBUG    | __main__:trials:29 - Trial = 8080/30000 | Total reward = 56.53
2022-01-26 14:17:03.987 | DEBUG    | __main__:trials:24 - Trial = 8081/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.989 | DEBUG    | __main__:trials:29 - Trial = 8081/30000 | Total reward = 42.86
2022-01-26 14:17:03.993 | DEBUG    | __main__:trials:24 - Trial = 8082/30000 | Max number of steps (20) reached
2022-01-26 14:17:03.995 | DEBUG    | __main__:trials:29 - Trial = 8082/30000 | Total reward = 52.23
2022-01-26 14:17:03.998 | DEBUG    | __main__:trials:24 - Trial = 8083/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.000 | DEBUG    | __main__:trials:29 - Trial = 8083/30000 | Total reward = 38.64
2022-01-26 14:17:04.004 | DEBUG    | __main__:trials:24 - Trial = 8084/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.006 | DEBUG    | __main__:trials:29 - Trial = 8084/30000 | Total reward = 42.65
2022-01-26 14:17:04.009 | DEBUG    | __main__:trials:24 - Trial = 8085/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.011 | DEBUG    | __main__:trials:29 - Trial = 8085/30000 | Total reward = 35.34
2022-01-26 14:17:04.015 | DEBUG    | __main__:trials:24 - Trial = 8086/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.017 | DEBUG    | __main__:trials:29 - Trial = 8086/30000 | Total reward = 48.44
2022-01-26 14:17:04.020 | DEBUG    | __main__:trials:24 - Trial = 8087/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.022 | DEBUG    | __main__:trials:29 - Trial = 8087/30000 | Total reward = 26.30
2022-01-26 14:17:04.026 | DEBUG    | __main__:trials:24 - Trial = 8088/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.027 | DEBUG    | __main__:trials:29 - Trial = 8088/30000 | Total reward = 42.92
2022-01-26 14:17:04.031 | DEBUG    | __main__:trials:26 - Trial = 8089/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.032 | DEBUG    | __main__:trials:29 - Trial = 8089/30000 | Total reward = 39.25
2022-01-26 14:17:04.036 | DEBUG    | __main__:trials:24 - Trial = 8090/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.037 | DEBUG    | __main__:trials:29 - Trial = 8090/30000 | Total reward = 29.76
2022-01-26 14:17:04.040 | DEBUG    | __main__:trials:26 - Trial = 8091/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.041 | DEBUG    | __main__:trials:29 - Trial = 8091/30000 | Total reward = 13.57
2022-01-26 14:17:04.045 | DEBUG    | __main__:trials:24 - Trial = 8092/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.046 | DEBUG    | __main__:trials:29 - Trial = 8092/30000 | Total reward = 40.45
2022-01-26 14:17:04.050 | DEBUG    | __main__:trials:24 - Trial = 8093/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.052 | DEBUG    | __main__:trials:29 - Trial = 8093/30000 | Total reward = 42.74
2022-01-26 14:17:04.055 | DEBUG    | __main__:trials:24 - Trial = 8094/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.057 | DEBUG    | __main__:trials:29 - Trial = 8094/30000 | Total reward = 36.95
2022-01-26 14:17:04.060 | DEBUG    | __main__:trials:24 - Trial = 8095/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.062 | DEBUG    | __main__:trials:29 - Trial = 8095/30000 | Total reward = 36.58
2022-01-26 14:17:04.065 | DEBUG    | __main__:trials:24 - Trial = 8096/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.067 | DEBUG    | __main__:trials:29 - Trial = 8096/30000 | Total reward = 47.91
2022-01-26 14:17:04.071 | DEBUG    | __main__:trials:24 - Trial = 8097/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.073 | DEBUG    | __main__:trials:29 - Trial = 8097/30000 | Total reward = 47.74
2022-01-26 14:17:04.077 | DEBUG    | __main__:trials:24 - Trial = 8098/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.078 | DEBUG    | __main__:trials:29 - Trial = 8098/30000 | Total reward = 52.57
2022-01-26 14:17:04.082 | DEBUG    | __main__:trials:24 - Trial = 8099/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.084 | DEBUG    | __main__:trials:29 - Trial = 8099/30000 | Total reward = 52.49
2022-01-26 14:17:04.088 | DEBUG    | __main__:trials:24 - Trial = 8100/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.088 | DEBUG    | __main__:trials:29 - Trial = 8100/30000 | Total reward = 51.47
2022-01-26 14:17:04.092 | DEBUG    | __main__:trials:24 - Trial = 8101/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.094 | DEBUG    | __main__:trials:29 - Trial = 8101/30000 | Total reward = 52.29
2022-01-26 14:17:04.098 | DEBUG    | __main__:trials:24 - Trial = 8102/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.100 | DEBUG    | __main__:trials:29 - Trial = 8102/30000 | Total reward = 51.65
2022-01-26 14:17:04.103 | DEBUG    | __main__:trials:24 - Trial = 8103/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.104 | DEBUG    | __main__:trials:29 - Trial = 8103/30000 | Total reward = 37.12
2022-01-26 14:17:04.108 | DEBUG    | __main__:trials:24 - Trial = 8104/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.110 | DEBUG    | __main__:trials:29 - Trial = 8104/30000 | Total reward = 38.16
2022-01-26 14:17:04.114 | DEBUG    | __main__:trials:24 - Trial = 8105/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.114 | DEBUG    | __main__:trials:29 - Trial = 8105/30000 | Total reward = 48.46
2022-01-26 14:17:04.118 | DEBUG    | __main__:trials:24 - Trial = 8106/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.120 | DEBUG    | __main__:trials:29 - Trial = 8106/30000 | Total reward = 33.39
2022-01-26 14:17:04.124 | DEBUG    | __main__:trials:24 - Trial = 8107/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.125 | DEBUG    | __main__:trials:29 - Trial = 8107/30000 | Total reward = 51.65
2022-01-26 14:17:04.129 | DEBUG    | __main__:trials:24 - Trial = 8108/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.131 | DEBUG    | __main__:trials:29 - Trial = 8108/30000 | Total reward = 55.10
2022-01-26 14:17:04.134 | DEBUG    | __main__:trials:24 - Trial = 8109/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.136 | DEBUG    | __main__:trials:29 - Trial = 8109/30000 | Total reward = 50.28
2022-01-26 14:17:04.140 | DEBUG    | __main__:trials:24 - Trial = 8110/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.141 | DEBUG    | __main__:trials:29 - Trial = 8110/30000 | Total reward = 47.21
2022-01-26 14:17:04.145 | DEBUG    | __main__:trials:24 - Trial = 8111/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.146 | DEBUG    | __main__:trials:29 - Trial = 8111/30000 | Total reward = 57.22
2022-01-26 14:17:04.150 | DEBUG    | __main__:trials:24 - Trial = 8112/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.151 | DEBUG    | __main__:trials:29 - Trial = 8112/30000 | Total reward = 31.95
2022-01-26 14:17:04.155 | DEBUG    | __main__:trials:24 - Trial = 8113/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.157 | DEBUG    | __main__:trials:29 - Trial = 8113/30000 | Total reward = 39.90
2022-01-26 14:17:04.160 | DEBUG    | __main__:trials:24 - Trial = 8114/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.162 | DEBUG    | __main__:trials:29 - Trial = 8114/30000 | Total reward = 46.89
2022-01-26 14:17:04.166 | DEBUG    | __main__:trials:24 - Trial = 8115/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.167 | DEBUG    | __main__:trials:29 - Trial = 8115/30000 | Total reward = 28.13
2022-01-26 14:17:04.169 | DEBUG    | __main__:trials:26 - Trial = 8116/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.171 | DEBUG    | __main__:trials:29 - Trial = 8116/30000 | Total reward = 15.24
2022-01-26 14:17:04.175 | DEBUG    | __main__:trials:24 - Trial = 8117/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.176 | DEBUG    | __main__:trials:29 - Trial = 8117/30000 | Total reward = 40.19
2022-01-26 14:17:04.179 | DEBUG    | __main__:trials:24 - Trial = 8118/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.181 | DEBUG    | __main__:trials:29 - Trial = 8118/30000 | Total reward = 42.71
2022-01-26 14:17:04.184 | DEBUG    | __main__:trials:24 - Trial = 8119/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.186 | DEBUG    | __main__:trials:29 - Trial = 8119/30000 | Total reward = 36.21
2022-01-26 14:17:04.190 | DEBUG    | __main__:trials:24 - Trial = 8120/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.191 | DEBUG    | __main__:trials:29 - Trial = 8120/30000 | Total reward = 28.60
2022-01-26 14:17:04.194 | DEBUG    | __main__:trials:24 - Trial = 8121/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.196 | DEBUG    | __main__:trials:29 - Trial = 8121/30000 | Total reward = 37.52
2022-01-26 14:17:04.200 | DEBUG    | __main__:trials:24 - Trial = 8122/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.201 | DEBUG    | __main__:trials:29 - Trial = 8122/30000 | Total reward = 49.07
2022-01-26 14:17:04.205 | DEBUG    | __main__:trials:24 - Trial = 8123/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.206 | DEBUG    | __main__:trials:29 - Trial = 8123/30000 | Total reward = 31.37
2022-01-26 14:17:04.210 | DEBUG    | __main__:trials:24 - Trial = 8124/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.212 | DEBUG    | __main__:trials:29 - Trial = 8124/30000 | Total reward = 31.74
2022-01-26 14:17:04.215 | DEBUG    | __main__:trials:24 - Trial = 8125/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.217 | DEBUG    | __main__:trials:29 - Trial = 8125/30000 | Total reward = 34.57
2022-01-26 14:17:04.220 | DEBUG    | __main__:trials:24 - Trial = 8126/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.221 | DEBUG    | __main__:trials:29 - Trial = 8126/30000 | Total reward = 38.64
2022-01-26 14:17:04.224 | DEBUG    | __main__:trials:24 - Trial = 8127/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.225 | DEBUG    | __main__:trials:29 - Trial = 8127/30000 | Total reward = 34.92
2022-01-26 14:17:04.229 | DEBUG    | __main__:trials:24 - Trial = 8128/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.229 | DEBUG    | __main__:trials:29 - Trial = 8128/30000 | Total reward = 51.47
2022-01-26 14:17:04.233 | DEBUG    | __main__:trials:24 - Trial = 8129/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.233 | DEBUG    | __main__:trials:29 - Trial = 8129/30000 | Total reward = 15.96
2022-01-26 14:17:04.237 | DEBUG    | __main__:trials:24 - Trial = 8130/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.239 | DEBUG    | __main__:trials:29 - Trial = 8130/30000 | Total reward = 40.66
2022-01-26 14:17:04.243 | DEBUG    | __main__:trials:24 - Trial = 8131/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.245 | DEBUG    | __main__:trials:29 - Trial = 8131/30000 | Total reward = 51.55
2022-01-26 14:17:04.247 | DEBUG    | __main__:trials:26 - Trial = 8132/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.249 | DEBUG    | __main__:trials:29 - Trial = 8132/30000 | Total reward = 12.57
2022-01-26 14:17:04.252 | DEBUG    | __main__:trials:24 - Trial = 8133/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.254 | DEBUG    | __main__:trials:29 - Trial = 8133/30000 | Total reward = 47.99
2022-01-26 14:17:04.257 | DEBUG    | __main__:trials:24 - Trial = 8134/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.258 | DEBUG    | __main__:trials:29 - Trial = 8134/30000 | Total reward = 41.65
2022-01-26 14:17:04.261 | DEBUG    | __main__:trials:24 - Trial = 8135/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.263 | DEBUG    | __main__:trials:29 - Trial = 8135/30000 | Total reward = 42.44
2022-01-26 14:17:04.267 | DEBUG    | __main__:trials:24 - Trial = 8136/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.268 | DEBUG    | __main__:trials:29 - Trial = 8136/30000 | Total reward = 48.59
2022-01-26 14:17:04.272 | DEBUG    | __main__:trials:24 - Trial = 8137/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.273 | DEBUG    | __main__:trials:29 - Trial = 8137/30000 | Total reward = 36.07
2022-01-26 14:17:04.277 | DEBUG    | __main__:trials:24 - Trial = 8138/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.278 | DEBUG    | __main__:trials:29 - Trial = 8138/30000 | Total reward = 43.82
2022-01-26 14:17:04.280 | DEBUG    | __main__:trials:24 - Trial = 8139/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.281 | DEBUG    | __main__:trials:29 - Trial = 8139/30000 | Total reward = 44.18
2022-01-26 14:17:04.285 | DEBUG    | __main__:trials:24 - Trial = 8140/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.287 | DEBUG    | __main__:trials:29 - Trial = 8140/30000 | Total reward = 38.31
2022-01-26 14:17:04.291 | DEBUG    | __main__:trials:24 - Trial = 8141/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.292 | DEBUG    | __main__:trials:29 - Trial = 8141/30000 | Total reward = 35.19
2022-01-26 14:17:04.296 | DEBUG    | __main__:trials:24 - Trial = 8142/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.298 | DEBUG    | __main__:trials:29 - Trial = 8142/30000 | Total reward = 40.78
2022-01-26 14:17:04.301 | DEBUG    | __main__:trials:24 - Trial = 8143/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.303 | DEBUG    | __main__:trials:29 - Trial = 8143/30000 | Total reward = 49.25
2022-01-26 14:17:04.306 | DEBUG    | __main__:trials:24 - Trial = 8144/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.308 | DEBUG    | __main__:trials:29 - Trial = 8144/30000 | Total reward = 30.55
2022-01-26 14:17:04.312 | DEBUG    | __main__:trials:24 - Trial = 8145/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.313 | DEBUG    | __main__:trials:29 - Trial = 8145/30000 | Total reward = 31.69
2022-01-26 14:17:04.316 | DEBUG    | __main__:trials:26 - Trial = 8146/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.317 | DEBUG    | __main__:trials:29 - Trial = 8146/30000 | Total reward = 11.11
2022-01-26 14:17:04.320 | DEBUG    | __main__:trials:24 - Trial = 8147/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.322 | DEBUG    | __main__:trials:29 - Trial = 8147/30000 | Total reward = 29.50
2022-01-26 14:17:04.326 | DEBUG    | __main__:trials:24 - Trial = 8148/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.327 | DEBUG    | __main__:trials:29 - Trial = 8148/30000 | Total reward = 30.69
2022-01-26 14:17:04.330 | DEBUG    | __main__:trials:24 - Trial = 8149/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.332 | DEBUG    | __main__:trials:29 - Trial = 8149/30000 | Total reward = 37.82
2022-01-26 14:17:04.336 | DEBUG    | __main__:trials:24 - Trial = 8150/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.337 | DEBUG    | __main__:trials:29 - Trial = 8150/30000 | Total reward = 34.25
2022-01-26 14:17:04.340 | DEBUG    | __main__:trials:24 - Trial = 8151/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.342 | DEBUG    | __main__:trials:29 - Trial = 8151/30000 | Total reward = 31.74
2022-01-26 14:17:04.346 | DEBUG    | __main__:trials:24 - Trial = 8152/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.347 | DEBUG    | __main__:trials:29 - Trial = 8152/30000 | Total reward = 38.44
2022-01-26 14:17:04.351 | DEBUG    | __main__:trials:24 - Trial = 8153/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.353 | DEBUG    | __main__:trials:29 - Trial = 8153/30000 | Total reward = 49.59
2022-01-26 14:17:04.356 | DEBUG    | __main__:trials:24 - Trial = 8154/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.358 | DEBUG    | __main__:trials:29 - Trial = 8154/30000 | Total reward = 41.79
2022-01-26 14:17:04.361 | DEBUG    | __main__:trials:24 - Trial = 8155/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.363 | DEBUG    | __main__:trials:29 - Trial = 8155/30000 | Total reward = 32.51
2022-01-26 14:17:04.367 | DEBUG    | __main__:trials:24 - Trial = 8156/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.368 | DEBUG    | __main__:trials:29 - Trial = 8156/30000 | Total reward = 32.36
2022-01-26 14:17:04.372 | DEBUG    | __main__:trials:24 - Trial = 8157/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.374 | DEBUG    | __main__:trials:29 - Trial = 8157/30000 | Total reward = 29.10
2022-01-26 14:17:04.378 | DEBUG    | __main__:trials:24 - Trial = 8158/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.380 | DEBUG    | __main__:trials:29 - Trial = 8158/30000 | Total reward = 35.02
2022-01-26 14:17:04.383 | DEBUG    | __main__:trials:24 - Trial = 8159/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.385 | DEBUG    | __main__:trials:29 - Trial = 8159/30000 | Total reward = 39.05
2022-01-26 14:17:04.388 | DEBUG    | __main__:trials:24 - Trial = 8160/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.390 | DEBUG    | __main__:trials:29 - Trial = 8160/30000 | Total reward = 27.07
2022-01-26 14:17:04.393 | DEBUG    | __main__:trials:24 - Trial = 8161/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.394 | DEBUG    | __main__:trials:29 - Trial = 8161/30000 | Total reward = 35.95
2022-01-26 14:17:04.397 | DEBUG    | __main__:trials:24 - Trial = 8162/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.399 | DEBUG    | __main__:trials:29 - Trial = 8162/30000 | Total reward = 49.08
2022-01-26 14:17:04.402 | DEBUG    | __main__:trials:24 - Trial = 8163/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.404 | DEBUG    | __main__:trials:29 - Trial = 8163/30000 | Total reward = 38.28
2022-01-26 14:17:04.408 | DEBUG    | __main__:trials:24 - Trial = 8164/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.409 | DEBUG    | __main__:trials:29 - Trial = 8164/30000 | Total reward = 33.28
2022-01-26 14:17:04.412 | DEBUG    | __main__:trials:24 - Trial = 8165/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.414 | DEBUG    | __main__:trials:29 - Trial = 8165/30000 | Total reward = 36.28
2022-01-26 14:17:04.418 | DEBUG    | __main__:trials:24 - Trial = 8166/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.419 | DEBUG    | __main__:trials:29 - Trial = 8166/30000 | Total reward = 33.27
2022-01-26 14:17:04.422 | DEBUG    | __main__:trials:24 - Trial = 8167/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.424 | DEBUG    | __main__:trials:29 - Trial = 8167/30000 | Total reward = 47.03
2022-01-26 14:17:04.428 | DEBUG    | __main__:trials:24 - Trial = 8168/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.429 | DEBUG    | __main__:trials:29 - Trial = 8168/30000 | Total reward = 29.57
2022-01-26 14:17:04.433 | DEBUG    | __main__:trials:24 - Trial = 8169/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.435 | DEBUG    | __main__:trials:29 - Trial = 8169/30000 | Total reward = 33.02
2022-01-26 14:17:04.439 | DEBUG    | __main__:trials:24 - Trial = 8170/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.440 | DEBUG    | __main__:trials:29 - Trial = 8170/30000 | Total reward = 52.39
2022-01-26 14:17:04.443 | DEBUG    | __main__:trials:24 - Trial = 8171/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.445 | DEBUG    | __main__:trials:29 - Trial = 8171/30000 | Total reward = 29.94
2022-01-26 14:17:04.449 | DEBUG    | __main__:trials:24 - Trial = 8172/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.449 | DEBUG    | __main__:trials:29 - Trial = 8172/30000 | Total reward = 27.82
2022-01-26 14:17:04.453 | DEBUG    | __main__:trials:24 - Trial = 8173/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.453 | DEBUG    | __main__:trials:29 - Trial = 8173/30000 | Total reward = 29.19
2022-01-26 14:17:04.457 | DEBUG    | __main__:trials:24 - Trial = 8174/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.459 | DEBUG    | __main__:trials:29 - Trial = 8174/30000 | Total reward = 42.05
2022-01-26 14:17:04.462 | DEBUG    | __main__:trials:24 - Trial = 8175/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.464 | DEBUG    | __main__:trials:29 - Trial = 8175/30000 | Total reward = 50.39
2022-01-26 14:17:04.467 | DEBUG    | __main__:trials:24 - Trial = 8176/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.469 | DEBUG    | __main__:trials:29 - Trial = 8176/30000 | Total reward = 39.57
2022-01-26 14:17:04.472 | DEBUG    | __main__:trials:24 - Trial = 8177/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.475 | DEBUG    | __main__:trials:29 - Trial = 8177/30000 | Total reward = 39.93
2022-01-26 14:17:04.478 | DEBUG    | __main__:trials:24 - Trial = 8178/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.480 | DEBUG    | __main__:trials:29 - Trial = 8178/30000 | Total reward = 47.62
2022-01-26 14:17:04.483 | DEBUG    | __main__:trials:24 - Trial = 8179/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.485 | DEBUG    | __main__:trials:29 - Trial = 8179/30000 | Total reward = 36.56
2022-01-26 14:17:04.488 | DEBUG    | __main__:trials:24 - Trial = 8180/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.490 | DEBUG    | __main__:trials:29 - Trial = 8180/30000 | Total reward = 41.94
2022-01-26 14:17:04.494 | DEBUG    | __main__:trials:24 - Trial = 8181/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.496 | DEBUG    | __main__:trials:29 - Trial = 8181/30000 | Total reward = 41.38
2022-01-26 14:17:04.500 | DEBUG    | __main__:trials:24 - Trial = 8182/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.501 | DEBUG    | __main__:trials:29 - Trial = 8182/30000 | Total reward = 32.06
2022-01-26 14:17:04.505 | DEBUG    | __main__:trials:24 - Trial = 8183/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.507 | DEBUG    | __main__:trials:29 - Trial = 8183/30000 | Total reward = 37.98
2022-01-26 14:17:04.510 | DEBUG    | __main__:trials:26 - Trial = 8184/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.511 | DEBUG    | __main__:trials:29 - Trial = 8184/30000 | Total reward = 17.32
2022-01-26 14:17:04.515 | DEBUG    | __main__:trials:24 - Trial = 8185/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.516 | DEBUG    | __main__:trials:29 - Trial = 8185/30000 | Total reward = 40.30
2022-01-26 14:17:04.520 | DEBUG    | __main__:trials:24 - Trial = 8186/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.522 | DEBUG    | __main__:trials:29 - Trial = 8186/30000 | Total reward = 39.96
2022-01-26 14:17:04.525 | DEBUG    | __main__:trials:24 - Trial = 8187/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.527 | DEBUG    | __main__:trials:29 - Trial = 8187/30000 | Total reward = 44.93
2022-01-26 14:17:04.531 | DEBUG    | __main__:trials:24 - Trial = 8188/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.532 | DEBUG    | __main__:trials:29 - Trial = 8188/30000 | Total reward = 43.26
2022-01-26 14:17:04.536 | DEBUG    | __main__:trials:24 - Trial = 8189/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.537 | DEBUG    | __main__:trials:29 - Trial = 8189/30000 | Total reward = 46.20
2022-01-26 14:17:04.541 | DEBUG    | __main__:trials:24 - Trial = 8190/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.541 | DEBUG    | __main__:trials:29 - Trial = 8190/30000 | Total reward = 43.61
2022-01-26 14:17:04.546 | DEBUG    | __main__:trials:24 - Trial = 8191/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.547 | DEBUG    | __main__:trials:29 - Trial = 8191/30000 | Total reward = 46.63
2022-01-26 14:17:04.551 | DEBUG    | __main__:trials:24 - Trial = 8192/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.553 | DEBUG    | __main__:trials:29 - Trial = 8192/30000 | Total reward = 32.34
2022-01-26 14:17:04.556 | DEBUG    | __main__:trials:24 - Trial = 8193/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.558 | DEBUG    | __main__:trials:29 - Trial = 8193/30000 | Total reward = 45.06
2022-01-26 14:17:04.561 | DEBUG    | __main__:trials:24 - Trial = 8194/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.563 | DEBUG    | __main__:trials:29 - Trial = 8194/30000 | Total reward = 37.47
2022-01-26 14:17:04.567 | DEBUG    | __main__:trials:24 - Trial = 8195/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.568 | DEBUG    | __main__:trials:29 - Trial = 8195/30000 | Total reward = 46.63
2022-01-26 14:17:04.571 | DEBUG    | __main__:trials:24 - Trial = 8196/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.573 | DEBUG    | __main__:trials:29 - Trial = 8196/30000 | Total reward = 44.53
2022-01-26 14:17:04.576 | DEBUG    | __main__:trials:24 - Trial = 8197/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.578 | DEBUG    | __main__:trials:29 - Trial = 8197/30000 | Total reward = 36.31
2022-01-26 14:17:04.582 | DEBUG    | __main__:trials:24 - Trial = 8198/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.583 | DEBUG    | __main__:trials:29 - Trial = 8198/30000 | Total reward = 47.76
2022-01-26 14:17:04.586 | DEBUG    | __main__:trials:24 - Trial = 8199/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.589 | DEBUG    | __main__:trials:29 - Trial = 8199/30000 | Total reward = 44.24
2022-01-26 14:17:04.593 | DEBUG    | __main__:trials:24 - Trial = 8200/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.594 | DEBUG    | __main__:trials:29 - Trial = 8200/30000 | Total reward = 42.71
2022-01-26 14:17:04.598 | DEBUG    | __main__:trials:24 - Trial = 8201/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.599 | DEBUG    | __main__:trials:29 - Trial = 8201/30000 | Total reward = 32.41
2022-01-26 14:17:04.603 | DEBUG    | __main__:trials:24 - Trial = 8202/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.605 | DEBUG    | __main__:trials:29 - Trial = 8202/30000 | Total reward = 42.93
2022-01-26 14:17:04.608 | DEBUG    | __main__:trials:24 - Trial = 8203/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.610 | DEBUG    | __main__:trials:29 - Trial = 8203/30000 | Total reward = 36.44
2022-01-26 14:17:04.614 | DEBUG    | __main__:trials:24 - Trial = 8204/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.615 | DEBUG    | __main__:trials:29 - Trial = 8204/30000 | Total reward = 37.09
2022-01-26 14:17:04.618 | DEBUG    | __main__:trials:24 - Trial = 8205/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.620 | DEBUG    | __main__:trials:29 - Trial = 8205/30000 | Total reward = 39.89
2022-01-26 14:17:04.624 | DEBUG    | __main__:trials:24 - Trial = 8206/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.626 | DEBUG    | __main__:trials:29 - Trial = 8206/30000 | Total reward = 46.76
2022-01-26 14:17:04.629 | DEBUG    | __main__:trials:24 - Trial = 8207/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.631 | DEBUG    | __main__:trials:29 - Trial = 8207/30000 | Total reward = 39.26
2022-01-26 14:17:04.634 | DEBUG    | __main__:trials:24 - Trial = 8208/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.636 | DEBUG    | __main__:trials:29 - Trial = 8208/30000 | Total reward = 48.80
2022-01-26 14:17:04.640 | DEBUG    | __main__:trials:24 - Trial = 8209/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.641 | DEBUG    | __main__:trials:29 - Trial = 8209/30000 | Total reward = 48.66
2022-01-26 14:17:04.644 | DEBUG    | __main__:trials:24 - Trial = 8210/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.646 | DEBUG    | __main__:trials:29 - Trial = 8210/30000 | Total reward = 41.44
2022-01-26 14:17:04.649 | DEBUG    | __main__:trials:24 - Trial = 8211/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.651 | DEBUG    | __main__:trials:29 - Trial = 8211/30000 | Total reward = 44.84
2022-01-26 14:17:04.653 | DEBUG    | __main__:trials:24 - Trial = 8212/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.654 | DEBUG    | __main__:trials:29 - Trial = 8212/30000 | Total reward = 39.09
2022-01-26 14:17:04.658 | DEBUG    | __main__:trials:24 - Trial = 8213/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.659 | DEBUG    | __main__:trials:29 - Trial = 8213/30000 | Total reward = 46.77
2022-01-26 14:17:04.663 | DEBUG    | __main__:trials:24 - Trial = 8214/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.664 | DEBUG    | __main__:trials:29 - Trial = 8214/30000 | Total reward = 62.95
2022-01-26 14:17:04.667 | DEBUG    | __main__:trials:24 - Trial = 8215/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.669 | DEBUG    | __main__:trials:29 - Trial = 8215/30000 | Total reward = 46.63
2022-01-26 14:17:04.672 | DEBUG    | __main__:trials:24 - Trial = 8216/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.675 | DEBUG    | __main__:trials:29 - Trial = 8216/30000 | Total reward = 36.73
2022-01-26 14:17:04.678 | DEBUG    | __main__:trials:24 - Trial = 8217/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.680 | DEBUG    | __main__:trials:29 - Trial = 8217/30000 | Total reward = 46.49
2022-01-26 14:17:04.684 | DEBUG    | __main__:trials:24 - Trial = 8218/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.686 | DEBUG    | __main__:trials:29 - Trial = 8218/30000 | Total reward = 47.42
2022-01-26 14:17:04.689 | DEBUG    | __main__:trials:24 - Trial = 8219/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.690 | DEBUG    | __main__:trials:29 - Trial = 8219/30000 | Total reward = 43.10
2022-01-26 14:17:04.694 | DEBUG    | __main__:trials:24 - Trial = 8220/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.696 | DEBUG    | __main__:trials:29 - Trial = 8220/30000 | Total reward = 49.23
2022-01-26 14:17:04.699 | DEBUG    | __main__:trials:24 - Trial = 8221/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.701 | DEBUG    | __main__:trials:29 - Trial = 8221/30000 | Total reward = 53.93
2022-01-26 14:17:04.704 | DEBUG    | __main__:trials:24 - Trial = 8222/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.705 | DEBUG    | __main__:trials:29 - Trial = 8222/30000 | Total reward = 32.22
2022-01-26 14:17:04.709 | DEBUG    | __main__:trials:24 - Trial = 8223/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.711 | DEBUG    | __main__:trials:29 - Trial = 8223/30000 | Total reward = 32.05
2022-01-26 14:17:04.715 | DEBUG    | __main__:trials:24 - Trial = 8224/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.716 | DEBUG    | __main__:trials:29 - Trial = 8224/30000 | Total reward = 41.28
2022-01-26 14:17:04.719 | DEBUG    | __main__:trials:24 - Trial = 8225/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.721 | DEBUG    | __main__:trials:29 - Trial = 8225/30000 | Total reward = 35.56
2022-01-26 14:17:04.725 | DEBUG    | __main__:trials:24 - Trial = 8226/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.727 | DEBUG    | __main__:trials:29 - Trial = 8226/30000 | Total reward = 43.60
2022-01-26 14:17:04.731 | DEBUG    | __main__:trials:24 - Trial = 8227/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.731 | DEBUG    | __main__:trials:29 - Trial = 8227/30000 | Total reward = 32.34
2022-01-26 14:17:04.736 | DEBUG    | __main__:trials:24 - Trial = 8228/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.737 | DEBUG    | __main__:trials:29 - Trial = 8228/30000 | Total reward = 55.46
2022-01-26 14:17:04.741 | DEBUG    | __main__:trials:24 - Trial = 8229/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.743 | DEBUG    | __main__:trials:29 - Trial = 8229/30000 | Total reward = 36.82
2022-01-26 14:17:04.746 | DEBUG    | __main__:trials:24 - Trial = 8230/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.748 | DEBUG    | __main__:trials:29 - Trial = 8230/30000 | Total reward = 52.06
2022-01-26 14:17:04.752 | DEBUG    | __main__:trials:26 - Trial = 8231/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.753 | DEBUG    | __main__:trials:29 - Trial = 8231/30000 | Total reward = 20.99
2022-01-26 14:17:04.757 | DEBUG    | __main__:trials:24 - Trial = 8232/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.758 | DEBUG    | __main__:trials:29 - Trial = 8232/30000 | Total reward = 32.58
2022-01-26 14:17:04.762 | DEBUG    | __main__:trials:24 - Trial = 8233/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.763 | DEBUG    | __main__:trials:29 - Trial = 8233/30000 | Total reward = 50.10
2022-01-26 14:17:04.766 | DEBUG    | __main__:trials:24 - Trial = 8234/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.767 | DEBUG    | __main__:trials:29 - Trial = 8234/30000 | Total reward = 32.09
2022-01-26 14:17:04.770 | DEBUG    | __main__:trials:24 - Trial = 8235/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.772 | DEBUG    | __main__:trials:29 - Trial = 8235/30000 | Total reward = 31.63
2022-01-26 14:17:04.776 | DEBUG    | __main__:trials:24 - Trial = 8236/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.778 | DEBUG    | __main__:trials:29 - Trial = 8236/30000 | Total reward = 44.19
2022-01-26 14:17:04.781 | DEBUG    | __main__:trials:24 - Trial = 8237/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.783 | DEBUG    | __main__:trials:29 - Trial = 8237/30000 | Total reward = 31.81
2022-01-26 14:17:04.786 | DEBUG    | __main__:trials:26 - Trial = 8238/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.788 | DEBUG    | __main__:trials:29 - Trial = 8238/30000 | Total reward = 25.01
2022-01-26 14:17:04.791 | DEBUG    | __main__:trials:24 - Trial = 8239/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.793 | DEBUG    | __main__:trials:29 - Trial = 8239/30000 | Total reward = 42.86
2022-01-26 14:17:04.796 | DEBUG    | __main__:trials:24 - Trial = 8240/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.798 | DEBUG    | __main__:trials:29 - Trial = 8240/30000 | Total reward = 44.39
2022-01-26 14:17:04.802 | DEBUG    | __main__:trials:24 - Trial = 8241/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.803 | DEBUG    | __main__:trials:29 - Trial = 8241/30000 | Total reward = 53.75
2022-01-26 14:17:04.806 | DEBUG    | __main__:trials:24 - Trial = 8242/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.808 | DEBUG    | __main__:trials:29 - Trial = 8242/30000 | Total reward = 66.55
2022-01-26 14:17:04.811 | DEBUG    | __main__:trials:24 - Trial = 8243/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.813 | DEBUG    | __main__:trials:29 - Trial = 8243/30000 | Total reward = 54.06
2022-01-26 14:17:04.816 | DEBUG    | __main__:trials:24 - Trial = 8244/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.818 | DEBUG    | __main__:trials:29 - Trial = 8244/30000 | Total reward = 29.42
2022-01-26 14:17:04.821 | DEBUG    | __main__:trials:24 - Trial = 8245/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.823 | DEBUG    | __main__:trials:29 - Trial = 8245/30000 | Total reward = 33.37
2022-01-26 14:17:04.826 | DEBUG    | __main__:trials:24 - Trial = 8246/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.828 | DEBUG    | __main__:trials:29 - Trial = 8246/30000 | Total reward = 49.27
2022-01-26 14:17:04.831 | DEBUG    | __main__:trials:24 - Trial = 8247/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.833 | DEBUG    | __main__:trials:29 - Trial = 8247/30000 | Total reward = 47.87
2022-01-26 14:17:04.836 | DEBUG    | __main__:trials:24 - Trial = 8248/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.837 | DEBUG    | __main__:trials:29 - Trial = 8248/30000 | Total reward = 58.65
2022-01-26 14:17:04.841 | DEBUG    | __main__:trials:24 - Trial = 8249/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.843 | DEBUG    | __main__:trials:29 - Trial = 8249/30000 | Total reward = 49.20
2022-01-26 14:17:04.846 | DEBUG    | __main__:trials:26 - Trial = 8250/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.848 | DEBUG    | __main__:trials:29 - Trial = 8250/30000 | Total reward = 34.42
2022-01-26 14:17:04.851 | DEBUG    | __main__:trials:24 - Trial = 8251/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.853 | DEBUG    | __main__:trials:29 - Trial = 8251/30000 | Total reward = 52.71
2022-01-26 14:17:04.856 | DEBUG    | __main__:trials:24 - Trial = 8252/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.857 | DEBUG    | __main__:trials:29 - Trial = 8252/30000 | Total reward = 50.56
2022-01-26 14:17:04.861 | DEBUG    | __main__:trials:24 - Trial = 8253/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.862 | DEBUG    | __main__:trials:29 - Trial = 8253/30000 | Total reward = 32.26
2022-01-26 14:17:04.866 | DEBUG    | __main__:trials:24 - Trial = 8254/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.867 | DEBUG    | __main__:trials:29 - Trial = 8254/30000 | Total reward = 32.55
2022-01-26 14:17:04.870 | DEBUG    | __main__:trials:24 - Trial = 8255/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.872 | DEBUG    | __main__:trials:29 - Trial = 8255/30000 | Total reward = 32.34
2022-01-26 14:17:04.876 | DEBUG    | __main__:trials:24 - Trial = 8256/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.877 | DEBUG    | __main__:trials:29 - Trial = 8256/30000 | Total reward = 39.32
2022-01-26 14:17:04.880 | DEBUG    | __main__:trials:24 - Trial = 8257/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.882 | DEBUG    | __main__:trials:29 - Trial = 8257/30000 | Total reward = 32.55
2022-01-26 14:17:04.885 | DEBUG    | __main__:trials:24 - Trial = 8258/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.887 | DEBUG    | __main__:trials:29 - Trial = 8258/30000 | Total reward = 34.27
2022-01-26 14:17:04.890 | DEBUG    | __main__:trials:24 - Trial = 8259/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.891 | DEBUG    | __main__:trials:29 - Trial = 8259/30000 | Total reward = 51.25
2022-01-26 14:17:04.895 | DEBUG    | __main__:trials:24 - Trial = 8260/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.897 | DEBUG    | __main__:trials:29 - Trial = 8260/30000 | Total reward = 50.85
2022-01-26 14:17:04.900 | DEBUG    | __main__:trials:24 - Trial = 8261/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.902 | DEBUG    | __main__:trials:29 - Trial = 8261/30000 | Total reward = 41.88
2022-01-26 14:17:04.905 | DEBUG    | __main__:trials:24 - Trial = 8262/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.907 | DEBUG    | __main__:trials:29 - Trial = 8262/30000 | Total reward = 58.49
2022-01-26 14:17:04.911 | DEBUG    | __main__:trials:24 - Trial = 8263/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.912 | DEBUG    | __main__:trials:29 - Trial = 8263/30000 | Total reward = 34.13
2022-01-26 14:17:04.916 | DEBUG    | __main__:trials:24 - Trial = 8264/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.918 | DEBUG    | __main__:trials:29 - Trial = 8264/30000 | Total reward = 30.20
2022-01-26 14:17:04.921 | DEBUG    | __main__:trials:24 - Trial = 8265/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.923 | DEBUG    | __main__:trials:29 - Trial = 8265/30000 | Total reward = 33.03
2022-01-26 14:17:04.926 | DEBUG    | __main__:trials:24 - Trial = 8266/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.928 | DEBUG    | __main__:trials:29 - Trial = 8266/30000 | Total reward = 50.43
2022-01-26 14:17:04.932 | DEBUG    | __main__:trials:24 - Trial = 8267/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.934 | DEBUG    | __main__:trials:29 - Trial = 8267/30000 | Total reward = 33.40
2022-01-26 14:17:04.937 | DEBUG    | __main__:trials:24 - Trial = 8268/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.938 | DEBUG    | __main__:trials:29 - Trial = 8268/30000 | Total reward = 52.66
2022-01-26 14:17:04.941 | DEBUG    | __main__:trials:24 - Trial = 8269/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.943 | DEBUG    | __main__:trials:29 - Trial = 8269/30000 | Total reward = 33.42
2022-01-26 14:17:04.946 | DEBUG    | __main__:trials:26 - Trial = 8270/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.947 | DEBUG    | __main__:trials:29 - Trial = 8270/30000 | Total reward = 29.64
2022-01-26 14:17:04.951 | DEBUG    | __main__:trials:24 - Trial = 8271/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.952 | DEBUG    | __main__:trials:29 - Trial = 8271/30000 | Total reward = 51.47
2022-01-26 14:17:04.956 | DEBUG    | __main__:trials:24 - Trial = 8272/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.957 | DEBUG    | __main__:trials:29 - Trial = 8272/30000 | Total reward = 47.22
2022-01-26 14:17:04.961 | DEBUG    | __main__:trials:24 - Trial = 8273/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.963 | DEBUG    | __main__:trials:29 - Trial = 8273/30000 | Total reward = 47.85
2022-01-26 14:17:04.966 | DEBUG    | __main__:trials:24 - Trial = 8274/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.968 | DEBUG    | __main__:trials:29 - Trial = 8274/30000 | Total reward = 51.55
2022-01-26 14:17:04.972 | DEBUG    | __main__:trials:24 - Trial = 8275/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.973 | DEBUG    | __main__:trials:29 - Trial = 8275/30000 | Total reward = 57.43
2022-01-26 14:17:04.977 | DEBUG    | __main__:trials:24 - Trial = 8276/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.979 | DEBUG    | __main__:trials:29 - Trial = 8276/30000 | Total reward = 60.86
2022-01-26 14:17:04.983 | DEBUG    | __main__:trials:24 - Trial = 8277/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.984 | DEBUG    | __main__:trials:29 - Trial = 8277/30000 | Total reward = 51.14
2022-01-26 14:17:04.987 | DEBUG    | __main__:trials:26 - Trial = 8278/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:04.989 | DEBUG    | __main__:trials:29 - Trial = 8278/30000 | Total reward = 17.57
2022-01-26 14:17:04.992 | DEBUG    | __main__:trials:24 - Trial = 8279/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.993 | DEBUG    | __main__:trials:29 - Trial = 8279/30000 | Total reward = 55.60
2022-01-26 14:17:04.997 | DEBUG    | __main__:trials:24 - Trial = 8280/30000 | Max number of steps (20) reached
2022-01-26 14:17:04.999 | DEBUG    | __main__:trials:29 - Trial = 8280/30000 | Total reward = 47.21
2022-01-26 14:17:05.002 | DEBUG    | __main__:trials:24 - Trial = 8281/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.004 | DEBUG    | __main__:trials:29 - Trial = 8281/30000 | Total reward = 44.51
2022-01-26 14:17:05.008 | DEBUG    | __main__:trials:24 - Trial = 8282/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.009 | DEBUG    | __main__:trials:29 - Trial = 8282/30000 | Total reward = 66.85
2022-01-26 14:17:05.013 | DEBUG    | __main__:trials:24 - Trial = 8283/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.014 | DEBUG    | __main__:trials:29 - Trial = 8283/30000 | Total reward = 45.28
2022-01-26 14:17:05.017 | DEBUG    | __main__:trials:24 - Trial = 8284/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.019 | DEBUG    | __main__:trials:29 - Trial = 8284/30000 | Total reward = 50.47
2022-01-26 14:17:05.022 | DEBUG    | __main__:trials:24 - Trial = 8285/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.024 | DEBUG    | __main__:trials:29 - Trial = 8285/30000 | Total reward = 36.95
2022-01-26 14:17:05.028 | DEBUG    | __main__:trials:24 - Trial = 8286/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.029 | DEBUG    | __main__:trials:29 - Trial = 8286/30000 | Total reward = 35.27
2022-01-26 14:17:05.032 | DEBUG    | __main__:trials:24 - Trial = 8287/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.034 | DEBUG    | __main__:trials:29 - Trial = 8287/30000 | Total reward = 43.88
2022-01-26 14:17:05.038 | DEBUG    | __main__:trials:24 - Trial = 8288/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.039 | DEBUG    | __main__:trials:29 - Trial = 8288/30000 | Total reward = 47.06
2022-01-26 14:17:05.043 | DEBUG    | __main__:trials:24 - Trial = 8289/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.045 | DEBUG    | __main__:trials:29 - Trial = 8289/30000 | Total reward = 59.43
2022-01-26 14:17:05.048 | DEBUG    | __main__:trials:24 - Trial = 8290/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.049 | DEBUG    | __main__:trials:29 - Trial = 8290/30000 | Total reward = 32.72
2022-01-26 14:17:05.053 | DEBUG    | __main__:trials:24 - Trial = 8291/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.053 | DEBUG    | __main__:trials:29 - Trial = 8291/30000 | Total reward = 37.24
2022-01-26 14:17:05.057 | DEBUG    | __main__:trials:24 - Trial = 8292/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.059 | DEBUG    | __main__:trials:29 - Trial = 8292/30000 | Total reward = 32.97
2022-01-26 14:17:05.062 | DEBUG    | __main__:trials:24 - Trial = 8293/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.064 | DEBUG    | __main__:trials:29 - Trial = 8293/30000 | Total reward = 29.50
2022-01-26 14:17:05.067 | DEBUG    | __main__:trials:24 - Trial = 8294/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.069 | DEBUG    | __main__:trials:29 - Trial = 8294/30000 | Total reward = 43.10
2022-01-26 14:17:05.072 | DEBUG    | __main__:trials:24 - Trial = 8295/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.074 | DEBUG    | __main__:trials:29 - Trial = 8295/30000 | Total reward = 32.26
2022-01-26 14:17:05.078 | DEBUG    | __main__:trials:24 - Trial = 8296/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.080 | DEBUG    | __main__:trials:29 - Trial = 8296/30000 | Total reward = 55.15
2022-01-26 14:17:05.083 | DEBUG    | __main__:trials:24 - Trial = 8297/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.085 | DEBUG    | __main__:trials:29 - Trial = 8297/30000 | Total reward = 60.63
2022-01-26 14:17:05.088 | DEBUG    | __main__:trials:24 - Trial = 8298/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.090 | DEBUG    | __main__:trials:29 - Trial = 8298/30000 | Total reward = 44.61
2022-01-26 14:17:05.094 | DEBUG    | __main__:trials:24 - Trial = 8299/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.095 | DEBUG    | __main__:trials:29 - Trial = 8299/30000 | Total reward = 45.65
2022-01-26 14:17:05.099 | DEBUG    | __main__:trials:24 - Trial = 8300/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.101 | DEBUG    | __main__:trials:29 - Trial = 8300/30000 | Total reward = 50.21
2022-01-26 14:17:05.105 | DEBUG    | __main__:trials:24 - Trial = 8301/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.106 | DEBUG    | __main__:trials:29 - Trial = 8301/30000 | Total reward = 46.15
2022-01-26 14:17:05.110 | DEBUG    | __main__:trials:24 - Trial = 8302/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.112 | DEBUG    | __main__:trials:29 - Trial = 8302/30000 | Total reward = 35.55
2022-01-26 14:17:05.115 | DEBUG    | __main__:trials:24 - Trial = 8303/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.116 | DEBUG    | __main__:trials:29 - Trial = 8303/30000 | Total reward = 32.81
2022-01-26 14:17:05.120 | DEBUG    | __main__:trials:24 - Trial = 8304/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.122 | DEBUG    | __main__:trials:29 - Trial = 8304/30000 | Total reward = 44.43
2022-01-26 14:17:05.125 | DEBUG    | __main__:trials:24 - Trial = 8305/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.127 | DEBUG    | __main__:trials:29 - Trial = 8305/30000 | Total reward = 45.03
2022-01-26 14:17:05.131 | DEBUG    | __main__:trials:24 - Trial = 8306/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.132 | DEBUG    | __main__:trials:29 - Trial = 8306/30000 | Total reward = 49.43
2022-01-26 14:17:05.136 | DEBUG    | __main__:trials:24 - Trial = 8307/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.137 | DEBUG    | __main__:trials:29 - Trial = 8307/30000 | Total reward = 54.98
2022-01-26 14:17:05.141 | DEBUG    | __main__:trials:24 - Trial = 8308/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.143 | DEBUG    | __main__:trials:29 - Trial = 8308/30000 | Total reward = 46.32
2022-01-26 14:17:05.146 | DEBUG    | __main__:trials:24 - Trial = 8309/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.148 | DEBUG    | __main__:trials:29 - Trial = 8309/30000 | Total reward = 63.66
2022-01-26 14:17:05.152 | DEBUG    | __main__:trials:24 - Trial = 8310/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.153 | DEBUG    | __main__:trials:29 - Trial = 8310/30000 | Total reward = 46.95
2022-01-26 14:17:05.157 | DEBUG    | __main__:trials:24 - Trial = 8311/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.157 | DEBUG    | __main__:trials:29 - Trial = 8311/30000 | Total reward = 40.01
2022-01-26 14:17:05.161 | DEBUG    | __main__:trials:26 - Trial = 8312/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:05.162 | DEBUG    | __main__:trials:29 - Trial = 8312/30000 | Total reward = 20.37
2022-01-26 14:17:05.166 | DEBUG    | __main__:trials:24 - Trial = 8313/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.168 | DEBUG    | __main__:trials:29 - Trial = 8313/30000 | Total reward = 44.52
2022-01-26 14:17:05.171 | DEBUG    | __main__:trials:24 - Trial = 8314/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.173 | DEBUG    | __main__:trials:29 - Trial = 8314/30000 | Total reward = 47.80
2022-01-26 14:17:05.176 | DEBUG    | __main__:trials:24 - Trial = 8315/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.178 | DEBUG    | __main__:trials:29 - Trial = 8315/30000 | Total reward = 44.96
2022-01-26 14:17:05.182 | DEBUG    | __main__:trials:24 - Trial = 8316/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.184 | DEBUG    | __main__:trials:29 - Trial = 8316/30000 | Total reward = 46.25
2022-01-26 14:17:05.187 | DEBUG    | __main__:trials:24 - Trial = 8317/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.189 | DEBUG    | __main__:trials:29 - Trial = 8317/30000 | Total reward = 42.73
2022-01-26 14:17:05.192 | DEBUG    | __main__:trials:24 - Trial = 8318/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.193 | DEBUG    | __main__:trials:29 - Trial = 8318/30000 | Total reward = 38.76
2022-01-26 14:17:05.197 | DEBUG    | __main__:trials:24 - Trial = 8319/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.197 | DEBUG    | __main__:trials:29 - Trial = 8319/30000 | Total reward = 43.27
2022-01-26 14:17:05.201 | DEBUG    | __main__:trials:24 - Trial = 8320/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.202 | DEBUG    | __main__:trials:29 - Trial = 8320/30000 | Total reward = 38.21
2022-01-26 14:17:05.205 | DEBUG    | __main__:trials:24 - Trial = 8321/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.207 | DEBUG    | __main__:trials:29 - Trial = 8321/30000 | Total reward = 46.95
2022-01-26 14:17:05.210 | DEBUG    | __main__:trials:24 - Trial = 8322/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.211 | DEBUG    | __main__:trials:29 - Trial = 8322/30000 | Total reward = 34.24
2022-01-26 14:17:05.215 | DEBUG    | __main__:trials:24 - Trial = 8323/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.216 | DEBUG    | __main__:trials:29 - Trial = 8323/30000 | Total reward = 52.33
2022-01-26 14:17:05.220 | DEBUG    | __main__:trials:24 - Trial = 8324/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.221 | DEBUG    | __main__:trials:29 - Trial = 8324/30000 | Total reward = 51.45
2022-01-26 14:17:05.225 | DEBUG    | __main__:trials:24 - Trial = 8325/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.226 | DEBUG    | __main__:trials:29 - Trial = 8325/30000 | Total reward = 41.07
2022-01-26 14:17:05.230 | DEBUG    | __main__:trials:24 - Trial = 8326/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.231 | DEBUG    | __main__:trials:29 - Trial = 8326/30000 | Total reward = 29.77
2022-01-26 14:17:05.235 | DEBUG    | __main__:trials:24 - Trial = 8327/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.237 | DEBUG    | __main__:trials:29 - Trial = 8327/30000 | Total reward = 29.28
2022-01-26 14:17:05.240 | DEBUG    | __main__:trials:24 - Trial = 8328/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.242 | DEBUG    | __main__:trials:29 - Trial = 8328/30000 | Total reward = 30.48
2022-01-26 14:17:05.245 | DEBUG    | __main__:trials:24 - Trial = 8329/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.247 | DEBUG    | __main__:trials:29 - Trial = 8329/30000 | Total reward = 44.62
2022-01-26 14:17:05.251 | DEBUG    | __main__:trials:24 - Trial = 8330/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.252 | DEBUG    | __main__:trials:29 - Trial = 8330/30000 | Total reward = 51.52
2022-01-26 14:17:05.256 | DEBUG    | __main__:trials:24 - Trial = 8331/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.257 | DEBUG    | __main__:trials:29 - Trial = 8331/30000 | Total reward = 57.59
2022-01-26 14:17:05.261 | DEBUG    | __main__:trials:24 - Trial = 8332/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.263 | DEBUG    | __main__:trials:29 - Trial = 8332/30000 | Total reward = 50.23
2022-01-26 14:17:05.267 | DEBUG    | __main__:trials:24 - Trial = 8333/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.268 | DEBUG    | __main__:trials:29 - Trial = 8333/30000 | Total reward = 40.71
2022-01-26 14:17:05.271 | DEBUG    | __main__:trials:24 - Trial = 8334/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.273 | DEBUG    | __main__:trials:29 - Trial = 8334/30000 | Total reward = 40.74
2022-01-26 14:17:05.276 | DEBUG    | __main__:trials:24 - Trial = 8335/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.278 | DEBUG    | __main__:trials:29 - Trial = 8335/30000 | Total reward = 52.61
2022-01-26 14:17:05.282 | DEBUG    | __main__:trials:24 - Trial = 8336/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.283 | DEBUG    | __main__:trials:29 - Trial = 8336/30000 | Total reward = 49.32
2022-01-26 14:17:05.287 | DEBUG    | __main__:trials:24 - Trial = 8337/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.288 | DEBUG    | __main__:trials:29 - Trial = 8337/30000 | Total reward = 50.01
2022-01-26 14:17:05.292 | DEBUG    | __main__:trials:24 - Trial = 8338/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.293 | DEBUG    | __main__:trials:29 - Trial = 8338/30000 | Total reward = 52.29
2022-01-26 14:17:05.297 | DEBUG    | __main__:trials:24 - Trial = 8339/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.299 | DEBUG    | __main__:trials:29 - Trial = 8339/30000 | Total reward = 46.95
2022-01-26 14:17:05.302 | DEBUG    | __main__:trials:24 - Trial = 8340/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.304 | DEBUG    | __main__:trials:29 - Trial = 8340/30000 | Total reward = 38.11
2022-01-26 14:17:05.308 | DEBUG    | __main__:trials:24 - Trial = 8341/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.310 | DEBUG    | __main__:trials:29 - Trial = 8341/30000 | Total reward = 57.58
2022-01-26 14:17:05.314 | DEBUG    | __main__:trials:24 - Trial = 8342/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.315 | DEBUG    | __main__:trials:29 - Trial = 8342/30000 | Total reward = 57.70
2022-01-26 14:17:05.319 | DEBUG    | __main__:trials:24 - Trial = 8343/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.320 | DEBUG    | __main__:trials:29 - Trial = 8343/30000 | Total reward = 58.12
2022-01-26 14:17:05.324 | DEBUG    | __main__:trials:24 - Trial = 8344/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.326 | DEBUG    | __main__:trials:29 - Trial = 8344/30000 | Total reward = 51.08
2022-01-26 14:17:05.329 | DEBUG    | __main__:trials:24 - Trial = 8345/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.331 | DEBUG    | __main__:trials:29 - Trial = 8345/30000 | Total reward = 61.47
2022-01-26 14:17:05.335 | DEBUG    | __main__:trials:24 - Trial = 8346/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.336 | DEBUG    | __main__:trials:29 - Trial = 8346/30000 | Total reward = 51.15
2022-01-26 14:17:05.340 | DEBUG    | __main__:trials:24 - Trial = 8347/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.342 | DEBUG    | __main__:trials:29 - Trial = 8347/30000 | Total reward = 55.05
2022-01-26 14:17:05.345 | DEBUG    | __main__:trials:24 - Trial = 8348/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.347 | DEBUG    | __main__:trials:29 - Trial = 8348/30000 | Total reward = 52.07
2022-01-26 14:17:05.350 | DEBUG    | __main__:trials:24 - Trial = 8349/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.352 | DEBUG    | __main__:trials:29 - Trial = 8349/30000 | Total reward = 52.02
2022-01-26 14:17:05.356 | DEBUG    | __main__:trials:24 - Trial = 8350/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.357 | DEBUG    | __main__:trials:29 - Trial = 8350/30000 | Total reward = 51.65
2022-01-26 14:17:05.361 | DEBUG    | __main__:trials:24 - Trial = 8351/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.362 | DEBUG    | __main__:trials:29 - Trial = 8351/30000 | Total reward = 49.66
2022-01-26 14:17:05.366 | DEBUG    | __main__:trials:24 - Trial = 8352/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.368 | DEBUG    | __main__:trials:29 - Trial = 8352/30000 | Total reward = 47.25
2022-01-26 14:17:05.371 | DEBUG    | __main__:trials:24 - Trial = 8353/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.373 | DEBUG    | __main__:trials:29 - Trial = 8353/30000 | Total reward = 48.56
2022-01-26 14:17:05.377 | DEBUG    | __main__:trials:24 - Trial = 8354/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.378 | DEBUG    | __main__:trials:29 - Trial = 8354/30000 | Total reward = 45.03
2022-01-26 14:17:05.382 | DEBUG    | __main__:trials:24 - Trial = 8355/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.382 | DEBUG    | __main__:trials:29 - Trial = 8355/30000 | Total reward = 45.22
2022-01-26 14:17:05.387 | DEBUG    | __main__:trials:24 - Trial = 8356/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.388 | DEBUG    | __main__:trials:29 - Trial = 8356/30000 | Total reward = 39.68
2022-01-26 14:17:05.392 | DEBUG    | __main__:trials:24 - Trial = 8357/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.393 | DEBUG    | __main__:trials:29 - Trial = 8357/30000 | Total reward = 39.89
2022-01-26 14:17:05.397 | DEBUG    | __main__:trials:24 - Trial = 8358/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.398 | DEBUG    | __main__:trials:29 - Trial = 8358/30000 | Total reward = 31.52
2022-01-26 14:17:05.402 | DEBUG    | __main__:trials:24 - Trial = 8359/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.404 | DEBUG    | __main__:trials:29 - Trial = 8359/30000 | Total reward = 57.35
2022-01-26 14:17:05.407 | DEBUG    | __main__:trials:24 - Trial = 8360/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.409 | DEBUG    | __main__:trials:29 - Trial = 8360/30000 | Total reward = 44.63
2022-01-26 14:17:05.412 | DEBUG    | __main__:trials:24 - Trial = 8361/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.414 | DEBUG    | __main__:trials:29 - Trial = 8361/30000 | Total reward = 44.92
2022-01-26 14:17:05.418 | DEBUG    | __main__:trials:24 - Trial = 8362/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.420 | DEBUG    | __main__:trials:29 - Trial = 8362/30000 | Total reward = 36.46
2022-01-26 14:17:05.423 | DEBUG    | __main__:trials:24 - Trial = 8363/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.425 | DEBUG    | __main__:trials:29 - Trial = 8363/30000 | Total reward = 48.71
2022-01-26 14:17:05.428 | DEBUG    | __main__:trials:24 - Trial = 8364/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.430 | DEBUG    | __main__:trials:29 - Trial = 8364/30000 | Total reward = 39.58
2022-01-26 14:17:05.434 | DEBUG    | __main__:trials:24 - Trial = 8365/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.435 | DEBUG    | __main__:trials:29 - Trial = 8365/30000 | Total reward = 38.18
2022-01-26 14:17:05.439 | DEBUG    | __main__:trials:24 - Trial = 8366/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.440 | DEBUG    | __main__:trials:29 - Trial = 8366/30000 | Total reward = 43.68
2022-01-26 14:17:05.443 | DEBUG    | __main__:trials:24 - Trial = 8367/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.445 | DEBUG    | __main__:trials:29 - Trial = 8367/30000 | Total reward = 45.98
2022-01-26 14:17:05.449 | DEBUG    | __main__:trials:24 - Trial = 8368/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.450 | DEBUG    | __main__:trials:29 - Trial = 8368/30000 | Total reward = 39.68
2022-01-26 14:17:05.454 | DEBUG    | __main__:trials:24 - Trial = 8369/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.456 | DEBUG    | __main__:trials:29 - Trial = 8369/30000 | Total reward = 43.57
2022-01-26 14:17:05.460 | DEBUG    | __main__:trials:24 - Trial = 8370/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.461 | DEBUG    | __main__:trials:29 - Trial = 8370/30000 | Total reward = 68.95
2022-01-26 14:17:05.464 | DEBUG    | __main__:trials:24 - Trial = 8371/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.466 | DEBUG    | __main__:trials:29 - Trial = 8371/30000 | Total reward = 39.91
2022-01-26 14:17:05.470 | DEBUG    | __main__:trials:24 - Trial = 8372/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.471 | DEBUG    | __main__:trials:29 - Trial = 8372/30000 | Total reward = 47.86
2022-01-26 14:17:05.475 | DEBUG    | __main__:trials:24 - Trial = 8373/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.477 | DEBUG    | __main__:trials:29 - Trial = 8373/30000 | Total reward = 46.95
2022-01-26 14:17:05.481 | DEBUG    | __main__:trials:24 - Trial = 8374/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.482 | DEBUG    | __main__:trials:29 - Trial = 8374/30000 | Total reward = 42.09
2022-01-26 14:17:05.486 | DEBUG    | __main__:trials:24 - Trial = 8375/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.487 | DEBUG    | __main__:trials:29 - Trial = 8375/30000 | Total reward = 47.87
2022-01-26 14:17:05.490 | DEBUG    | __main__:trials:24 - Trial = 8376/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.492 | DEBUG    | __main__:trials:29 - Trial = 8376/30000 | Total reward = 31.45
2022-01-26 14:17:05.495 | DEBUG    | __main__:trials:24 - Trial = 8377/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.497 | DEBUG    | __main__:trials:29 - Trial = 8377/30000 | Total reward = 43.50
2022-01-26 14:17:05.500 | DEBUG    | __main__:trials:24 - Trial = 8378/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.502 | DEBUG    | __main__:trials:29 - Trial = 8378/30000 | Total reward = 45.08
2022-01-26 14:17:05.506 | DEBUG    | __main__:trials:24 - Trial = 8379/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.507 | DEBUG    | __main__:trials:29 - Trial = 8379/30000 | Total reward = 40.80
2022-01-26 14:17:05.511 | DEBUG    | __main__:trials:24 - Trial = 8380/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.513 | DEBUG    | __main__:trials:29 - Trial = 8380/30000 | Total reward = 41.37
2022-01-26 14:17:05.516 | DEBUG    | __main__:trials:24 - Trial = 8381/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.518 | DEBUG    | __main__:trials:29 - Trial = 8381/30000 | Total reward = 47.21
2022-01-26 14:17:05.521 | DEBUG    | __main__:trials:24 - Trial = 8382/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.523 | DEBUG    | __main__:trials:29 - Trial = 8382/30000 | Total reward = 60.74
2022-01-26 14:17:05.527 | DEBUG    | __main__:trials:24 - Trial = 8383/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.528 | DEBUG    | __main__:trials:29 - Trial = 8383/30000 | Total reward = 32.82
2022-01-26 14:17:05.531 | DEBUG    | __main__:trials:24 - Trial = 8384/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.533 | DEBUG    | __main__:trials:29 - Trial = 8384/30000 | Total reward = 52.82
2022-01-26 14:17:05.536 | DEBUG    | __main__:trials:24 - Trial = 8385/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.537 | DEBUG    | __main__:trials:29 - Trial = 8385/30000 | Total reward = 50.05
2022-01-26 14:17:05.541 | DEBUG    | __main__:trials:24 - Trial = 8386/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.542 | DEBUG    | __main__:trials:29 - Trial = 8386/30000 | Total reward = 49.47
2022-01-26 14:17:05.546 | DEBUG    | __main__:trials:24 - Trial = 8387/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.547 | DEBUG    | __main__:trials:29 - Trial = 8387/30000 | Total reward = 47.21
2022-01-26 14:17:05.551 | DEBUG    | __main__:trials:24 - Trial = 8388/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.551 | DEBUG    | __main__:trials:29 - Trial = 8388/30000 | Total reward = 48.15
2022-01-26 14:17:05.555 | DEBUG    | __main__:trials:24 - Trial = 8389/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.557 | DEBUG    | __main__:trials:29 - Trial = 8389/30000 | Total reward = 51.95
2022-01-26 14:17:05.560 | DEBUG    | __main__:trials:24 - Trial = 8390/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.561 | DEBUG    | __main__:trials:29 - Trial = 8390/30000 | Total reward = 47.38
2022-01-26 14:17:05.564 | DEBUG    | __main__:trials:24 - Trial = 8391/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.566 | DEBUG    | __main__:trials:29 - Trial = 8391/30000 | Total reward = 57.07
2022-01-26 14:17:05.569 | DEBUG    | __main__:trials:24 - Trial = 8392/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.570 | DEBUG    | __main__:trials:29 - Trial = 8392/30000 | Total reward = 46.62
2022-01-26 14:17:05.573 | DEBUG    | __main__:trials:24 - Trial = 8393/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.575 | DEBUG    | __main__:trials:29 - Trial = 8393/30000 | Total reward = 46.28
2022-01-26 14:17:05.578 | DEBUG    | __main__:trials:24 - Trial = 8394/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.580 | DEBUG    | __main__:trials:29 - Trial = 8394/30000 | Total reward = 32.14
2022-01-26 14:17:05.584 | DEBUG    | __main__:trials:24 - Trial = 8395/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.585 | DEBUG    | __main__:trials:29 - Trial = 8395/30000 | Total reward = 46.36
2022-01-26 14:17:05.589 | DEBUG    | __main__:trials:24 - Trial = 8396/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.590 | DEBUG    | __main__:trials:29 - Trial = 8396/30000 | Total reward = 45.03
2022-01-26 14:17:05.593 | DEBUG    | __main__:trials:26 - Trial = 8397/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:05.593 | DEBUG    | __main__:trials:29 - Trial = 8397/30000 | Total reward = 33.23
2022-01-26 14:17:05.597 | DEBUG    | __main__:trials:24 - Trial = 8398/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.599 | DEBUG    | __main__:trials:29 - Trial = 8398/30000 | Total reward = 47.62
2022-01-26 14:17:05.602 | DEBUG    | __main__:trials:24 - Trial = 8399/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.603 | DEBUG    | __main__:trials:29 - Trial = 8399/30000 | Total reward = 42.85
2022-01-26 14:17:05.607 | DEBUG    | __main__:trials:24 - Trial = 8400/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.608 | DEBUG    | __main__:trials:29 - Trial = 8400/30000 | Total reward = 46.30
2022-01-26 14:17:05.611 | DEBUG    | __main__:trials:24 - Trial = 8401/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.613 | DEBUG    | __main__:trials:29 - Trial = 8401/30000 | Total reward = 45.37
2022-01-26 14:17:05.617 | DEBUG    | __main__:trials:24 - Trial = 8402/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.618 | DEBUG    | __main__:trials:29 - Trial = 8402/30000 | Total reward = 47.21
2022-01-26 14:17:05.622 | DEBUG    | __main__:trials:24 - Trial = 8403/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.623 | DEBUG    | __main__:trials:29 - Trial = 8403/30000 | Total reward = 30.15
2022-01-26 14:17:05.627 | DEBUG    | __main__:trials:24 - Trial = 8404/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.628 | DEBUG    | __main__:trials:29 - Trial = 8404/30000 | Total reward = 48.10
2022-01-26 14:17:05.631 | DEBUG    | __main__:trials:24 - Trial = 8405/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.633 | DEBUG    | __main__:trials:29 - Trial = 8405/30000 | Total reward = 47.39
2022-01-26 14:17:05.637 | DEBUG    | __main__:trials:24 - Trial = 8406/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.638 | DEBUG    | __main__:trials:29 - Trial = 8406/30000 | Total reward = 46.22
2022-01-26 14:17:05.642 | DEBUG    | __main__:trials:24 - Trial = 8407/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.644 | DEBUG    | __main__:trials:29 - Trial = 8407/30000 | Total reward = 59.89
2022-01-26 14:17:05.647 | DEBUG    | __main__:trials:24 - Trial = 8408/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.649 | DEBUG    | __main__:trials:29 - Trial = 8408/30000 | Total reward = 30.44
2022-01-26 14:17:05.652 | DEBUG    | __main__:trials:24 - Trial = 8409/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.654 | DEBUG    | __main__:trials:29 - Trial = 8409/30000 | Total reward = 36.16
2022-01-26 14:17:05.658 | DEBUG    | __main__:trials:24 - Trial = 8410/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.659 | DEBUG    | __main__:trials:29 - Trial = 8410/30000 | Total reward = 38.66
2022-01-26 14:17:05.662 | DEBUG    | __main__:trials:26 - Trial = 8411/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:05.664 | DEBUG    | __main__:trials:29 - Trial = 8411/30000 | Total reward = 21.36
2022-01-26 14:17:05.667 | DEBUG    | __main__:trials:24 - Trial = 8412/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.668 | DEBUG    | __main__:trials:29 - Trial = 8412/30000 | Total reward = 53.69
2022-01-26 14:17:05.672 | DEBUG    | __main__:trials:24 - Trial = 8413/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.674 | DEBUG    | __main__:trials:29 - Trial = 8413/30000 | Total reward = 34.00
2022-01-26 14:17:05.678 | DEBUG    | __main__:trials:24 - Trial = 8414/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.679 | DEBUG    | __main__:trials:29 - Trial = 8414/30000 | Total reward = 36.42
2022-01-26 14:17:05.683 | DEBUG    | __main__:trials:24 - Trial = 8415/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.684 | DEBUG    | __main__:trials:29 - Trial = 8415/30000 | Total reward = 49.01
2022-01-26 14:17:05.688 | DEBUG    | __main__:trials:24 - Trial = 8416/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.689 | DEBUG    | __main__:trials:29 - Trial = 8416/30000 | Total reward = 45.98
2022-01-26 14:17:05.693 | DEBUG    | __main__:trials:24 - Trial = 8417/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.694 | DEBUG    | __main__:trials:29 - Trial = 8417/30000 | Total reward = 51.85
2022-01-26 14:17:05.697 | DEBUG    | __main__:trials:26 - Trial = 8418/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:05.698 | DEBUG    | __main__:trials:29 - Trial = 8418/30000 | Total reward = 25.25
2022-01-26 14:17:05.701 | DEBUG    | __main__:trials:24 - Trial = 8419/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.703 | DEBUG    | __main__:trials:29 - Trial = 8419/30000 | Total reward = 43.96
2022-01-26 14:17:05.705 | DEBUG    | __main__:trials:24 - Trial = 8420/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.707 | DEBUG    | __main__:trials:29 - Trial = 8420/30000 | Total reward = 48.40
2022-01-26 14:17:05.710 | DEBUG    | __main__:trials:24 - Trial = 8421/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.712 | DEBUG    | __main__:trials:29 - Trial = 8421/30000 | Total reward = 44.83
2022-01-26 14:17:05.715 | DEBUG    | __main__:trials:24 - Trial = 8422/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.717 | DEBUG    | __main__:trials:29 - Trial = 8422/30000 | Total reward = 46.41
2022-01-26 14:17:05.720 | DEBUG    | __main__:trials:24 - Trial = 8423/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.722 | DEBUG    | __main__:trials:29 - Trial = 8423/30000 | Total reward = 53.36
2022-01-26 14:17:05.725 | DEBUG    | __main__:trials:24 - Trial = 8424/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.727 | DEBUG    | __main__:trials:29 - Trial = 8424/30000 | Total reward = 48.79
2022-01-26 14:17:05.730 | DEBUG    | __main__:trials:24 - Trial = 8425/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.732 | DEBUG    | __main__:trials:29 - Trial = 8425/30000 | Total reward = 49.13
2022-01-26 14:17:05.736 | DEBUG    | __main__:trials:24 - Trial = 8426/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.737 | DEBUG    | __main__:trials:29 - Trial = 8426/30000 | Total reward = 37.79
2022-01-26 14:17:05.740 | DEBUG    | __main__:trials:24 - Trial = 8427/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.741 | DEBUG    | __main__:trials:29 - Trial = 8427/30000 | Total reward = 47.66
2022-01-26 14:17:05.746 | DEBUG    | __main__:trials:24 - Trial = 8428/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.747 | DEBUG    | __main__:trials:29 - Trial = 8428/30000 | Total reward = 45.42
2022-01-26 14:17:05.750 | DEBUG    | __main__:trials:24 - Trial = 8429/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.752 | DEBUG    | __main__:trials:29 - Trial = 8429/30000 | Total reward = 43.67
2022-01-26 14:17:05.755 | DEBUG    | __main__:trials:24 - Trial = 8430/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.756 | DEBUG    | __main__:trials:29 - Trial = 8430/30000 | Total reward = 43.51
2022-01-26 14:17:05.761 | DEBUG    | __main__:trials:24 - Trial = 8431/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.763 | DEBUG    | __main__:trials:29 - Trial = 8431/30000 | Total reward = 51.14
2022-01-26 14:17:05.766 | DEBUG    | __main__:trials:24 - Trial = 8432/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.768 | DEBUG    | __main__:trials:29 - Trial = 8432/30000 | Total reward = 47.21
2022-01-26 14:17:05.771 | DEBUG    | __main__:trials:24 - Trial = 8433/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.773 | DEBUG    | __main__:trials:29 - Trial = 8433/30000 | Total reward = 43.99
2022-01-26 14:17:05.776 | DEBUG    | __main__:trials:24 - Trial = 8434/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.777 | DEBUG    | __main__:trials:29 - Trial = 8434/30000 | Total reward = 51.73
2022-01-26 14:17:05.780 | DEBUG    | __main__:trials:24 - Trial = 8435/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.781 | DEBUG    | __main__:trials:29 - Trial = 8435/30000 | Total reward = 46.33
2022-01-26 14:17:05.785 | DEBUG    | __main__:trials:24 - Trial = 8436/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.786 | DEBUG    | __main__:trials:29 - Trial = 8436/30000 | Total reward = 37.99
2022-01-26 14:17:05.790 | DEBUG    | __main__:trials:24 - Trial = 8437/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.791 | DEBUG    | __main__:trials:29 - Trial = 8437/30000 | Total reward = 47.16
2022-01-26 14:17:05.794 | DEBUG    | __main__:trials:24 - Trial = 8438/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.796 | DEBUG    | __main__:trials:29 - Trial = 8438/30000 | Total reward = 43.39
2022-01-26 14:17:05.800 | DEBUG    | __main__:trials:24 - Trial = 8439/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.802 | DEBUG    | __main__:trials:29 - Trial = 8439/30000 | Total reward = 52.05
2022-01-26 14:17:05.804 | DEBUG    | __main__:trials:24 - Trial = 8440/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.805 | DEBUG    | __main__:trials:29 - Trial = 8440/30000 | Total reward = 46.41
2022-01-26 14:17:05.808 | DEBUG    | __main__:trials:24 - Trial = 8441/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.810 | DEBUG    | __main__:trials:29 - Trial = 8441/30000 | Total reward = 52.51
2022-01-26 14:17:05.813 | DEBUG    | __main__:trials:24 - Trial = 8442/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.815 | DEBUG    | __main__:trials:29 - Trial = 8442/30000 | Total reward = 48.92
2022-01-26 14:17:05.819 | DEBUG    | __main__:trials:24 - Trial = 8443/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.821 | DEBUG    | __main__:trials:29 - Trial = 8443/30000 | Total reward = 48.93
2022-01-26 14:17:05.824 | DEBUG    | __main__:trials:24 - Trial = 8444/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.826 | DEBUG    | __main__:trials:29 - Trial = 8444/30000 | Total reward = 32.36
2022-01-26 14:17:05.829 | DEBUG    | __main__:trials:24 - Trial = 8445/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.831 | DEBUG    | __main__:trials:29 - Trial = 8445/30000 | Total reward = 48.66
2022-01-26 14:17:05.835 | DEBUG    | __main__:trials:24 - Trial = 8446/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.837 | DEBUG    | __main__:trials:29 - Trial = 8446/30000 | Total reward = 50.29
2022-01-26 14:17:05.840 | DEBUG    | __main__:trials:24 - Trial = 8447/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.842 | DEBUG    | __main__:trials:29 - Trial = 8447/30000 | Total reward = 52.70
2022-01-26 14:17:05.845 | DEBUG    | __main__:trials:24 - Trial = 8448/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.847 | DEBUG    | __main__:trials:29 - Trial = 8448/30000 | Total reward = 50.72
2022-01-26 14:17:05.850 | DEBUG    | __main__:trials:24 - Trial = 8449/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.852 | DEBUG    | __main__:trials:29 - Trial = 8449/30000 | Total reward = 46.70
2022-01-26 14:17:05.855 | DEBUG    | __main__:trials:24 - Trial = 8450/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.857 | DEBUG    | __main__:trials:29 - Trial = 8450/30000 | Total reward = 26.82
2022-01-26 14:17:05.861 | DEBUG    | __main__:trials:24 - Trial = 8451/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.862 | DEBUG    | __main__:trials:29 - Trial = 8451/30000 | Total reward = 45.49
2022-01-26 14:17:05.865 | DEBUG    | __main__:trials:24 - Trial = 8452/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.866 | DEBUG    | __main__:trials:29 - Trial = 8452/30000 | Total reward = 48.37
2022-01-26 14:17:05.869 | DEBUG    | __main__:trials:24 - Trial = 8453/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.870 | DEBUG    | __main__:trials:29 - Trial = 8453/30000 | Total reward = 59.55
2022-01-26 14:17:05.874 | DEBUG    | __main__:trials:24 - Trial = 8454/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.876 | DEBUG    | __main__:trials:29 - Trial = 8454/30000 | Total reward = 47.80
2022-01-26 14:17:05.879 | DEBUG    | __main__:trials:24 - Trial = 8455/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.881 | DEBUG    | __main__:trials:29 - Trial = 8455/30000 | Total reward = 47.81
2022-01-26 14:17:05.884 | DEBUG    | __main__:trials:24 - Trial = 8456/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.885 | DEBUG    | __main__:trials:29 - Trial = 8456/30000 | Total reward = 55.38
2022-01-26 14:17:05.888 | DEBUG    | __main__:trials:24 - Trial = 8457/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.890 | DEBUG    | __main__:trials:29 - Trial = 8457/30000 | Total reward = 49.70
2022-01-26 14:17:05.894 | DEBUG    | __main__:trials:24 - Trial = 8458/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.896 | DEBUG    | __main__:trials:29 - Trial = 8458/30000 | Total reward = 47.21
2022-01-26 14:17:05.899 | DEBUG    | __main__:trials:24 - Trial = 8459/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.901 | DEBUG    | __main__:trials:29 - Trial = 8459/30000 | Total reward = 28.32
2022-01-26 14:17:05.904 | DEBUG    | __main__:trials:24 - Trial = 8460/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.905 | DEBUG    | __main__:trials:29 - Trial = 8460/30000 | Total reward = 59.67
2022-01-26 14:17:05.909 | DEBUG    | __main__:trials:24 - Trial = 8461/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.911 | DEBUG    | __main__:trials:29 - Trial = 8461/30000 | Total reward = 43.07
2022-01-26 14:17:05.914 | DEBUG    | __main__:trials:24 - Trial = 8462/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.916 | DEBUG    | __main__:trials:29 - Trial = 8462/30000 | Total reward = 38.37
2022-01-26 14:17:05.920 | DEBUG    | __main__:trials:24 - Trial = 8463/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.921 | DEBUG    | __main__:trials:29 - Trial = 8463/30000 | Total reward = 26.53
2022-01-26 14:17:05.924 | DEBUG    | __main__:trials:24 - Trial = 8464/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.926 | DEBUG    | __main__:trials:29 - Trial = 8464/30000 | Total reward = 50.77
2022-01-26 14:17:05.929 | DEBUG    | __main__:trials:24 - Trial = 8465/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.931 | DEBUG    | __main__:trials:29 - Trial = 8465/30000 | Total reward = 59.62
2022-01-26 14:17:05.934 | DEBUG    | __main__:trials:24 - Trial = 8466/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.936 | DEBUG    | __main__:trials:29 - Trial = 8466/30000 | Total reward = 45.83
2022-01-26 14:17:05.940 | DEBUG    | __main__:trials:24 - Trial = 8467/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.941 | DEBUG    | __main__:trials:29 - Trial = 8467/30000 | Total reward = 61.93
2022-01-26 14:17:05.945 | DEBUG    | __main__:trials:24 - Trial = 8468/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.946 | DEBUG    | __main__:trials:29 - Trial = 8468/30000 | Total reward = 46.22
2022-01-26 14:17:05.950 | DEBUG    | __main__:trials:24 - Trial = 8469/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.951 | DEBUG    | __main__:trials:29 - Trial = 8469/30000 | Total reward = 53.12
2022-01-26 14:17:05.954 | DEBUG    | __main__:trials:24 - Trial = 8470/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.956 | DEBUG    | __main__:trials:29 - Trial = 8470/30000 | Total reward = 46.99
2022-01-26 14:17:05.960 | DEBUG    | __main__:trials:24 - Trial = 8471/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.961 | DEBUG    | __main__:trials:29 - Trial = 8471/30000 | Total reward = 47.39
2022-01-26 14:17:05.964 | DEBUG    | __main__:trials:26 - Trial = 8472/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:05.965 | DEBUG    | __main__:trials:29 - Trial = 8472/30000 | Total reward = 9.16
2022-01-26 14:17:05.969 | DEBUG    | __main__:trials:24 - Trial = 8473/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.970 | DEBUG    | __main__:trials:29 - Trial = 8473/30000 | Total reward = 47.21
2022-01-26 14:17:05.973 | DEBUG    | __main__:trials:24 - Trial = 8474/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.974 | DEBUG    | __main__:trials:29 - Trial = 8474/30000 | Total reward = 45.21
2022-01-26 14:17:05.977 | DEBUG    | __main__:trials:24 - Trial = 8475/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.978 | DEBUG    | __main__:trials:29 - Trial = 8475/30000 | Total reward = 47.61
2022-01-26 14:17:05.982 | DEBUG    | __main__:trials:24 - Trial = 8476/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.983 | DEBUG    | __main__:trials:29 - Trial = 8476/30000 | Total reward = 42.63
2022-01-26 14:17:05.987 | DEBUG    | __main__:trials:24 - Trial = 8477/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.989 | DEBUG    | __main__:trials:29 - Trial = 8477/30000 | Total reward = 47.21
2022-01-26 14:17:05.992 | DEBUG    | __main__:trials:24 - Trial = 8478/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.994 | DEBUG    | __main__:trials:29 - Trial = 8478/30000 | Total reward = 44.72
2022-01-26 14:17:05.998 | DEBUG    | __main__:trials:24 - Trial = 8479/30000 | Max number of steps (20) reached
2022-01-26 14:17:05.999 | DEBUG    | __main__:trials:29 - Trial = 8479/30000 | Total reward = 46.37
2022-01-26 14:17:06.003 | DEBUG    | __main__:trials:24 - Trial = 8480/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.004 | DEBUG    | __main__:trials:29 - Trial = 8480/30000 | Total reward = 47.52
2022-01-26 14:17:06.007 | DEBUG    | __main__:trials:24 - Trial = 8481/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.009 | DEBUG    | __main__:trials:29 - Trial = 8481/30000 | Total reward = 40.34
2022-01-26 14:17:06.012 | DEBUG    | __main__:trials:24 - Trial = 8482/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.014 | DEBUG    | __main__:trials:29 - Trial = 8482/30000 | Total reward = 43.57
2022-01-26 14:17:06.018 | DEBUG    | __main__:trials:24 - Trial = 8483/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.019 | DEBUG    | __main__:trials:29 - Trial = 8483/30000 | Total reward = 46.95
2022-01-26 14:17:06.023 | DEBUG    | __main__:trials:24 - Trial = 8484/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.025 | DEBUG    | __main__:trials:29 - Trial = 8484/30000 | Total reward = 49.81
2022-01-26 14:17:06.028 | DEBUG    | __main__:trials:24 - Trial = 8485/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.030 | DEBUG    | __main__:trials:29 - Trial = 8485/30000 | Total reward = 38.42
2022-01-26 14:17:06.034 | DEBUG    | __main__:trials:24 - Trial = 8486/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.035 | DEBUG    | __main__:trials:29 - Trial = 8486/30000 | Total reward = 45.88
2022-01-26 14:17:06.038 | DEBUG    | __main__:trials:24 - Trial = 8487/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.040 | DEBUG    | __main__:trials:29 - Trial = 8487/30000 | Total reward = 55.10
2022-01-26 14:17:06.043 | DEBUG    | __main__:trials:24 - Trial = 8488/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.045 | DEBUG    | __main__:trials:29 - Trial = 8488/30000 | Total reward = 47.76
2022-01-26 14:17:06.048 | DEBUG    | __main__:trials:24 - Trial = 8489/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.050 | DEBUG    | __main__:trials:29 - Trial = 8489/30000 | Total reward = 34.28
2022-01-26 14:17:06.054 | DEBUG    | __main__:trials:24 - Trial = 8490/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.055 | DEBUG    | __main__:trials:29 - Trial = 8490/30000 | Total reward = 40.09
2022-01-26 14:17:06.058 | DEBUG    | __main__:trials:24 - Trial = 8491/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.060 | DEBUG    | __main__:trials:29 - Trial = 8491/30000 | Total reward = 45.17
2022-01-26 14:17:06.063 | DEBUG    | __main__:trials:24 - Trial = 8492/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.065 | DEBUG    | __main__:trials:29 - Trial = 8492/30000 | Total reward = 48.58
2022-01-26 14:17:06.068 | DEBUG    | __main__:trials:24 - Trial = 8493/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.070 | DEBUG    | __main__:trials:29 - Trial = 8493/30000 | Total reward = 45.36
2022-01-26 14:17:06.073 | DEBUG    | __main__:trials:24 - Trial = 8494/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.074 | DEBUG    | __main__:trials:29 - Trial = 8494/30000 | Total reward = 45.03
2022-01-26 14:17:06.078 | DEBUG    | __main__:trials:24 - Trial = 8495/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.079 | DEBUG    | __main__:trials:29 - Trial = 8495/30000 | Total reward = 52.07
2022-01-26 14:17:06.083 | DEBUG    | __main__:trials:24 - Trial = 8496/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.084 | DEBUG    | __main__:trials:29 - Trial = 8496/30000 | Total reward = 47.09
2022-01-26 14:17:06.088 | DEBUG    | __main__:trials:24 - Trial = 8497/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.090 | DEBUG    | __main__:trials:29 - Trial = 8497/30000 | Total reward = 44.55
2022-01-26 14:17:06.094 | DEBUG    | __main__:trials:24 - Trial = 8498/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.095 | DEBUG    | __main__:trials:29 - Trial = 8498/30000 | Total reward = 47.97
2022-01-26 14:17:06.098 | DEBUG    | __main__:trials:24 - Trial = 8499/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.100 | DEBUG    | __main__:trials:29 - Trial = 8499/30000 | Total reward = 67.17
2022-01-26 14:17:06.103 | DEBUG    | __main__:trials:24 - Trial = 8500/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.105 | DEBUG    | __main__:trials:29 - Trial = 8500/30000 | Total reward = 43.15
2022-01-26 14:17:06.109 | DEBUG    | __main__:trials:24 - Trial = 8501/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.111 | DEBUG    | __main__:trials:29 - Trial = 8501/30000 | Total reward = 48.77
2022-01-26 14:17:06.114 | DEBUG    | __main__:trials:24 - Trial = 8502/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.116 | DEBUG    | __main__:trials:29 - Trial = 8502/30000 | Total reward = 35.64
2022-01-26 14:17:06.119 | DEBUG    | __main__:trials:24 - Trial = 8503/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.121 | DEBUG    | __main__:trials:29 - Trial = 8503/30000 | Total reward = 32.14
2022-01-26 14:17:06.124 | DEBUG    | __main__:trials:24 - Trial = 8504/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.126 | DEBUG    | __main__:trials:29 - Trial = 8504/30000 | Total reward = 53.88
2022-01-26 14:17:06.129 | DEBUG    | __main__:trials:24 - Trial = 8505/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.130 | DEBUG    | __main__:trials:29 - Trial = 8505/30000 | Total reward = 37.48
2022-01-26 14:17:06.134 | DEBUG    | __main__:trials:24 - Trial = 8506/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.135 | DEBUG    | __main__:trials:29 - Trial = 8506/30000 | Total reward = 52.47
2022-01-26 14:17:06.138 | DEBUG    | __main__:trials:24 - Trial = 8507/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.139 | DEBUG    | __main__:trials:29 - Trial = 8507/30000 | Total reward = 49.67
2022-01-26 14:17:06.142 | DEBUG    | __main__:trials:24 - Trial = 8508/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.144 | DEBUG    | __main__:trials:29 - Trial = 8508/30000 | Total reward = 42.17
2022-01-26 14:17:06.147 | DEBUG    | __main__:trials:24 - Trial = 8509/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.149 | DEBUG    | __main__:trials:29 - Trial = 8509/30000 | Total reward = 37.94
2022-01-26 14:17:06.152 | DEBUG    | __main__:trials:24 - Trial = 8510/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.154 | DEBUG    | __main__:trials:29 - Trial = 8510/30000 | Total reward = 49.99
2022-01-26 14:17:06.157 | DEBUG    | __main__:trials:24 - Trial = 8511/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.159 | DEBUG    | __main__:trials:29 - Trial = 8511/30000 | Total reward = 67.34
2022-01-26 14:17:06.163 | DEBUG    | __main__:trials:24 - Trial = 8512/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.164 | DEBUG    | __main__:trials:29 - Trial = 8512/30000 | Total reward = 47.39
2022-01-26 14:17:06.168 | DEBUG    | __main__:trials:24 - Trial = 8513/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.169 | DEBUG    | __main__:trials:29 - Trial = 8513/30000 | Total reward = 44.21
2022-01-26 14:17:06.173 | DEBUG    | __main__:trials:24 - Trial = 8514/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.175 | DEBUG    | __main__:trials:29 - Trial = 8514/30000 | Total reward = 47.21
2022-01-26 14:17:06.178 | DEBUG    | __main__:trials:24 - Trial = 8515/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.180 | DEBUG    | __main__:trials:29 - Trial = 8515/30000 | Total reward = 48.55
2022-01-26 14:17:06.183 | DEBUG    | __main__:trials:24 - Trial = 8516/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.185 | DEBUG    | __main__:trials:29 - Trial = 8516/30000 | Total reward = 51.49
2022-01-26 14:17:06.187 | DEBUG    | __main__:trials:24 - Trial = 8517/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.189 | DEBUG    | __main__:trials:29 - Trial = 8517/30000 | Total reward = 48.68
2022-01-26 14:17:06.192 | DEBUG    | __main__:trials:24 - Trial = 8518/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.194 | DEBUG    | __main__:trials:29 - Trial = 8518/30000 | Total reward = 43.87
2022-01-26 14:17:06.198 | DEBUG    | __main__:trials:24 - Trial = 8519/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.199 | DEBUG    | __main__:trials:29 - Trial = 8519/30000 | Total reward = 47.71
2022-01-26 14:17:06.203 | DEBUG    | __main__:trials:24 - Trial = 8520/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.205 | DEBUG    | __main__:trials:29 - Trial = 8520/30000 | Total reward = 64.37
2022-01-26 14:17:06.208 | DEBUG    | __main__:trials:24 - Trial = 8521/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.210 | DEBUG    | __main__:trials:29 - Trial = 8521/30000 | Total reward = 54.44
2022-01-26 14:17:06.213 | DEBUG    | __main__:trials:24 - Trial = 8522/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.214 | DEBUG    | __main__:trials:29 - Trial = 8522/30000 | Total reward = 49.20
2022-01-26 14:17:06.218 | DEBUG    | __main__:trials:24 - Trial = 8523/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.219 | DEBUG    | __main__:trials:29 - Trial = 8523/30000 | Total reward = 32.39
2022-01-26 14:17:06.223 | DEBUG    | __main__:trials:24 - Trial = 8524/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.224 | DEBUG    | __main__:trials:29 - Trial = 8524/30000 | Total reward = 35.52
2022-01-26 14:17:06.228 | DEBUG    | __main__:trials:24 - Trial = 8525/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.229 | DEBUG    | __main__:trials:29 - Trial = 8525/30000 | Total reward = 44.04
2022-01-26 14:17:06.232 | DEBUG    | __main__:trials:24 - Trial = 8526/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.234 | DEBUG    | __main__:trials:29 - Trial = 8526/30000 | Total reward = 55.68
2022-01-26 14:17:06.238 | DEBUG    | __main__:trials:24 - Trial = 8527/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.239 | DEBUG    | __main__:trials:29 - Trial = 8527/30000 | Total reward = 43.40
2022-01-26 14:17:06.243 | DEBUG    | __main__:trials:24 - Trial = 8528/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.244 | DEBUG    | __main__:trials:29 - Trial = 8528/30000 | Total reward = 40.60
2022-01-26 14:17:06.248 | DEBUG    | __main__:trials:24 - Trial = 8529/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.250 | DEBUG    | __main__:trials:29 - Trial = 8529/30000 | Total reward = 33.36
2022-01-26 14:17:06.253 | DEBUG    | __main__:trials:24 - Trial = 8530/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.255 | DEBUG    | __main__:trials:29 - Trial = 8530/30000 | Total reward = 43.68
2022-01-26 14:17:06.258 | DEBUG    | __main__:trials:24 - Trial = 8531/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.260 | DEBUG    | __main__:trials:29 - Trial = 8531/30000 | Total reward = 42.98
2022-01-26 14:17:06.264 | DEBUG    | __main__:trials:24 - Trial = 8532/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.265 | DEBUG    | __main__:trials:29 - Trial = 8532/30000 | Total reward = 33.19
2022-01-26 14:17:06.268 | DEBUG    | __main__:trials:26 - Trial = 8533/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:06.268 | DEBUG    | __main__:trials:29 - Trial = 8533/30000 | Total reward = 12.57
2022-01-26 14:17:06.272 | DEBUG    | __main__:trials:24 - Trial = 8534/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.273 | DEBUG    | __main__:trials:29 - Trial = 8534/30000 | Total reward = 59.78
2022-01-26 14:17:06.276 | DEBUG    | __main__:trials:24 - Trial = 8535/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.277 | DEBUG    | __main__:trials:29 - Trial = 8535/30000 | Total reward = 24.87
2022-01-26 14:17:06.281 | DEBUG    | __main__:trials:24 - Trial = 8536/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.282 | DEBUG    | __main__:trials:29 - Trial = 8536/30000 | Total reward = 33.06
2022-01-26 14:17:06.286 | DEBUG    | __main__:trials:24 - Trial = 8537/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.288 | DEBUG    | __main__:trials:29 - Trial = 8537/30000 | Total reward = 36.36
2022-01-26 14:17:06.291 | DEBUG    | __main__:trials:24 - Trial = 8538/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.293 | DEBUG    | __main__:trials:29 - Trial = 8538/30000 | Total reward = 34.64
2022-01-26 14:17:06.296 | DEBUG    | __main__:trials:24 - Trial = 8539/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.297 | DEBUG    | __main__:trials:29 - Trial = 8539/30000 | Total reward = 51.65
2022-01-26 14:17:06.301 | DEBUG    | __main__:trials:24 - Trial = 8540/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.302 | DEBUG    | __main__:trials:29 - Trial = 8540/30000 | Total reward = 28.10
2022-01-26 14:17:06.306 | DEBUG    | __main__:trials:24 - Trial = 8541/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.307 | DEBUG    | __main__:trials:29 - Trial = 8541/30000 | Total reward = 46.30
2022-01-26 14:17:06.311 | DEBUG    | __main__:trials:24 - Trial = 8542/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.312 | DEBUG    | __main__:trials:29 - Trial = 8542/30000 | Total reward = 33.32
2022-01-26 14:17:06.316 | DEBUG    | __main__:trials:24 - Trial = 8543/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.318 | DEBUG    | __main__:trials:29 - Trial = 8543/30000 | Total reward = 30.60
2022-01-26 14:17:06.321 | DEBUG    | __main__:trials:24 - Trial = 8544/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.323 | DEBUG    | __main__:trials:29 - Trial = 8544/30000 | Total reward = 23.85
2022-01-26 14:17:06.327 | DEBUG    | __main__:trials:24 - Trial = 8545/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.328 | DEBUG    | __main__:trials:29 - Trial = 8545/30000 | Total reward = 29.69
2022-01-26 14:17:06.332 | DEBUG    | __main__:trials:24 - Trial = 8546/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.334 | DEBUG    | __main__:trials:29 - Trial = 8546/30000 | Total reward = 23.94
2022-01-26 14:17:06.338 | DEBUG    | __main__:trials:24 - Trial = 8547/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.339 | DEBUG    | __main__:trials:29 - Trial = 8547/30000 | Total reward = 57.63
2022-01-26 14:17:06.342 | DEBUG    | __main__:trials:24 - Trial = 8548/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.344 | DEBUG    | __main__:trials:29 - Trial = 8548/30000 | Total reward = 43.01
2022-01-26 14:17:06.348 | DEBUG    | __main__:trials:26 - Trial = 8549/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:06.349 | DEBUG    | __main__:trials:29 - Trial = 8549/30000 | Total reward = 34.35
2022-01-26 14:17:06.353 | DEBUG    | __main__:trials:24 - Trial = 8550/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.354 | DEBUG    | __main__:trials:29 - Trial = 8550/30000 | Total reward = 64.48
2022-01-26 14:17:06.357 | DEBUG    | __main__:trials:24 - Trial = 8551/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.358 | DEBUG    | __main__:trials:29 - Trial = 8551/30000 | Total reward = 52.48
2022-01-26 14:17:06.361 | DEBUG    | __main__:trials:24 - Trial = 8552/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.362 | DEBUG    | __main__:trials:29 - Trial = 8552/30000 | Total reward = 42.03
2022-01-26 14:17:06.365 | DEBUG    | __main__:trials:24 - Trial = 8553/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.367 | DEBUG    | __main__:trials:29 - Trial = 8553/30000 | Total reward = 26.99
2022-01-26 14:17:06.370 | DEBUG    | __main__:trials:24 - Trial = 8554/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.372 | DEBUG    | __main__:trials:29 - Trial = 8554/30000 | Total reward = 31.91
2022-01-26 14:17:06.376 | DEBUG    | __main__:trials:24 - Trial = 8555/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.377 | DEBUG    | __main__:trials:29 - Trial = 8555/30000 | Total reward = 29.47
2022-01-26 14:17:06.381 | DEBUG    | __main__:trials:24 - Trial = 8556/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.382 | DEBUG    | __main__:trials:29 - Trial = 8556/30000 | Total reward = 32.07
2022-01-26 14:17:06.386 | DEBUG    | __main__:trials:24 - Trial = 8557/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.387 | DEBUG    | __main__:trials:29 - Trial = 8557/30000 | Total reward = 39.40
2022-01-26 14:17:06.391 | DEBUG    | __main__:trials:24 - Trial = 8558/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.393 | DEBUG    | __main__:trials:29 - Trial = 8558/30000 | Total reward = 30.08
2022-01-26 14:17:06.396 | DEBUG    | __main__:trials:24 - Trial = 8559/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.398 | DEBUG    | __main__:trials:29 - Trial = 8559/30000 | Total reward = 55.16
2022-01-26 14:17:06.401 | DEBUG    | __main__:trials:26 - Trial = 8560/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:06.402 | DEBUG    | __main__:trials:29 - Trial = 8560/30000 | Total reward = 16.31
2022-01-26 14:17:06.406 | DEBUG    | __main__:trials:24 - Trial = 8561/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.408 | DEBUG    | __main__:trials:29 - Trial = 8561/30000 | Total reward = 32.04
2022-01-26 14:17:06.410 | DEBUG    | __main__:trials:24 - Trial = 8562/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.412 | DEBUG    | __main__:trials:29 - Trial = 8562/30000 | Total reward = 60.84
2022-01-26 14:17:06.416 | DEBUG    | __main__:trials:24 - Trial = 8563/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.418 | DEBUG    | __main__:trials:29 - Trial = 8563/30000 | Total reward = 23.91
2022-01-26 14:17:06.421 | DEBUG    | __main__:trials:24 - Trial = 8564/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.423 | DEBUG    | __main__:trials:29 - Trial = 8564/30000 | Total reward = 36.06
2022-01-26 14:17:06.426 | DEBUG    | __main__:trials:24 - Trial = 8565/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.428 | DEBUG    | __main__:trials:29 - Trial = 8565/30000 | Total reward = 49.81
2022-01-26 14:17:06.431 | DEBUG    | __main__:trials:24 - Trial = 8566/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.433 | DEBUG    | __main__:trials:29 - Trial = 8566/30000 | Total reward = 35.36
2022-01-26 14:17:06.436 | DEBUG    | __main__:trials:24 - Trial = 8567/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.438 | DEBUG    | __main__:trials:29 - Trial = 8567/30000 | Total reward = 36.84
2022-01-26 14:17:06.443 | DEBUG    | __main__:trials:24 - Trial = 8568/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.444 | DEBUG    | __main__:trials:29 - Trial = 8568/30000 | Total reward = 28.80
2022-01-26 14:17:06.448 | DEBUG    | __main__:trials:24 - Trial = 8569/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.449 | DEBUG    | __main__:trials:29 - Trial = 8569/30000 | Total reward = 41.94
2022-01-26 14:17:06.453 | DEBUG    | __main__:trials:24 - Trial = 8570/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.453 | DEBUG    | __main__:trials:29 - Trial = 8570/30000 | Total reward = 32.93
2022-01-26 14:17:06.457 | DEBUG    | __main__:trials:24 - Trial = 8571/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.459 | DEBUG    | __main__:trials:29 - Trial = 8571/30000 | Total reward = 24.05
2022-01-26 14:17:06.463 | DEBUG    | __main__:trials:24 - Trial = 8572/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.464 | DEBUG    | __main__:trials:29 - Trial = 8572/30000 | Total reward = 43.45
2022-01-26 14:17:06.467 | DEBUG    | __main__:trials:24 - Trial = 8573/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.469 | DEBUG    | __main__:trials:29 - Trial = 8573/30000 | Total reward = 38.18
2022-01-26 14:17:06.472 | DEBUG    | __main__:trials:26 - Trial = 8574/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:06.473 | DEBUG    | __main__:trials:29 - Trial = 8574/30000 | Total reward = 17.72
2022-01-26 14:17:06.477 | DEBUG    | __main__:trials:24 - Trial = 8575/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.477 | DEBUG    | __main__:trials:29 - Trial = 8575/30000 | Total reward = 56.72
2022-01-26 14:17:06.481 | DEBUG    | __main__:trials:24 - Trial = 8576/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.483 | DEBUG    | __main__:trials:29 - Trial = 8576/30000 | Total reward = 45.85
2022-01-26 14:17:06.486 | DEBUG    | __main__:trials:24 - Trial = 8577/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.488 | DEBUG    | __main__:trials:29 - Trial = 8577/30000 | Total reward = 47.94
2022-01-26 14:17:06.492 | DEBUG    | __main__:trials:24 - Trial = 8578/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.493 | DEBUG    | __main__:trials:29 - Trial = 8578/30000 | Total reward = 44.86
2022-01-26 14:17:06.497 | DEBUG    | __main__:trials:24 - Trial = 8579/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.498 | DEBUG    | __main__:trials:29 - Trial = 8579/30000 | Total reward = 47.81
2022-01-26 14:17:06.502 | DEBUG    | __main__:trials:24 - Trial = 8580/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.503 | DEBUG    | __main__:trials:29 - Trial = 8580/30000 | Total reward = 63.63
2022-01-26 14:17:06.507 | DEBUG    | __main__:trials:24 - Trial = 8581/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.509 | DEBUG    | __main__:trials:29 - Trial = 8581/30000 | Total reward = 54.05
2022-01-26 14:17:06.512 | DEBUG    | __main__:trials:24 - Trial = 8582/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.514 | DEBUG    | __main__:trials:29 - Trial = 8582/30000 | Total reward = 52.57
2022-01-26 14:17:06.518 | DEBUG    | __main__:trials:24 - Trial = 8583/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.519 | DEBUG    | __main__:trials:29 - Trial = 8583/30000 | Total reward = 62.55
2022-01-26 14:17:06.522 | DEBUG    | __main__:trials:24 - Trial = 8584/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.524 | DEBUG    | __main__:trials:29 - Trial = 8584/30000 | Total reward = 48.99
2022-01-26 14:17:06.527 | DEBUG    | __main__:trials:24 - Trial = 8585/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.529 | DEBUG    | __main__:trials:29 - Trial = 8585/30000 | Total reward = 52.30
2022-01-26 14:17:06.532 | DEBUG    | __main__:trials:24 - Trial = 8586/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.534 | DEBUG    | __main__:trials:29 - Trial = 8586/30000 | Total reward = 43.21
2022-01-26 14:17:06.537 | DEBUG    | __main__:trials:24 - Trial = 8587/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.538 | DEBUG    | __main__:trials:29 - Trial = 8587/30000 | Total reward = 49.74
2022-01-26 14:17:06.541 | DEBUG    | __main__:trials:26 - Trial = 8588/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:06.542 | DEBUG    | __main__:trials:29 - Trial = 8588/30000 | Total reward = 10.39
2022-01-26 14:17:06.546 | DEBUG    | __main__:trials:24 - Trial = 8589/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.547 | DEBUG    | __main__:trials:29 - Trial = 8589/30000 | Total reward = 34.54
2022-01-26 14:17:06.551 | DEBUG    | __main__:trials:24 - Trial = 8590/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.552 | DEBUG    | __main__:trials:29 - Trial = 8590/30000 | Total reward = 41.97
2022-01-26 14:17:06.556 | DEBUG    | __main__:trials:24 - Trial = 8591/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.558 | DEBUG    | __main__:trials:29 - Trial = 8591/30000 | Total reward = 39.44
2022-01-26 14:17:06.561 | DEBUG    | __main__:trials:24 - Trial = 8592/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.563 | DEBUG    | __main__:trials:29 - Trial = 8592/30000 | Total reward = 49.44
2022-01-26 14:17:06.567 | DEBUG    | __main__:trials:24 - Trial = 8593/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.568 | DEBUG    | __main__:trials:29 - Trial = 8593/30000 | Total reward = 36.01
2022-01-26 14:17:06.572 | DEBUG    | __main__:trials:24 - Trial = 8594/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.574 | DEBUG    | __main__:trials:29 - Trial = 8594/30000 | Total reward = 48.72
2022-01-26 14:17:06.578 | DEBUG    | __main__:trials:24 - Trial = 8595/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.578 | DEBUG    | __main__:trials:29 - Trial = 8595/30000 | Total reward = 25.59
2022-01-26 14:17:06.582 | DEBUG    | __main__:trials:24 - Trial = 8596/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.584 | DEBUG    | __main__:trials:29 - Trial = 8596/30000 | Total reward = 36.78
2022-01-26 14:17:06.587 | DEBUG    | __main__:trials:24 - Trial = 8597/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.589 | DEBUG    | __main__:trials:29 - Trial = 8597/30000 | Total reward = 45.77
2022-01-26 14:17:06.592 | DEBUG    | __main__:trials:24 - Trial = 8598/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.594 | DEBUG    | __main__:trials:29 - Trial = 8598/30000 | Total reward = 44.90
2022-01-26 14:17:06.597 | DEBUG    | __main__:trials:24 - Trial = 8599/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.599 | DEBUG    | __main__:trials:29 - Trial = 8599/30000 | Total reward = 63.13
2022-01-26 14:17:06.602 | DEBUG    | __main__:trials:24 - Trial = 8600/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.604 | DEBUG    | __main__:trials:29 - Trial = 8600/30000 | Total reward = 46.57
2022-01-26 14:17:06.607 | DEBUG    | __main__:trials:24 - Trial = 8601/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.609 | DEBUG    | __main__:trials:29 - Trial = 8601/30000 | Total reward = 46.99
2022-01-26 14:17:06.612 | DEBUG    | __main__:trials:24 - Trial = 8602/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.613 | DEBUG    | __main__:trials:29 - Trial = 8602/30000 | Total reward = 47.37
2022-01-26 14:17:06.617 | DEBUG    | __main__:trials:24 - Trial = 8603/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.618 | DEBUG    | __main__:trials:29 - Trial = 8603/30000 | Total reward = 43.73
2022-01-26 14:17:06.621 | DEBUG    | __main__:trials:24 - Trial = 8604/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.622 | DEBUG    | __main__:trials:29 - Trial = 8604/30000 | Total reward = 45.68
2022-01-26 14:17:06.626 | DEBUG    | __main__:trials:24 - Trial = 8605/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.627 | DEBUG    | __main__:trials:29 - Trial = 8605/30000 | Total reward = 47.21
2022-01-26 14:17:06.631 | DEBUG    | __main__:trials:24 - Trial = 8606/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.632 | DEBUG    | __main__:trials:29 - Trial = 8606/30000 | Total reward = 38.80
2022-01-26 14:17:06.635 | DEBUG    | __main__:trials:24 - Trial = 8607/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.637 | DEBUG    | __main__:trials:29 - Trial = 8607/30000 | Total reward = 43.50
2022-01-26 14:17:06.640 | DEBUG    | __main__:trials:24 - Trial = 8608/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.642 | DEBUG    | __main__:trials:29 - Trial = 8608/30000 | Total reward = 45.45
2022-01-26 14:17:06.646 | DEBUG    | __main__:trials:24 - Trial = 8609/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.648 | DEBUG    | __main__:trials:29 - Trial = 8609/30000 | Total reward = 51.29
2022-01-26 14:17:06.651 | DEBUG    | __main__:trials:24 - Trial = 8610/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.653 | DEBUG    | __main__:trials:29 - Trial = 8610/30000 | Total reward = 45.98
2022-01-26 14:17:06.656 | DEBUG    | __main__:trials:24 - Trial = 8611/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.658 | DEBUG    | __main__:trials:29 - Trial = 8611/30000 | Total reward = 46.30
2022-01-26 14:17:06.661 | DEBUG    | __main__:trials:24 - Trial = 8612/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.663 | DEBUG    | __main__:trials:29 - Trial = 8612/30000 | Total reward = 49.67
2022-01-26 14:17:06.666 | DEBUG    | __main__:trials:24 - Trial = 8613/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.668 | DEBUG    | __main__:trials:29 - Trial = 8613/30000 | Total reward = 29.44
2022-01-26 14:17:06.671 | DEBUG    | __main__:trials:24 - Trial = 8614/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.673 | DEBUG    | __main__:trials:29 - Trial = 8614/30000 | Total reward = 42.48
2022-01-26 14:17:06.676 | DEBUG    | __main__:trials:24 - Trial = 8615/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.678 | DEBUG    | __main__:trials:29 - Trial = 8615/30000 | Total reward = 45.38
2022-01-26 14:17:06.682 | DEBUG    | __main__:trials:24 - Trial = 8616/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.683 | DEBUG    | __main__:trials:29 - Trial = 8616/30000 | Total reward = 48.58
2022-01-26 14:17:06.687 | DEBUG    | __main__:trials:24 - Trial = 8617/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.688 | DEBUG    | __main__:trials:29 - Trial = 8617/30000 | Total reward = 62.78
2022-01-26 14:17:06.691 | DEBUG    | __main__:trials:24 - Trial = 8618/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.694 | DEBUG    | __main__:trials:29 - Trial = 8618/30000 | Total reward = 41.17
2022-01-26 14:17:06.697 | DEBUG    | __main__:trials:24 - Trial = 8619/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.699 | DEBUG    | __main__:trials:29 - Trial = 8619/30000 | Total reward = 45.72
2022-01-26 14:17:06.702 | DEBUG    | __main__:trials:24 - Trial = 8620/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.703 | DEBUG    | __main__:trials:29 - Trial = 8620/30000 | Total reward = 57.73
2022-01-26 14:17:06.707 | DEBUG    | __main__:trials:24 - Trial = 8621/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.709 | DEBUG    | __main__:trials:29 - Trial = 8621/30000 | Total reward = 58.36
2022-01-26 14:17:06.712 | DEBUG    | __main__:trials:24 - Trial = 8622/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.713 | DEBUG    | __main__:trials:29 - Trial = 8622/30000 | Total reward = 44.40
2022-01-26 14:17:06.716 | DEBUG    | __main__:trials:24 - Trial = 8623/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.717 | DEBUG    | __main__:trials:29 - Trial = 8623/30000 | Total reward = 51.65
2022-01-26 14:17:06.721 | DEBUG    | __main__:trials:24 - Trial = 8624/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.721 | DEBUG    | __main__:trials:29 - Trial = 8624/30000 | Total reward = 65.71
2022-01-26 14:17:06.726 | DEBUG    | __main__:trials:24 - Trial = 8625/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.728 | DEBUG    | __main__:trials:29 - Trial = 8625/30000 | Total reward = 45.99
2022-01-26 14:17:06.732 | DEBUG    | __main__:trials:24 - Trial = 8626/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.733 | DEBUG    | __main__:trials:29 - Trial = 8626/30000 | Total reward = 42.93
2022-01-26 14:17:06.737 | DEBUG    | __main__:trials:24 - Trial = 8627/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.738 | DEBUG    | __main__:trials:29 - Trial = 8627/30000 | Total reward = 46.41
2022-01-26 14:17:06.742 | DEBUG    | __main__:trials:24 - Trial = 8628/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.743 | DEBUG    | __main__:trials:29 - Trial = 8628/30000 | Total reward = 46.91
2022-01-26 14:17:06.746 | DEBUG    | __main__:trials:24 - Trial = 8629/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.747 | DEBUG    | __main__:trials:29 - Trial = 8629/30000 | Total reward = 45.63
2022-01-26 14:17:06.751 | DEBUG    | __main__:trials:24 - Trial = 8630/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.752 | DEBUG    | __main__:trials:29 - Trial = 8630/30000 | Total reward = 46.31
2022-01-26 14:17:06.756 | DEBUG    | __main__:trials:24 - Trial = 8631/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.757 | DEBUG    | __main__:trials:29 - Trial = 8631/30000 | Total reward = 56.99
2022-01-26 14:17:06.760 | DEBUG    | __main__:trials:24 - Trial = 8632/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.762 | DEBUG    | __main__:trials:29 - Trial = 8632/30000 | Total reward = 51.24
2022-01-26 14:17:06.766 | DEBUG    | __main__:trials:24 - Trial = 8633/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.767 | DEBUG    | __main__:trials:29 - Trial = 8633/30000 | Total reward = 38.03
2022-01-26 14:17:06.771 | DEBUG    | __main__:trials:24 - Trial = 8634/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.773 | DEBUG    | __main__:trials:29 - Trial = 8634/30000 | Total reward = 51.55
2022-01-26 14:17:06.777 | DEBUG    | __main__:trials:24 - Trial = 8635/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.778 | DEBUG    | __main__:trials:29 - Trial = 8635/30000 | Total reward = 49.32
2022-01-26 14:17:06.782 | DEBUG    | __main__:trials:24 - Trial = 8636/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.783 | DEBUG    | __main__:trials:29 - Trial = 8636/30000 | Total reward = 30.16
2022-01-26 14:17:06.787 | DEBUG    | __main__:trials:24 - Trial = 8637/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.789 | DEBUG    | __main__:trials:29 - Trial = 8637/30000 | Total reward = 50.91
2022-01-26 14:17:06.792 | DEBUG    | __main__:trials:24 - Trial = 8638/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.794 | DEBUG    | __main__:trials:29 - Trial = 8638/30000 | Total reward = 22.77
2022-01-26 14:17:06.797 | DEBUG    | __main__:trials:24 - Trial = 8639/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.799 | DEBUG    | __main__:trials:29 - Trial = 8639/30000 | Total reward = 49.06
2022-01-26 14:17:06.802 | DEBUG    | __main__:trials:24 - Trial = 8640/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.803 | DEBUG    | __main__:trials:29 - Trial = 8640/30000 | Total reward = 36.01
2022-01-26 14:17:06.807 | DEBUG    | __main__:trials:24 - Trial = 8641/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.809 | DEBUG    | __main__:trials:29 - Trial = 8641/30000 | Total reward = 45.15
2022-01-26 14:17:06.812 | DEBUG    | __main__:trials:24 - Trial = 8642/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.814 | DEBUG    | __main__:trials:29 - Trial = 8642/30000 | Total reward = 35.82
2022-01-26 14:17:06.817 | DEBUG    | __main__:trials:24 - Trial = 8643/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.818 | DEBUG    | __main__:trials:29 - Trial = 8643/30000 | Total reward = 36.12
2022-01-26 14:17:06.821 | DEBUG    | __main__:trials:24 - Trial = 8644/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.822 | DEBUG    | __main__:trials:29 - Trial = 8644/30000 | Total reward = 51.23
2022-01-26 14:17:06.825 | DEBUG    | __main__:trials:24 - Trial = 8645/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.827 | DEBUG    | __main__:trials:29 - Trial = 8645/30000 | Total reward = 33.40
2022-01-26 14:17:06.830 | DEBUG    | __main__:trials:24 - Trial = 8646/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.831 | DEBUG    | __main__:trials:29 - Trial = 8646/30000 | Total reward = 40.79
2022-01-26 14:17:06.834 | DEBUG    | __main__:trials:24 - Trial = 8647/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.836 | DEBUG    | __main__:trials:29 - Trial = 8647/30000 | Total reward = 32.97
2022-01-26 14:17:06.839 | DEBUG    | __main__:trials:24 - Trial = 8648/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.841 | DEBUG    | __main__:trials:29 - Trial = 8648/30000 | Total reward = 38.86
2022-01-26 14:17:06.845 | DEBUG    | __main__:trials:24 - Trial = 8649/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.846 | DEBUG    | __main__:trials:29 - Trial = 8649/30000 | Total reward = 33.00
2022-01-26 14:17:06.851 | DEBUG    | __main__:trials:24 - Trial = 8650/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.852 | DEBUG    | __main__:trials:29 - Trial = 8650/30000 | Total reward = 26.83
2022-01-26 14:17:06.856 | DEBUG    | __main__:trials:24 - Trial = 8651/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.858 | DEBUG    | __main__:trials:29 - Trial = 8651/30000 | Total reward = 22.56
2022-01-26 14:17:06.861 | DEBUG    | __main__:trials:24 - Trial = 8652/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.863 | DEBUG    | __main__:trials:29 - Trial = 8652/30000 | Total reward = 36.01
2022-01-26 14:17:06.867 | DEBUG    | __main__:trials:24 - Trial = 8653/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.868 | DEBUG    | __main__:trials:29 - Trial = 8653/30000 | Total reward = 31.28
2022-01-26 14:17:06.872 | DEBUG    | __main__:trials:24 - Trial = 8654/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.874 | DEBUG    | __main__:trials:29 - Trial = 8654/30000 | Total reward = 45.08
2022-01-26 14:17:06.876 | DEBUG    | __main__:trials:24 - Trial = 8655/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.878 | DEBUG    | __main__:trials:29 - Trial = 8655/30000 | Total reward = 38.25
2022-01-26 14:17:06.882 | DEBUG    | __main__:trials:24 - Trial = 8656/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.883 | DEBUG    | __main__:trials:29 - Trial = 8656/30000 | Total reward = 45.19
2022-01-26 14:17:06.886 | DEBUG    | __main__:trials:24 - Trial = 8657/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.887 | DEBUG    | __main__:trials:29 - Trial = 8657/30000 | Total reward = 22.24
2022-01-26 14:17:06.891 | DEBUG    | __main__:trials:24 - Trial = 8658/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.892 | DEBUG    | __main__:trials:29 - Trial = 8658/30000 | Total reward = 46.85
2022-01-26 14:17:06.896 | DEBUG    | __main__:trials:24 - Trial = 8659/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.898 | DEBUG    | __main__:trials:29 - Trial = 8659/30000 | Total reward = 18.01
2022-01-26 14:17:06.901 | DEBUG    | __main__:trials:24 - Trial = 8660/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.903 | DEBUG    | __main__:trials:29 - Trial = 8660/30000 | Total reward = 31.15
2022-01-26 14:17:06.906 | DEBUG    | __main__:trials:24 - Trial = 8661/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.908 | DEBUG    | __main__:trials:29 - Trial = 8661/30000 | Total reward = 33.76
2022-01-26 14:17:06.912 | DEBUG    | __main__:trials:24 - Trial = 8662/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.913 | DEBUG    | __main__:trials:29 - Trial = 8662/30000 | Total reward = 27.87
2022-01-26 14:17:06.916 | DEBUG    | __main__:trials:24 - Trial = 8663/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.918 | DEBUG    | __main__:trials:29 - Trial = 8663/30000 | Total reward = 41.82
2022-01-26 14:17:06.922 | DEBUG    | __main__:trials:24 - Trial = 8664/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.923 | DEBUG    | __main__:trials:29 - Trial = 8664/30000 | Total reward = 39.66
2022-01-26 14:17:06.927 | DEBUG    | __main__:trials:24 - Trial = 8665/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.928 | DEBUG    | __main__:trials:29 - Trial = 8665/30000 | Total reward = 31.83
2022-01-26 14:17:06.932 | DEBUG    | __main__:trials:24 - Trial = 8666/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.933 | DEBUG    | __main__:trials:29 - Trial = 8666/30000 | Total reward = 41.38
2022-01-26 14:17:06.937 | DEBUG    | __main__:trials:24 - Trial = 8667/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.938 | DEBUG    | __main__:trials:29 - Trial = 8667/30000 | Total reward = 33.36
2022-01-26 14:17:06.942 | DEBUG    | __main__:trials:24 - Trial = 8668/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.943 | DEBUG    | __main__:trials:29 - Trial = 8668/30000 | Total reward = 50.97
2022-01-26 14:17:06.947 | DEBUG    | __main__:trials:24 - Trial = 8669/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.948 | DEBUG    | __main__:trials:29 - Trial = 8669/30000 | Total reward = 39.90
2022-01-26 14:17:06.952 | DEBUG    | __main__:trials:24 - Trial = 8670/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.953 | DEBUG    | __main__:trials:29 - Trial = 8670/30000 | Total reward = 52.05
2022-01-26 14:17:06.957 | DEBUG    | __main__:trials:24 - Trial = 8671/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.959 | DEBUG    | __main__:trials:29 - Trial = 8671/30000 | Total reward = 62.16
2022-01-26 14:17:06.962 | DEBUG    | __main__:trials:24 - Trial = 8672/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.964 | DEBUG    | __main__:trials:29 - Trial = 8672/30000 | Total reward = 32.09
2022-01-26 14:17:06.967 | DEBUG    | __main__:trials:24 - Trial = 8673/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.969 | DEBUG    | __main__:trials:29 - Trial = 8673/30000 | Total reward = 44.18
2022-01-26 14:17:06.972 | DEBUG    | __main__:trials:24 - Trial = 8674/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.974 | DEBUG    | __main__:trials:29 - Trial = 8674/30000 | Total reward = 33.36
2022-01-26 14:17:06.978 | DEBUG    | __main__:trials:24 - Trial = 8675/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.980 | DEBUG    | __main__:trials:29 - Trial = 8675/30000 | Total reward = 30.21
2022-01-26 14:17:06.983 | DEBUG    | __main__:trials:24 - Trial = 8676/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.985 | DEBUG    | __main__:trials:29 - Trial = 8676/30000 | Total reward = 51.75
2022-01-26 14:17:06.989 | DEBUG    | __main__:trials:24 - Trial = 8677/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.990 | DEBUG    | __main__:trials:29 - Trial = 8677/30000 | Total reward = 33.36
2022-01-26 14:17:06.994 | DEBUG    | __main__:trials:24 - Trial = 8678/30000 | Max number of steps (20) reached
2022-01-26 14:17:06.995 | DEBUG    | __main__:trials:29 - Trial = 8678/30000 | Total reward = 42.77
2022-01-26 14:17:06.999 | DEBUG    | __main__:trials:24 - Trial = 8679/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.001 | DEBUG    | __main__:trials:29 - Trial = 8679/30000 | Total reward = 17.19
2022-01-26 14:17:07.004 | DEBUG    | __main__:trials:24 - Trial = 8680/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.006 | DEBUG    | __main__:trials:29 - Trial = 8680/30000 | Total reward = 45.19
2022-01-26 14:17:07.009 | DEBUG    | __main__:trials:24 - Trial = 8681/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.011 | DEBUG    | __main__:trials:29 - Trial = 8681/30000 | Total reward = 53.46
2022-01-26 14:17:07.015 | DEBUG    | __main__:trials:24 - Trial = 8682/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.016 | DEBUG    | __main__:trials:29 - Trial = 8682/30000 | Total reward = 48.23
2022-01-26 14:17:07.020 | DEBUG    | __main__:trials:24 - Trial = 8683/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.021 | DEBUG    | __main__:trials:29 - Trial = 8683/30000 | Total reward = 46.62
2022-01-26 14:17:07.025 | DEBUG    | __main__:trials:24 - Trial = 8684/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.026 | DEBUG    | __main__:trials:29 - Trial = 8684/30000 | Total reward = 47.77
2022-01-26 14:17:07.030 | DEBUG    | __main__:trials:24 - Trial = 8685/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.031 | DEBUG    | __main__:trials:29 - Trial = 8685/30000 | Total reward = 19.81
2022-01-26 14:17:07.035 | DEBUG    | __main__:trials:24 - Trial = 8686/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.037 | DEBUG    | __main__:trials:29 - Trial = 8686/30000 | Total reward = 51.65
2022-01-26 14:17:07.040 | DEBUG    | __main__:trials:24 - Trial = 8687/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.042 | DEBUG    | __main__:trials:29 - Trial = 8687/30000 | Total reward = 45.39
2022-01-26 14:17:07.046 | DEBUG    | __main__:trials:24 - Trial = 8688/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.047 | DEBUG    | __main__:trials:29 - Trial = 8688/30000 | Total reward = 55.07
2022-01-26 14:17:07.051 | DEBUG    | __main__:trials:24 - Trial = 8689/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.052 | DEBUG    | __main__:trials:29 - Trial = 8689/30000 | Total reward = 51.65
2022-01-26 14:17:07.056 | DEBUG    | __main__:trials:24 - Trial = 8690/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.058 | DEBUG    | __main__:trials:29 - Trial = 8690/30000 | Total reward = 51.81
2022-01-26 14:17:07.061 | DEBUG    | __main__:trials:24 - Trial = 8691/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.062 | DEBUG    | __main__:trials:29 - Trial = 8691/30000 | Total reward = 52.85
2022-01-26 14:17:07.066 | DEBUG    | __main__:trials:24 - Trial = 8692/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.068 | DEBUG    | __main__:trials:29 - Trial = 8692/30000 | Total reward = 46.62
2022-01-26 14:17:07.071 | DEBUG    | __main__:trials:24 - Trial = 8693/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.073 | DEBUG    | __main__:trials:29 - Trial = 8693/30000 | Total reward = 51.65
2022-01-26 14:17:07.076 | DEBUG    | __main__:trials:26 - Trial = 8694/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.077 | DEBUG    | __main__:trials:29 - Trial = 8694/30000 | Total reward = 25.77
2022-01-26 14:17:07.081 | DEBUG    | __main__:trials:24 - Trial = 8695/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.082 | DEBUG    | __main__:trials:29 - Trial = 8695/30000 | Total reward = 50.74
2022-01-26 14:17:07.086 | DEBUG    | __main__:trials:24 - Trial = 8696/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.087 | DEBUG    | __main__:trials:29 - Trial = 8696/30000 | Total reward = 29.87
2022-01-26 14:17:07.091 | DEBUG    | __main__:trials:24 - Trial = 8697/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.093 | DEBUG    | __main__:trials:29 - Trial = 8697/30000 | Total reward = 50.57
2022-01-26 14:17:07.096 | DEBUG    | __main__:trials:24 - Trial = 8698/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.098 | DEBUG    | __main__:trials:29 - Trial = 8698/30000 | Total reward = 52.29
2022-01-26 14:17:07.101 | DEBUG    | __main__:trials:24 - Trial = 8699/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.103 | DEBUG    | __main__:trials:29 - Trial = 8699/30000 | Total reward = 52.39
2022-01-26 14:17:07.107 | DEBUG    | __main__:trials:24 - Trial = 8700/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.108 | DEBUG    | __main__:trials:29 - Trial = 8700/30000 | Total reward = 31.13
2022-01-26 14:17:07.112 | DEBUG    | __main__:trials:26 - Trial = 8701/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.113 | DEBUG    | __main__:trials:29 - Trial = 8701/30000 | Total reward = 11.54
2022-01-26 14:17:07.117 | DEBUG    | __main__:trials:24 - Trial = 8702/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.119 | DEBUG    | __main__:trials:29 - Trial = 8702/30000 | Total reward = 63.72
2022-01-26 14:17:07.122 | DEBUG    | __main__:trials:24 - Trial = 8703/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.124 | DEBUG    | __main__:trials:29 - Trial = 8703/30000 | Total reward = 44.95
2022-01-26 14:17:07.127 | DEBUG    | __main__:trials:24 - Trial = 8704/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.129 | DEBUG    | __main__:trials:29 - Trial = 8704/30000 | Total reward = 48.44
2022-01-26 14:17:07.133 | DEBUG    | __main__:trials:24 - Trial = 8705/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.135 | DEBUG    | __main__:trials:29 - Trial = 8705/30000 | Total reward = 52.16
2022-01-26 14:17:07.138 | DEBUG    | __main__:trials:24 - Trial = 8706/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.140 | DEBUG    | __main__:trials:29 - Trial = 8706/30000 | Total reward = 47.21
2022-01-26 14:17:07.143 | DEBUG    | __main__:trials:24 - Trial = 8707/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.145 | DEBUG    | __main__:trials:29 - Trial = 8707/30000 | Total reward = 39.31
2022-01-26 14:17:07.149 | DEBUG    | __main__:trials:24 - Trial = 8708/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.150 | DEBUG    | __main__:trials:29 - Trial = 8708/30000 | Total reward = 54.48
2022-01-26 14:17:07.154 | DEBUG    | __main__:trials:24 - Trial = 8709/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.156 | DEBUG    | __main__:trials:29 - Trial = 8709/30000 | Total reward = 32.04
2022-01-26 14:17:07.159 | DEBUG    | __main__:trials:24 - Trial = 8710/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.161 | DEBUG    | __main__:trials:29 - Trial = 8710/30000 | Total reward = 29.29
2022-01-26 14:17:07.163 | DEBUG    | __main__:trials:24 - Trial = 8711/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.165 | DEBUG    | __main__:trials:29 - Trial = 8711/30000 | Total reward = 51.93
2022-01-26 14:17:07.169 | DEBUG    | __main__:trials:24 - Trial = 8712/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.170 | DEBUG    | __main__:trials:29 - Trial = 8712/30000 | Total reward = 34.71
2022-01-26 14:17:07.173 | DEBUG    | __main__:trials:24 - Trial = 8713/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.174 | DEBUG    | __main__:trials:29 - Trial = 8713/30000 | Total reward = 40.10
2022-01-26 14:17:07.178 | DEBUG    | __main__:trials:24 - Trial = 8714/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.178 | DEBUG    | __main__:trials:29 - Trial = 8714/30000 | Total reward = 32.56
2022-01-26 14:17:07.181 | DEBUG    | __main__:trials:26 - Trial = 8715/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.183 | DEBUG    | __main__:trials:29 - Trial = 8715/30000 | Total reward = 11.11
2022-01-26 14:17:07.187 | DEBUG    | __main__:trials:24 - Trial = 8716/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.188 | DEBUG    | __main__:trials:29 - Trial = 8716/30000 | Total reward = 34.36
2022-01-26 14:17:07.191 | DEBUG    | __main__:trials:24 - Trial = 8717/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.193 | DEBUG    | __main__:trials:29 - Trial = 8717/30000 | Total reward = 37.16
2022-01-26 14:17:07.197 | DEBUG    | __main__:trials:24 - Trial = 8718/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.198 | DEBUG    | __main__:trials:29 - Trial = 8718/30000 | Total reward = 34.27
2022-01-26 14:17:07.201 | DEBUG    | __main__:trials:24 - Trial = 8719/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.202 | DEBUG    | __main__:trials:29 - Trial = 8719/30000 | Total reward = 50.32
2022-01-26 14:17:07.205 | DEBUG    | __main__:trials:24 - Trial = 8720/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.206 | DEBUG    | __main__:trials:29 - Trial = 8720/30000 | Total reward = 33.34
2022-01-26 14:17:07.209 | DEBUG    | __main__:trials:24 - Trial = 8721/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.210 | DEBUG    | __main__:trials:29 - Trial = 8721/30000 | Total reward = 48.86
2022-01-26 14:17:07.213 | DEBUG    | __main__:trials:24 - Trial = 8722/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.214 | DEBUG    | __main__:trials:29 - Trial = 8722/30000 | Total reward = 39.97
2022-01-26 14:17:07.217 | DEBUG    | __main__:trials:24 - Trial = 8723/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.218 | DEBUG    | __main__:trials:29 - Trial = 8723/30000 | Total reward = 34.73
2022-01-26 14:17:07.221 | DEBUG    | __main__:trials:24 - Trial = 8724/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.223 | DEBUG    | __main__:trials:29 - Trial = 8724/30000 | Total reward = 23.98
2022-01-26 14:17:07.226 | DEBUG    | __main__:trials:24 - Trial = 8725/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.227 | DEBUG    | __main__:trials:29 - Trial = 8725/30000 | Total reward = 42.18
2022-01-26 14:17:07.230 | DEBUG    | __main__:trials:24 - Trial = 8726/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.231 | DEBUG    | __main__:trials:29 - Trial = 8726/30000 | Total reward = 40.90
2022-01-26 14:17:07.235 | DEBUG    | __main__:trials:24 - Trial = 8727/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.237 | DEBUG    | __main__:trials:29 - Trial = 8727/30000 | Total reward = 36.08
2022-01-26 14:17:07.240 | DEBUG    | __main__:trials:24 - Trial = 8728/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.242 | DEBUG    | __main__:trials:29 - Trial = 8728/30000 | Total reward = 39.82
2022-01-26 14:17:07.245 | DEBUG    | __main__:trials:24 - Trial = 8729/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.246 | DEBUG    | __main__:trials:29 - Trial = 8729/30000 | Total reward = 44.02
2022-01-26 14:17:07.249 | DEBUG    | __main__:trials:24 - Trial = 8730/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.250 | DEBUG    | __main__:trials:29 - Trial = 8730/30000 | Total reward = 41.88
2022-01-26 14:17:07.252 | DEBUG    | __main__:trials:26 - Trial = 8731/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.254 | DEBUG    | __main__:trials:29 - Trial = 8731/30000 | Total reward = 13.13
2022-01-26 14:17:07.257 | DEBUG    | __main__:trials:24 - Trial = 8732/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.259 | DEBUG    | __main__:trials:29 - Trial = 8732/30000 | Total reward = 41.58
2022-01-26 14:17:07.263 | DEBUG    | __main__:trials:24 - Trial = 8733/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.264 | DEBUG    | __main__:trials:29 - Trial = 8733/30000 | Total reward = 42.30
2022-01-26 14:17:07.268 | DEBUG    | __main__:trials:24 - Trial = 8734/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.270 | DEBUG    | __main__:trials:29 - Trial = 8734/30000 | Total reward = 40.07
2022-01-26 14:17:07.273 | DEBUG    | __main__:trials:24 - Trial = 8735/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.275 | DEBUG    | __main__:trials:29 - Trial = 8735/30000 | Total reward = 32.56
2022-01-26 14:17:07.279 | DEBUG    | __main__:trials:24 - Trial = 8736/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.280 | DEBUG    | __main__:trials:29 - Trial = 8736/30000 | Total reward = 42.07
2022-01-26 14:17:07.284 | DEBUG    | __main__:trials:24 - Trial = 8737/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.285 | DEBUG    | __main__:trials:29 - Trial = 8737/30000 | Total reward = 47.04
2022-01-26 14:17:07.288 | DEBUG    | __main__:trials:24 - Trial = 8738/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.290 | DEBUG    | __main__:trials:29 - Trial = 8738/30000 | Total reward = 38.82
2022-01-26 14:17:07.293 | DEBUG    | __main__:trials:24 - Trial = 8739/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.295 | DEBUG    | __main__:trials:29 - Trial = 8739/30000 | Total reward = 43.09
2022-01-26 14:17:07.298 | DEBUG    | __main__:trials:24 - Trial = 8740/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.298 | DEBUG    | __main__:trials:29 - Trial = 8740/30000 | Total reward = 23.85
2022-01-26 14:17:07.302 | DEBUG    | __main__:trials:24 - Trial = 8741/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.303 | DEBUG    | __main__:trials:29 - Trial = 8741/30000 | Total reward = 44.99
2022-01-26 14:17:07.306 | DEBUG    | __main__:trials:24 - Trial = 8742/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.307 | DEBUG    | __main__:trials:29 - Trial = 8742/30000 | Total reward = 40.35
2022-01-26 14:17:07.310 | DEBUG    | __main__:trials:24 - Trial = 8743/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.312 | DEBUG    | __main__:trials:29 - Trial = 8743/30000 | Total reward = 38.56
2022-01-26 14:17:07.315 | DEBUG    | __main__:trials:24 - Trial = 8744/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.317 | DEBUG    | __main__:trials:29 - Trial = 8744/30000 | Total reward = 38.19
2022-01-26 14:17:07.321 | DEBUG    | __main__:trials:24 - Trial = 8745/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.323 | DEBUG    | __main__:trials:29 - Trial = 8745/30000 | Total reward = 57.61
2022-01-26 14:17:07.326 | DEBUG    | __main__:trials:24 - Trial = 8746/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.326 | DEBUG    | __main__:trials:29 - Trial = 8746/30000 | Total reward = 43.33
2022-01-26 14:17:07.330 | DEBUG    | __main__:trials:24 - Trial = 8747/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.331 | DEBUG    | __main__:trials:29 - Trial = 8747/30000 | Total reward = 47.29
2022-01-26 14:17:07.334 | DEBUG    | __main__:trials:24 - Trial = 8748/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.336 | DEBUG    | __main__:trials:29 - Trial = 8748/30000 | Total reward = 40.65
2022-01-26 14:17:07.339 | DEBUG    | __main__:trials:24 - Trial = 8749/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.341 | DEBUG    | __main__:trials:29 - Trial = 8749/30000 | Total reward = 40.41
2022-01-26 14:17:07.344 | DEBUG    | __main__:trials:24 - Trial = 8750/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.346 | DEBUG    | __main__:trials:29 - Trial = 8750/30000 | Total reward = 36.68
2022-01-26 14:17:07.349 | DEBUG    | __main__:trials:24 - Trial = 8751/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.351 | DEBUG    | __main__:trials:29 - Trial = 8751/30000 | Total reward = 31.65
2022-01-26 14:17:07.354 | DEBUG    | __main__:trials:24 - Trial = 8752/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.356 | DEBUG    | __main__:trials:29 - Trial = 8752/30000 | Total reward = 43.73
2022-01-26 14:17:07.359 | DEBUG    | __main__:trials:24 - Trial = 8753/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.361 | DEBUG    | __main__:trials:29 - Trial = 8753/30000 | Total reward = 37.65
2022-01-26 14:17:07.364 | DEBUG    | __main__:trials:24 - Trial = 8754/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.365 | DEBUG    | __main__:trials:29 - Trial = 8754/30000 | Total reward = 44.72
2022-01-26 14:17:07.369 | DEBUG    | __main__:trials:24 - Trial = 8755/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.369 | DEBUG    | __main__:trials:29 - Trial = 8755/30000 | Total reward = 25.90
2022-01-26 14:17:07.373 | DEBUG    | __main__:trials:24 - Trial = 8756/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.375 | DEBUG    | __main__:trials:29 - Trial = 8756/30000 | Total reward = 26.22
2022-01-26 14:17:07.379 | DEBUG    | __main__:trials:24 - Trial = 8757/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.380 | DEBUG    | __main__:trials:29 - Trial = 8757/30000 | Total reward = 43.95
2022-01-26 14:17:07.384 | DEBUG    | __main__:trials:24 - Trial = 8758/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.386 | DEBUG    | __main__:trials:29 - Trial = 8758/30000 | Total reward = 42.41
2022-01-26 14:17:07.389 | DEBUG    | __main__:trials:24 - Trial = 8759/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.390 | DEBUG    | __main__:trials:29 - Trial = 8759/30000 | Total reward = 37.35
2022-01-26 14:17:07.394 | DEBUG    | __main__:trials:24 - Trial = 8760/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.395 | DEBUG    | __main__:trials:29 - Trial = 8760/30000 | Total reward = 39.79
2022-01-26 14:17:07.399 | DEBUG    | __main__:trials:24 - Trial = 8761/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.401 | DEBUG    | __main__:trials:29 - Trial = 8761/30000 | Total reward = 46.08
2022-01-26 14:17:07.405 | DEBUG    | __main__:trials:24 - Trial = 8762/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.406 | DEBUG    | __main__:trials:29 - Trial = 8762/30000 | Total reward = 44.61
2022-01-26 14:17:07.409 | DEBUG    | __main__:trials:24 - Trial = 8763/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.410 | DEBUG    | __main__:trials:29 - Trial = 8763/30000 | Total reward = 40.63
2022-01-26 14:17:07.414 | DEBUG    | __main__:trials:24 - Trial = 8764/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.415 | DEBUG    | __main__:trials:29 - Trial = 8764/30000 | Total reward = 45.88
2022-01-26 14:17:07.419 | DEBUG    | __main__:trials:24 - Trial = 8765/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.421 | DEBUG    | __main__:trials:29 - Trial = 8765/30000 | Total reward = 42.72
2022-01-26 14:17:07.424 | DEBUG    | __main__:trials:24 - Trial = 8766/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.426 | DEBUG    | __main__:trials:29 - Trial = 8766/30000 | Total reward = 45.03
2022-01-26 14:17:07.430 | DEBUG    | __main__:trials:24 - Trial = 8767/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.431 | DEBUG    | __main__:trials:29 - Trial = 8767/30000 | Total reward = 48.25
2022-01-26 14:17:07.435 | DEBUG    | __main__:trials:24 - Trial = 8768/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.436 | DEBUG    | __main__:trials:29 - Trial = 8768/30000 | Total reward = 45.63
2022-01-26 14:17:07.440 | DEBUG    | __main__:trials:24 - Trial = 8769/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.441 | DEBUG    | __main__:trials:29 - Trial = 8769/30000 | Total reward = 40.32
2022-01-26 14:17:07.445 | DEBUG    | __main__:trials:24 - Trial = 8770/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.446 | DEBUG    | __main__:trials:29 - Trial = 8770/30000 | Total reward = 52.72
2022-01-26 14:17:07.450 | DEBUG    | __main__:trials:24 - Trial = 8771/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.452 | DEBUG    | __main__:trials:29 - Trial = 8771/30000 | Total reward = 48.14
2022-01-26 14:17:07.455 | DEBUG    | __main__:trials:24 - Trial = 8772/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.457 | DEBUG    | __main__:trials:29 - Trial = 8772/30000 | Total reward = 42.49
2022-01-26 14:17:07.460 | DEBUG    | __main__:trials:24 - Trial = 8773/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.462 | DEBUG    | __main__:trials:29 - Trial = 8773/30000 | Total reward = 38.91
2022-01-26 14:17:07.466 | DEBUG    | __main__:trials:24 - Trial = 8774/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.467 | DEBUG    | __main__:trials:29 - Trial = 8774/30000 | Total reward = 40.26
2022-01-26 14:17:07.471 | DEBUG    | __main__:trials:24 - Trial = 8775/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.472 | DEBUG    | __main__:trials:29 - Trial = 8775/30000 | Total reward = 47.58
2022-01-26 14:17:07.475 | DEBUG    | __main__:trials:24 - Trial = 8776/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.477 | DEBUG    | __main__:trials:29 - Trial = 8776/30000 | Total reward = 50.19
2022-01-26 14:17:07.481 | DEBUG    | __main__:trials:24 - Trial = 8777/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.483 | DEBUG    | __main__:trials:29 - Trial = 8777/30000 | Total reward = 51.65
2022-01-26 14:17:07.486 | DEBUG    | __main__:trials:24 - Trial = 8778/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.488 | DEBUG    | __main__:trials:29 - Trial = 8778/30000 | Total reward = 53.59
2022-01-26 14:17:07.491 | DEBUG    | __main__:trials:24 - Trial = 8779/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.493 | DEBUG    | __main__:trials:29 - Trial = 8779/30000 | Total reward = 47.80
2022-01-26 14:17:07.496 | DEBUG    | __main__:trials:24 - Trial = 8780/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.498 | DEBUG    | __main__:trials:29 - Trial = 8780/30000 | Total reward = 45.80
2022-01-26 14:17:07.501 | DEBUG    | __main__:trials:24 - Trial = 8781/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.502 | DEBUG    | __main__:trials:29 - Trial = 8781/30000 | Total reward = 54.69
2022-01-26 14:17:07.505 | DEBUG    | __main__:trials:24 - Trial = 8782/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.506 | DEBUG    | __main__:trials:29 - Trial = 8782/30000 | Total reward = 39.93
2022-01-26 14:17:07.509 | DEBUG    | __main__:trials:24 - Trial = 8783/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.511 | DEBUG    | __main__:trials:29 - Trial = 8783/30000 | Total reward = 48.83
2022-01-26 14:17:07.514 | DEBUG    | __main__:trials:24 - Trial = 8784/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.515 | DEBUG    | __main__:trials:29 - Trial = 8784/30000 | Total reward = 38.00
2022-01-26 14:17:07.519 | DEBUG    | __main__:trials:24 - Trial = 8785/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.521 | DEBUG    | __main__:trials:29 - Trial = 8785/30000 | Total reward = 36.95
2022-01-26 14:17:07.524 | DEBUG    | __main__:trials:24 - Trial = 8786/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.526 | DEBUG    | __main__:trials:29 - Trial = 8786/30000 | Total reward = 41.10
2022-01-26 14:17:07.529 | DEBUG    | __main__:trials:24 - Trial = 8787/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.531 | DEBUG    | __main__:trials:29 - Trial = 8787/30000 | Total reward = 39.12
2022-01-26 14:17:07.535 | DEBUG    | __main__:trials:24 - Trial = 8788/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.536 | DEBUG    | __main__:trials:29 - Trial = 8788/30000 | Total reward = 41.65
2022-01-26 14:17:07.540 | DEBUG    | __main__:trials:24 - Trial = 8789/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.541 | DEBUG    | __main__:trials:29 - Trial = 8789/30000 | Total reward = 51.38
2022-01-26 14:17:07.545 | DEBUG    | __main__:trials:24 - Trial = 8790/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.546 | DEBUG    | __main__:trials:29 - Trial = 8790/30000 | Total reward = 39.78
2022-01-26 14:17:07.550 | DEBUG    | __main__:trials:24 - Trial = 8791/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.551 | DEBUG    | __main__:trials:29 - Trial = 8791/30000 | Total reward = 43.09
2022-01-26 14:17:07.555 | DEBUG    | __main__:trials:24 - Trial = 8792/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.556 | DEBUG    | __main__:trials:29 - Trial = 8792/30000 | Total reward = 43.08
2022-01-26 14:17:07.560 | DEBUG    | __main__:trials:24 - Trial = 8793/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.561 | DEBUG    | __main__:trials:29 - Trial = 8793/30000 | Total reward = 47.42
2022-01-26 14:17:07.565 | DEBUG    | __main__:trials:24 - Trial = 8794/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.567 | DEBUG    | __main__:trials:29 - Trial = 8794/30000 | Total reward = 41.84
2022-01-26 14:17:07.571 | DEBUG    | __main__:trials:24 - Trial = 8795/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.572 | DEBUG    | __main__:trials:29 - Trial = 8795/30000 | Total reward = 37.35
2022-01-26 14:17:07.576 | DEBUG    | __main__:trials:24 - Trial = 8796/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.578 | DEBUG    | __main__:trials:29 - Trial = 8796/30000 | Total reward = 43.49
2022-01-26 14:17:07.582 | DEBUG    | __main__:trials:24 - Trial = 8797/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.583 | DEBUG    | __main__:trials:29 - Trial = 8797/30000 | Total reward = 40.52
2022-01-26 14:17:07.587 | DEBUG    | __main__:trials:24 - Trial = 8798/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.588 | DEBUG    | __main__:trials:29 - Trial = 8798/30000 | Total reward = 43.73
2022-01-26 14:17:07.592 | DEBUG    | __main__:trials:24 - Trial = 8799/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.594 | DEBUG    | __main__:trials:29 - Trial = 8799/30000 | Total reward = 34.18
2022-01-26 14:17:07.597 | DEBUG    | __main__:trials:24 - Trial = 8800/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.599 | DEBUG    | __main__:trials:29 - Trial = 8800/30000 | Total reward = 39.29
2022-01-26 14:17:07.603 | DEBUG    | __main__:trials:24 - Trial = 8801/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.604 | DEBUG    | __main__:trials:29 - Trial = 8801/30000 | Total reward = 41.95
2022-01-26 14:17:07.608 | DEBUG    | __main__:trials:24 - Trial = 8802/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.609 | DEBUG    | __main__:trials:29 - Trial = 8802/30000 | Total reward = 42.00
2022-01-26 14:17:07.613 | DEBUG    | __main__:trials:24 - Trial = 8803/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.614 | DEBUG    | __main__:trials:29 - Trial = 8803/30000 | Total reward = 43.01
2022-01-26 14:17:07.618 | DEBUG    | __main__:trials:24 - Trial = 8804/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.619 | DEBUG    | __main__:trials:29 - Trial = 8804/30000 | Total reward = 44.30
2022-01-26 14:17:07.623 | DEBUG    | __main__:trials:24 - Trial = 8805/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.625 | DEBUG    | __main__:trials:29 - Trial = 8805/30000 | Total reward = 33.40
2022-01-26 14:17:07.628 | DEBUG    | __main__:trials:24 - Trial = 8806/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.630 | DEBUG    | __main__:trials:29 - Trial = 8806/30000 | Total reward = 35.52
2022-01-26 14:17:07.634 | DEBUG    | __main__:trials:24 - Trial = 8807/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.635 | DEBUG    | __main__:trials:29 - Trial = 8807/30000 | Total reward = 40.92
2022-01-26 14:17:07.639 | DEBUG    | __main__:trials:24 - Trial = 8808/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.641 | DEBUG    | __main__:trials:29 - Trial = 8808/30000 | Total reward = 33.35
2022-01-26 14:17:07.644 | DEBUG    | __main__:trials:26 - Trial = 8809/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.645 | DEBUG    | __main__:trials:29 - Trial = 8809/30000 | Total reward = 18.19
2022-01-26 14:17:07.649 | DEBUG    | __main__:trials:24 - Trial = 8810/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.650 | DEBUG    | __main__:trials:29 - Trial = 8810/30000 | Total reward = 38.46
2022-01-26 14:17:07.653 | DEBUG    | __main__:trials:24 - Trial = 8811/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.654 | DEBUG    | __main__:trials:29 - Trial = 8811/30000 | Total reward = 43.10
2022-01-26 14:17:07.658 | DEBUG    | __main__:trials:24 - Trial = 8812/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.659 | DEBUG    | __main__:trials:29 - Trial = 8812/30000 | Total reward = 39.18
2022-01-26 14:17:07.662 | DEBUG    | __main__:trials:24 - Trial = 8813/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.664 | DEBUG    | __main__:trials:29 - Trial = 8813/30000 | Total reward = 40.14
2022-01-26 14:17:07.668 | DEBUG    | __main__:trials:24 - Trial = 8814/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.669 | DEBUG    | __main__:trials:29 - Trial = 8814/30000 | Total reward = 36.45
2022-01-26 14:17:07.672 | DEBUG    | __main__:trials:24 - Trial = 8815/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.674 | DEBUG    | __main__:trials:29 - Trial = 8815/30000 | Total reward = 42.82
2022-01-26 14:17:07.678 | DEBUG    | __main__:trials:24 - Trial = 8816/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.679 | DEBUG    | __main__:trials:29 - Trial = 8816/30000 | Total reward = 38.17
2022-01-26 14:17:07.682 | DEBUG    | __main__:trials:24 - Trial = 8817/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.684 | DEBUG    | __main__:trials:29 - Trial = 8817/30000 | Total reward = 40.53
2022-01-26 14:17:07.688 | DEBUG    | __main__:trials:24 - Trial = 8818/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.689 | DEBUG    | __main__:trials:29 - Trial = 8818/30000 | Total reward = 37.68
2022-01-26 14:17:07.693 | DEBUG    | __main__:trials:24 - Trial = 8819/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.695 | DEBUG    | __main__:trials:29 - Trial = 8819/30000 | Total reward = 40.92
2022-01-26 14:17:07.699 | DEBUG    | __main__:trials:24 - Trial = 8820/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.700 | DEBUG    | __main__:trials:29 - Trial = 8820/30000 | Total reward = 39.36
2022-01-26 14:17:07.704 | DEBUG    | __main__:trials:24 - Trial = 8821/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.704 | DEBUG    | __main__:trials:29 - Trial = 8821/30000 | Total reward = 35.07
2022-01-26 14:17:07.708 | DEBUG    | __main__:trials:24 - Trial = 8822/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.710 | DEBUG    | __main__:trials:29 - Trial = 8822/30000 | Total reward = 43.51
2022-01-26 14:17:07.714 | DEBUG    | __main__:trials:24 - Trial = 8823/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.715 | DEBUG    | __main__:trials:29 - Trial = 8823/30000 | Total reward = 37.80
2022-01-26 14:17:07.719 | DEBUG    | __main__:trials:24 - Trial = 8824/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.721 | DEBUG    | __main__:trials:29 - Trial = 8824/30000 | Total reward = 43.59
2022-01-26 14:17:07.724 | DEBUG    | __main__:trials:24 - Trial = 8825/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.726 | DEBUG    | __main__:trials:29 - Trial = 8825/30000 | Total reward = 43.87
2022-01-26 14:17:07.730 | DEBUG    | __main__:trials:24 - Trial = 8826/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.731 | DEBUG    | __main__:trials:29 - Trial = 8826/30000 | Total reward = 40.58
2022-01-26 14:17:07.735 | DEBUG    | __main__:trials:24 - Trial = 8827/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.736 | DEBUG    | __main__:trials:29 - Trial = 8827/30000 | Total reward = 37.14
2022-01-26 14:17:07.740 | DEBUG    | __main__:trials:24 - Trial = 8828/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.742 | DEBUG    | __main__:trials:29 - Trial = 8828/30000 | Total reward = 48.78
2022-01-26 14:17:07.746 | DEBUG    | __main__:trials:24 - Trial = 8829/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.747 | DEBUG    | __main__:trials:29 - Trial = 8829/30000 | Total reward = 44.29
2022-01-26 14:17:07.751 | DEBUG    | __main__:trials:24 - Trial = 8830/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.752 | DEBUG    | __main__:trials:29 - Trial = 8830/30000 | Total reward = 44.51
2022-01-26 14:17:07.756 | DEBUG    | __main__:trials:24 - Trial = 8831/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.757 | DEBUG    | __main__:trials:29 - Trial = 8831/30000 | Total reward = 41.71
2022-01-26 14:17:07.761 | DEBUG    | __main__:trials:24 - Trial = 8832/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.763 | DEBUG    | __main__:trials:29 - Trial = 8832/30000 | Total reward = 45.18
2022-01-26 14:17:07.766 | DEBUG    | __main__:trials:24 - Trial = 8833/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.767 | DEBUG    | __main__:trials:29 - Trial = 8833/30000 | Total reward = 52.02
2022-01-26 14:17:07.771 | DEBUG    | __main__:trials:24 - Trial = 8834/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.773 | DEBUG    | __main__:trials:29 - Trial = 8834/30000 | Total reward = 48.98
2022-01-26 14:17:07.776 | DEBUG    | __main__:trials:26 - Trial = 8835/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.777 | DEBUG    | __main__:trials:29 - Trial = 8835/30000 | Total reward = 27.53
2022-01-26 14:17:07.780 | DEBUG    | __main__:trials:24 - Trial = 8836/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.782 | DEBUG    | __main__:trials:29 - Trial = 8836/30000 | Total reward = 43.70
2022-01-26 14:17:07.785 | DEBUG    | __main__:trials:24 - Trial = 8837/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.787 | DEBUG    | __main__:trials:29 - Trial = 8837/30000 | Total reward = 59.99
2022-01-26 14:17:07.790 | DEBUG    | __main__:trials:24 - Trial = 8838/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.791 | DEBUG    | __main__:trials:29 - Trial = 8838/30000 | Total reward = 49.32
2022-01-26 14:17:07.795 | DEBUG    | __main__:trials:24 - Trial = 8839/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.796 | DEBUG    | __main__:trials:29 - Trial = 8839/30000 | Total reward = 48.95
2022-01-26 14:17:07.800 | DEBUG    | __main__:trials:24 - Trial = 8840/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.801 | DEBUG    | __main__:trials:29 - Trial = 8840/30000 | Total reward = 46.91
2022-01-26 14:17:07.805 | DEBUG    | __main__:trials:24 - Trial = 8841/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.805 | DEBUG    | __main__:trials:29 - Trial = 8841/30000 | Total reward = 40.73
2022-01-26 14:17:07.810 | DEBUG    | __main__:trials:24 - Trial = 8842/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.812 | DEBUG    | __main__:trials:29 - Trial = 8842/30000 | Total reward = 45.94
2022-01-26 14:17:07.816 | DEBUG    | __main__:trials:24 - Trial = 8843/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.818 | DEBUG    | __main__:trials:29 - Trial = 8843/30000 | Total reward = 52.02
2022-01-26 14:17:07.821 | DEBUG    | __main__:trials:24 - Trial = 8844/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.823 | DEBUG    | __main__:trials:29 - Trial = 8844/30000 | Total reward = 36.28
2022-01-26 14:17:07.827 | DEBUG    | __main__:trials:24 - Trial = 8845/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.828 | DEBUG    | __main__:trials:29 - Trial = 8845/30000 | Total reward = 48.79
2022-01-26 14:17:07.831 | DEBUG    | __main__:trials:24 - Trial = 8846/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.833 | DEBUG    | __main__:trials:29 - Trial = 8846/30000 | Total reward = 49.51
2022-01-26 14:17:07.837 | DEBUG    | __main__:trials:24 - Trial = 8847/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.839 | DEBUG    | __main__:trials:29 - Trial = 8847/30000 | Total reward = 24.38
2022-01-26 14:17:07.842 | DEBUG    | __main__:trials:24 - Trial = 8848/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.843 | DEBUG    | __main__:trials:29 - Trial = 8848/30000 | Total reward = 47.21
2022-01-26 14:17:07.847 | DEBUG    | __main__:trials:24 - Trial = 8849/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.849 | DEBUG    | __main__:trials:29 - Trial = 8849/30000 | Total reward = 41.18
2022-01-26 14:17:07.853 | DEBUG    | __main__:trials:24 - Trial = 8850/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.854 | DEBUG    | __main__:trials:29 - Trial = 8850/30000 | Total reward = 41.82
2022-01-26 14:17:07.858 | DEBUG    | __main__:trials:24 - Trial = 8851/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.859 | DEBUG    | __main__:trials:29 - Trial = 8851/30000 | Total reward = 47.45
2022-01-26 14:17:07.863 | DEBUG    | __main__:trials:24 - Trial = 8852/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.864 | DEBUG    | __main__:trials:29 - Trial = 8852/30000 | Total reward = 47.62
2022-01-26 14:17:07.867 | DEBUG    | __main__:trials:24 - Trial = 8853/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.869 | DEBUG    | __main__:trials:29 - Trial = 8853/30000 | Total reward = 35.77
2022-01-26 14:17:07.872 | DEBUG    | __main__:trials:24 - Trial = 8854/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.874 | DEBUG    | __main__:trials:29 - Trial = 8854/30000 | Total reward = 34.88
2022-01-26 14:17:07.878 | DEBUG    | __main__:trials:24 - Trial = 8855/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.878 | DEBUG    | __main__:trials:29 - Trial = 8855/30000 | Total reward = 49.14
2022-01-26 14:17:07.882 | DEBUG    | __main__:trials:24 - Trial = 8856/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.884 | DEBUG    | __main__:trials:29 - Trial = 8856/30000 | Total reward = 44.77
2022-01-26 14:17:07.888 | DEBUG    | __main__:trials:24 - Trial = 8857/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.889 | DEBUG    | __main__:trials:29 - Trial = 8857/30000 | Total reward = 41.20
2022-01-26 14:17:07.892 | DEBUG    | __main__:trials:24 - Trial = 8858/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.894 | DEBUG    | __main__:trials:29 - Trial = 8858/30000 | Total reward = 42.86
2022-01-26 14:17:07.898 | DEBUG    | __main__:trials:24 - Trial = 8859/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.900 | DEBUG    | __main__:trials:29 - Trial = 8859/30000 | Total reward = 41.08
2022-01-26 14:17:07.903 | DEBUG    | __main__:trials:24 - Trial = 8860/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.905 | DEBUG    | __main__:trials:29 - Trial = 8860/30000 | Total reward = 44.30
2022-01-26 14:17:07.908 | DEBUG    | __main__:trials:24 - Trial = 8861/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.910 | DEBUG    | __main__:trials:29 - Trial = 8861/30000 | Total reward = 49.31
2022-01-26 14:17:07.914 | DEBUG    | __main__:trials:24 - Trial = 8862/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.915 | DEBUG    | __main__:trials:29 - Trial = 8862/30000 | Total reward = 46.41
2022-01-26 14:17:07.918 | DEBUG    | __main__:trials:24 - Trial = 8863/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.920 | DEBUG    | __main__:trials:29 - Trial = 8863/30000 | Total reward = 47.21
2022-01-26 14:17:07.923 | DEBUG    | __main__:trials:24 - Trial = 8864/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.925 | DEBUG    | __main__:trials:29 - Trial = 8864/30000 | Total reward = 52.89
2022-01-26 14:17:07.928 | DEBUG    | __main__:trials:24 - Trial = 8865/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.930 | DEBUG    | __main__:trials:29 - Trial = 8865/30000 | Total reward = 53.54
2022-01-26 14:17:07.933 | DEBUG    | __main__:trials:24 - Trial = 8866/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.934 | DEBUG    | __main__:trials:29 - Trial = 8866/30000 | Total reward = 39.23
2022-01-26 14:17:07.937 | DEBUG    | __main__:trials:24 - Trial = 8867/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.938 | DEBUG    | __main__:trials:29 - Trial = 8867/30000 | Total reward = 45.08
2022-01-26 14:17:07.941 | DEBUG    | __main__:trials:24 - Trial = 8868/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.943 | DEBUG    | __main__:trials:29 - Trial = 8868/30000 | Total reward = 46.54
2022-01-26 14:17:07.946 | DEBUG    | __main__:trials:24 - Trial = 8869/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.947 | DEBUG    | __main__:trials:29 - Trial = 8869/30000 | Total reward = 42.84
2022-01-26 14:17:07.950 | DEBUG    | __main__:trials:24 - Trial = 8870/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.951 | DEBUG    | __main__:trials:29 - Trial = 8870/30000 | Total reward = 46.70
2022-01-26 14:17:07.954 | DEBUG    | __main__:trials:24 - Trial = 8871/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.956 | DEBUG    | __main__:trials:29 - Trial = 8871/30000 | Total reward = 46.19
2022-01-26 14:17:07.960 | DEBUG    | __main__:trials:24 - Trial = 8872/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.961 | DEBUG    | __main__:trials:29 - Trial = 8872/30000 | Total reward = 41.95
2022-01-26 14:17:07.965 | DEBUG    | __main__:trials:24 - Trial = 8873/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.967 | DEBUG    | __main__:trials:29 - Trial = 8873/30000 | Total reward = 46.02
2022-01-26 14:17:07.970 | DEBUG    | __main__:trials:24 - Trial = 8874/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.972 | DEBUG    | __main__:trials:29 - Trial = 8874/30000 | Total reward = 41.44
2022-01-26 14:17:07.975 | DEBUG    | __main__:trials:24 - Trial = 8875/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.977 | DEBUG    | __main__:trials:29 - Trial = 8875/30000 | Total reward = 51.88
2022-01-26 14:17:07.980 | DEBUG    | __main__:trials:24 - Trial = 8876/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.982 | DEBUG    | __main__:trials:29 - Trial = 8876/30000 | Total reward = 42.84
2022-01-26 14:17:07.985 | DEBUG    | __main__:trials:24 - Trial = 8877/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.986 | DEBUG    | __main__:trials:29 - Trial = 8877/30000 | Total reward = 42.54
2022-01-26 14:17:07.989 | DEBUG    | __main__:trials:24 - Trial = 8878/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.991 | DEBUG    | __main__:trials:29 - Trial = 8878/30000 | Total reward = 51.65
2022-01-26 14:17:07.995 | DEBUG    | __main__:trials:24 - Trial = 8879/30000 | Max number of steps (20) reached
2022-01-26 14:17:07.995 | DEBUG    | __main__:trials:29 - Trial = 8879/30000 | Total reward = 50.98
2022-01-26 14:17:07.998 | DEBUG    | __main__:trials:26 - Trial = 8880/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:07.998 | DEBUG    | __main__:trials:29 - Trial = 8880/30000 | Total reward = 18.93
2022-01-26 14:17:08.003 | DEBUG    | __main__:trials:24 - Trial = 8881/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.004 | DEBUG    | __main__:trials:29 - Trial = 8881/30000 | Total reward = 64.74
2022-01-26 14:17:08.008 | DEBUG    | __main__:trials:24 - Trial = 8882/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.010 | DEBUG    | __main__:trials:29 - Trial = 8882/30000 | Total reward = 47.77
2022-01-26 14:17:08.013 | DEBUG    | __main__:trials:24 - Trial = 8883/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.015 | DEBUG    | __main__:trials:29 - Trial = 8883/30000 | Total reward = 35.95
2022-01-26 14:17:08.018 | DEBUG    | __main__:trials:26 - Trial = 8884/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.020 | DEBUG    | __main__:trials:29 - Trial = 8884/30000 | Total reward = 33.66
2022-01-26 14:17:08.024 | DEBUG    | __main__:trials:24 - Trial = 8885/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.025 | DEBUG    | __main__:trials:29 - Trial = 8885/30000 | Total reward = 65.59
2022-01-26 14:17:08.028 | DEBUG    | __main__:trials:24 - Trial = 8886/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.030 | DEBUG    | __main__:trials:29 - Trial = 8886/30000 | Total reward = 51.38
2022-01-26 14:17:08.034 | DEBUG    | __main__:trials:24 - Trial = 8887/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.036 | DEBUG    | __main__:trials:29 - Trial = 8887/30000 | Total reward = 30.84
2022-01-26 14:17:08.039 | DEBUG    | __main__:trials:24 - Trial = 8888/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.040 | DEBUG    | __main__:trials:29 - Trial = 8888/30000 | Total reward = 60.42
2022-01-26 14:17:08.044 | DEBUG    | __main__:trials:24 - Trial = 8889/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.046 | DEBUG    | __main__:trials:29 - Trial = 8889/30000 | Total reward = 65.65
2022-01-26 14:17:08.049 | DEBUG    | __main__:trials:24 - Trial = 8890/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.051 | DEBUG    | __main__:trials:29 - Trial = 8890/30000 | Total reward = 53.13
2022-01-26 14:17:08.055 | DEBUG    | __main__:trials:24 - Trial = 8891/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.056 | DEBUG    | __main__:trials:29 - Trial = 8891/30000 | Total reward = 57.34
2022-01-26 14:17:08.060 | DEBUG    | __main__:trials:24 - Trial = 8892/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.062 | DEBUG    | __main__:trials:29 - Trial = 8892/30000 | Total reward = 46.46
2022-01-26 14:17:08.066 | DEBUG    | __main__:trials:24 - Trial = 8893/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.067 | DEBUG    | __main__:trials:29 - Trial = 8893/30000 | Total reward = 44.61
2022-01-26 14:17:08.071 | DEBUG    | __main__:trials:24 - Trial = 8894/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.072 | DEBUG    | __main__:trials:29 - Trial = 8894/30000 | Total reward = 47.13
2022-01-26 14:17:08.076 | DEBUG    | __main__:trials:24 - Trial = 8895/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.078 | DEBUG    | __main__:trials:29 - Trial = 8895/30000 | Total reward = 59.72
2022-01-26 14:17:08.082 | DEBUG    | __main__:trials:24 - Trial = 8896/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.082 | DEBUG    | __main__:trials:29 - Trial = 8896/30000 | Total reward = 43.66
2022-01-26 14:17:08.086 | DEBUG    | __main__:trials:24 - Trial = 8897/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.088 | DEBUG    | __main__:trials:29 - Trial = 8897/30000 | Total reward = 42.40
2022-01-26 14:17:08.092 | DEBUG    | __main__:trials:24 - Trial = 8898/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.092 | DEBUG    | __main__:trials:29 - Trial = 8898/30000 | Total reward = 45.60
2022-01-26 14:17:08.096 | DEBUG    | __main__:trials:24 - Trial = 8899/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.098 | DEBUG    | __main__:trials:29 - Trial = 8899/30000 | Total reward = 51.99
2022-01-26 14:17:08.102 | DEBUG    | __main__:trials:24 - Trial = 8900/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.103 | DEBUG    | __main__:trials:29 - Trial = 8900/30000 | Total reward = 42.82
2022-01-26 14:17:08.106 | DEBUG    | __main__:trials:24 - Trial = 8901/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.107 | DEBUG    | __main__:trials:29 - Trial = 8901/30000 | Total reward = 56.08
2022-01-26 14:17:08.110 | DEBUG    | __main__:trials:24 - Trial = 8902/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.112 | DEBUG    | __main__:trials:29 - Trial = 8902/30000 | Total reward = 62.39
2022-01-26 14:17:08.116 | DEBUG    | __main__:trials:24 - Trial = 8903/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.117 | DEBUG    | __main__:trials:29 - Trial = 8903/30000 | Total reward = 44.03
2022-01-26 14:17:08.121 | DEBUG    | __main__:trials:24 - Trial = 8904/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.123 | DEBUG    | __main__:trials:29 - Trial = 8904/30000 | Total reward = 46.81
2022-01-26 14:17:08.126 | DEBUG    | __main__:trials:24 - Trial = 8905/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.128 | DEBUG    | __main__:trials:29 - Trial = 8905/30000 | Total reward = 56.81
2022-01-26 14:17:08.132 | DEBUG    | __main__:trials:24 - Trial = 8906/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.133 | DEBUG    | __main__:trials:29 - Trial = 8906/30000 | Total reward = 41.57
2022-01-26 14:17:08.136 | DEBUG    | __main__:trials:24 - Trial = 8907/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.138 | DEBUG    | __main__:trials:29 - Trial = 8907/30000 | Total reward = 46.11
2022-01-26 14:17:08.142 | DEBUG    | __main__:trials:24 - Trial = 8908/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.143 | DEBUG    | __main__:trials:29 - Trial = 8908/30000 | Total reward = 49.46
2022-01-26 14:17:08.147 | DEBUG    | __main__:trials:24 - Trial = 8909/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.149 | DEBUG    | __main__:trials:29 - Trial = 8909/30000 | Total reward = 50.85
2022-01-26 14:17:08.152 | DEBUG    | __main__:trials:24 - Trial = 8910/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.154 | DEBUG    | __main__:trials:29 - Trial = 8910/30000 | Total reward = 48.38
2022-01-26 14:17:08.158 | DEBUG    | __main__:trials:24 - Trial = 8911/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.159 | DEBUG    | __main__:trials:29 - Trial = 8911/30000 | Total reward = 39.57
2022-01-26 14:17:08.163 | DEBUG    | __main__:trials:24 - Trial = 8912/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.164 | DEBUG    | __main__:trials:29 - Trial = 8912/30000 | Total reward = 41.65
2022-01-26 14:17:08.169 | DEBUG    | __main__:trials:24 - Trial = 8913/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.170 | DEBUG    | __main__:trials:29 - Trial = 8913/30000 | Total reward = 55.07
2022-01-26 14:17:08.174 | DEBUG    | __main__:trials:24 - Trial = 8914/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.175 | DEBUG    | __main__:trials:29 - Trial = 8914/30000 | Total reward = 51.43
2022-01-26 14:17:08.179 | DEBUG    | __main__:trials:24 - Trial = 8915/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.181 | DEBUG    | __main__:trials:29 - Trial = 8915/30000 | Total reward = 57.61
2022-01-26 14:17:08.184 | DEBUG    | __main__:trials:24 - Trial = 8916/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.186 | DEBUG    | __main__:trials:29 - Trial = 8916/30000 | Total reward = 42.71
2022-01-26 14:17:08.190 | DEBUG    | __main__:trials:24 - Trial = 8917/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.191 | DEBUG    | __main__:trials:29 - Trial = 8917/30000 | Total reward = 47.00
2022-01-26 14:17:08.195 | DEBUG    | __main__:trials:24 - Trial = 8918/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.196 | DEBUG    | __main__:trials:29 - Trial = 8918/30000 | Total reward = 45.99
2022-01-26 14:17:08.200 | DEBUG    | __main__:trials:24 - Trial = 8919/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.201 | DEBUG    | __main__:trials:29 - Trial = 8919/30000 | Total reward = 46.91
2022-01-26 14:17:08.205 | DEBUG    | __main__:trials:24 - Trial = 8920/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.206 | DEBUG    | __main__:trials:29 - Trial = 8920/30000 | Total reward = 54.17
2022-01-26 14:17:08.210 | DEBUG    | __main__:trials:24 - Trial = 8921/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.211 | DEBUG    | __main__:trials:29 - Trial = 8921/30000 | Total reward = 39.15
2022-01-26 14:17:08.215 | DEBUG    | __main__:trials:24 - Trial = 8922/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.217 | DEBUG    | __main__:trials:29 - Trial = 8922/30000 | Total reward = 36.49
2022-01-26 14:17:08.220 | DEBUG    | __main__:trials:24 - Trial = 8923/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.222 | DEBUG    | __main__:trials:29 - Trial = 8923/30000 | Total reward = 39.12
2022-01-26 14:17:08.226 | DEBUG    | __main__:trials:24 - Trial = 8924/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.227 | DEBUG    | __main__:trials:29 - Trial = 8924/30000 | Total reward = 39.44
2022-01-26 14:17:08.231 | DEBUG    | __main__:trials:24 - Trial = 8925/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.232 | DEBUG    | __main__:trials:29 - Trial = 8925/30000 | Total reward = 38.69
2022-01-26 14:17:08.236 | DEBUG    | __main__:trials:24 - Trial = 8926/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.237 | DEBUG    | __main__:trials:29 - Trial = 8926/30000 | Total reward = 41.71
2022-01-26 14:17:08.240 | DEBUG    | __main__:trials:24 - Trial = 8927/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.242 | DEBUG    | __main__:trials:29 - Trial = 8927/30000 | Total reward = 32.36
2022-01-26 14:17:08.246 | DEBUG    | __main__:trials:24 - Trial = 8928/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.247 | DEBUG    | __main__:trials:29 - Trial = 8928/30000 | Total reward = 50.05
2022-01-26 14:17:08.249 | DEBUG    | __main__:trials:26 - Trial = 8929/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.251 | DEBUG    | __main__:trials:29 - Trial = 8929/30000 | Total reward = 12.57
2022-01-26 14:17:08.255 | DEBUG    | __main__:trials:24 - Trial = 8930/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.256 | DEBUG    | __main__:trials:29 - Trial = 8930/30000 | Total reward = 41.75
2022-01-26 14:17:08.260 | DEBUG    | __main__:trials:24 - Trial = 8931/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.261 | DEBUG    | __main__:trials:29 - Trial = 8931/30000 | Total reward = 64.45
2022-01-26 14:17:08.264 | DEBUG    | __main__:trials:24 - Trial = 8932/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.266 | DEBUG    | __main__:trials:29 - Trial = 8932/30000 | Total reward = 36.27
2022-01-26 14:17:08.270 | DEBUG    | __main__:trials:24 - Trial = 8933/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.271 | DEBUG    | __main__:trials:29 - Trial = 8933/30000 | Total reward = 39.76
2022-01-26 14:17:08.274 | DEBUG    | __main__:trials:26 - Trial = 8934/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.276 | DEBUG    | __main__:trials:29 - Trial = 8934/30000 | Total reward = 10.46
2022-01-26 14:17:08.279 | DEBUG    | __main__:trials:24 - Trial = 8935/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.281 | DEBUG    | __main__:trials:29 - Trial = 8935/30000 | Total reward = 35.08
2022-01-26 14:17:08.285 | DEBUG    | __main__:trials:24 - Trial = 8936/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.286 | DEBUG    | __main__:trials:29 - Trial = 8936/30000 | Total reward = 33.36
2022-01-26 14:17:08.290 | DEBUG    | __main__:trials:24 - Trial = 8937/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.292 | DEBUG    | __main__:trials:29 - Trial = 8937/30000 | Total reward = 40.67
2022-01-26 14:17:08.295 | DEBUG    | __main__:trials:26 - Trial = 8938/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.297 | DEBUG    | __main__:trials:29 - Trial = 8938/30000 | Total reward = 15.64
2022-01-26 14:17:08.299 | DEBUG    | __main__:trials:24 - Trial = 8939/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.301 | DEBUG    | __main__:trials:29 - Trial = 8939/30000 | Total reward = 53.32
2022-01-26 14:17:08.305 | DEBUG    | __main__:trials:24 - Trial = 8940/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.306 | DEBUG    | __main__:trials:29 - Trial = 8940/30000 | Total reward = 38.86
2022-01-26 14:17:08.310 | DEBUG    | __main__:trials:24 - Trial = 8941/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.311 | DEBUG    | __main__:trials:29 - Trial = 8941/30000 | Total reward = 32.45
2022-01-26 14:17:08.315 | DEBUG    | __main__:trials:24 - Trial = 8942/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.317 | DEBUG    | __main__:trials:29 - Trial = 8942/30000 | Total reward = 35.97
2022-01-26 14:17:08.320 | DEBUG    | __main__:trials:24 - Trial = 8943/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.322 | DEBUG    | __main__:trials:29 - Trial = 8943/30000 | Total reward = 38.25
2022-01-26 14:17:08.325 | DEBUG    | __main__:trials:24 - Trial = 8944/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.327 | DEBUG    | __main__:trials:29 - Trial = 8944/30000 | Total reward = 38.54
2022-01-26 14:17:08.330 | DEBUG    | __main__:trials:24 - Trial = 8945/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.332 | DEBUG    | __main__:trials:29 - Trial = 8945/30000 | Total reward = 27.13
2022-01-26 14:17:08.336 | DEBUG    | __main__:trials:24 - Trial = 8946/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.338 | DEBUG    | __main__:trials:29 - Trial = 8946/30000 | Total reward = 43.33
2022-01-26 14:17:08.341 | DEBUG    | __main__:trials:24 - Trial = 8947/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.343 | DEBUG    | __main__:trials:29 - Trial = 8947/30000 | Total reward = 46.65
2022-01-26 14:17:08.347 | DEBUG    | __main__:trials:24 - Trial = 8948/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.348 | DEBUG    | __main__:trials:29 - Trial = 8948/30000 | Total reward = 36.95
2022-01-26 14:17:08.352 | DEBUG    | __main__:trials:24 - Trial = 8949/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.353 | DEBUG    | __main__:trials:29 - Trial = 8949/30000 | Total reward = 49.15
2022-01-26 14:17:08.357 | DEBUG    | __main__:trials:24 - Trial = 8950/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.357 | DEBUG    | __main__:trials:29 - Trial = 8950/30000 | Total reward = 37.94
2022-01-26 14:17:08.362 | DEBUG    | __main__:trials:24 - Trial = 8951/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.363 | DEBUG    | __main__:trials:29 - Trial = 8951/30000 | Total reward = 47.92
2022-01-26 14:17:08.367 | DEBUG    | __main__:trials:24 - Trial = 8952/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.368 | DEBUG    | __main__:trials:29 - Trial = 8952/30000 | Total reward = 43.10
2022-01-26 14:17:08.372 | DEBUG    | __main__:trials:24 - Trial = 8953/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.374 | DEBUG    | __main__:trials:29 - Trial = 8953/30000 | Total reward = 47.80
2022-01-26 14:17:08.377 | DEBUG    | __main__:trials:24 - Trial = 8954/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.379 | DEBUG    | __main__:trials:29 - Trial = 8954/30000 | Total reward = 48.77
2022-01-26 14:17:08.382 | DEBUG    | __main__:trials:26 - Trial = 8955/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.383 | DEBUG    | __main__:trials:29 - Trial = 8955/30000 | Total reward = 11.03
2022-01-26 14:17:08.387 | DEBUG    | __main__:trials:24 - Trial = 8956/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.389 | DEBUG    | __main__:trials:29 - Trial = 8956/30000 | Total reward = 43.35
2022-01-26 14:17:08.391 | DEBUG    | __main__:trials:24 - Trial = 8957/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.393 | DEBUG    | __main__:trials:29 - Trial = 8957/30000 | Total reward = 28.95
2022-01-26 14:17:08.397 | DEBUG    | __main__:trials:24 - Trial = 8958/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.399 | DEBUG    | __main__:trials:29 - Trial = 8958/30000 | Total reward = 44.25
2022-01-26 14:17:08.403 | DEBUG    | __main__:trials:24 - Trial = 8959/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.404 | DEBUG    | __main__:trials:29 - Trial = 8959/30000 | Total reward = 47.21
2022-01-26 14:17:08.408 | DEBUG    | __main__:trials:24 - Trial = 8960/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.409 | DEBUG    | __main__:trials:29 - Trial = 8960/30000 | Total reward = 51.93
2022-01-26 14:17:08.413 | DEBUG    | __main__:trials:24 - Trial = 8961/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.415 | DEBUG    | __main__:trials:29 - Trial = 8961/30000 | Total reward = 42.96
2022-01-26 14:17:08.418 | DEBUG    | __main__:trials:24 - Trial = 8962/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.419 | DEBUG    | __main__:trials:29 - Trial = 8962/30000 | Total reward = 33.40
2022-01-26 14:17:08.422 | DEBUG    | __main__:trials:24 - Trial = 8963/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.424 | DEBUG    | __main__:trials:29 - Trial = 8963/30000 | Total reward = 42.18
2022-01-26 14:17:08.428 | DEBUG    | __main__:trials:24 - Trial = 8964/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.429 | DEBUG    | __main__:trials:29 - Trial = 8964/30000 | Total reward = 51.26
2022-01-26 14:17:08.433 | DEBUG    | __main__:trials:24 - Trial = 8965/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.434 | DEBUG    | __main__:trials:29 - Trial = 8965/30000 | Total reward = 40.28
2022-01-26 14:17:08.437 | DEBUG    | __main__:trials:24 - Trial = 8966/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.438 | DEBUG    | __main__:trials:29 - Trial = 8966/30000 | Total reward = 37.69
2022-01-26 14:17:08.441 | DEBUG    | __main__:trials:24 - Trial = 8967/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.442 | DEBUG    | __main__:trials:29 - Trial = 8967/30000 | Total reward = 49.20
2022-01-26 14:17:08.445 | DEBUG    | __main__:trials:24 - Trial = 8968/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.447 | DEBUG    | __main__:trials:29 - Trial = 8968/30000 | Total reward = 34.36
2022-01-26 14:17:08.451 | DEBUG    | __main__:trials:24 - Trial = 8969/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.453 | DEBUG    | __main__:trials:29 - Trial = 8969/30000 | Total reward = 41.28
2022-01-26 14:17:08.456 | DEBUG    | __main__:trials:24 - Trial = 8970/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.458 | DEBUG    | __main__:trials:29 - Trial = 8970/30000 | Total reward = 38.25
2022-01-26 14:17:08.461 | DEBUG    | __main__:trials:24 - Trial = 8971/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.462 | DEBUG    | __main__:trials:29 - Trial = 8971/30000 | Total reward = 39.40
2022-01-26 14:17:08.466 | DEBUG    | __main__:trials:24 - Trial = 8972/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.467 | DEBUG    | __main__:trials:29 - Trial = 8972/30000 | Total reward = 41.96
2022-01-26 14:17:08.470 | DEBUG    | __main__:trials:24 - Trial = 8973/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.472 | DEBUG    | __main__:trials:29 - Trial = 8973/30000 | Total reward = 37.66
2022-01-26 14:17:08.475 | DEBUG    | __main__:trials:24 - Trial = 8974/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.477 | DEBUG    | __main__:trials:29 - Trial = 8974/30000 | Total reward = 40.60
2022-01-26 14:17:08.480 | DEBUG    | __main__:trials:24 - Trial = 8975/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.482 | DEBUG    | __main__:trials:29 - Trial = 8975/30000 | Total reward = 48.50
2022-01-26 14:17:08.486 | DEBUG    | __main__:trials:24 - Trial = 8976/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.487 | DEBUG    | __main__:trials:29 - Trial = 8976/30000 | Total reward = 42.89
2022-01-26 14:17:08.491 | DEBUG    | __main__:trials:24 - Trial = 8977/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.492 | DEBUG    | __main__:trials:29 - Trial = 8977/30000 | Total reward = 32.83
2022-01-26 14:17:08.496 | DEBUG    | __main__:trials:24 - Trial = 8978/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.497 | DEBUG    | __main__:trials:29 - Trial = 8978/30000 | Total reward = 45.85
2022-01-26 14:17:08.501 | DEBUG    | __main__:trials:24 - Trial = 8979/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.502 | DEBUG    | __main__:trials:29 - Trial = 8979/30000 | Total reward = 40.89
2022-01-26 14:17:08.506 | DEBUG    | __main__:trials:24 - Trial = 8980/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.507 | DEBUG    | __main__:trials:29 - Trial = 8980/30000 | Total reward = 19.16
2022-01-26 14:17:08.512 | DEBUG    | __main__:trials:24 - Trial = 8981/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.514 | DEBUG    | __main__:trials:29 - Trial = 8981/30000 | Total reward = 47.50
2022-01-26 14:17:08.517 | DEBUG    | __main__:trials:24 - Trial = 8982/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.519 | DEBUG    | __main__:trials:29 - Trial = 8982/30000 | Total reward = 36.56
2022-01-26 14:17:08.523 | DEBUG    | __main__:trials:24 - Trial = 8983/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.524 | DEBUG    | __main__:trials:29 - Trial = 8983/30000 | Total reward = 43.10
2022-01-26 14:17:08.527 | DEBUG    | __main__:trials:24 - Trial = 8984/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.529 | DEBUG    | __main__:trials:29 - Trial = 8984/30000 | Total reward = 45.22
2022-01-26 14:17:08.532 | DEBUG    | __main__:trials:24 - Trial = 8985/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.534 | DEBUG    | __main__:trials:29 - Trial = 8985/30000 | Total reward = 52.77
2022-01-26 14:17:08.538 | DEBUG    | __main__:trials:24 - Trial = 8986/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.539 | DEBUG    | __main__:trials:29 - Trial = 8986/30000 | Total reward = 49.27
2022-01-26 14:17:08.543 | DEBUG    | __main__:trials:24 - Trial = 8987/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.544 | DEBUG    | __main__:trials:29 - Trial = 8987/30000 | Total reward = 45.86
2022-01-26 14:17:08.548 | DEBUG    | __main__:trials:24 - Trial = 8988/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.550 | DEBUG    | __main__:trials:29 - Trial = 8988/30000 | Total reward = 41.28
2022-01-26 14:17:08.553 | DEBUG    | __main__:trials:24 - Trial = 8989/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.555 | DEBUG    | __main__:trials:29 - Trial = 8989/30000 | Total reward = 45.09
2022-01-26 14:17:08.559 | DEBUG    | __main__:trials:24 - Trial = 8990/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.560 | DEBUG    | __main__:trials:29 - Trial = 8990/30000 | Total reward = 50.37
2022-01-26 14:17:08.563 | DEBUG    | __main__:trials:24 - Trial = 8991/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.565 | DEBUG    | __main__:trials:29 - Trial = 8991/30000 | Total reward = 40.91
2022-01-26 14:17:08.568 | DEBUG    | __main__:trials:24 - Trial = 8992/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.570 | DEBUG    | __main__:trials:29 - Trial = 8992/30000 | Total reward = 46.58
2022-01-26 14:17:08.573 | DEBUG    | __main__:trials:24 - Trial = 8993/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.574 | DEBUG    | __main__:trials:29 - Trial = 8993/30000 | Total reward = 49.11
2022-01-26 14:17:08.578 | DEBUG    | __main__:trials:24 - Trial = 8994/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.579 | DEBUG    | __main__:trials:29 - Trial = 8994/30000 | Total reward = 40.72
2022-01-26 14:17:08.583 | DEBUG    | __main__:trials:24 - Trial = 8995/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.584 | DEBUG    | __main__:trials:29 - Trial = 8995/30000 | Total reward = 39.32
2022-01-26 14:17:08.588 | DEBUG    | __main__:trials:24 - Trial = 8996/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.589 | DEBUG    | __main__:trials:29 - Trial = 8996/30000 | Total reward = 47.00
2022-01-26 14:17:08.593 | DEBUG    | __main__:trials:24 - Trial = 8997/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.594 | DEBUG    | __main__:trials:29 - Trial = 8997/30000 | Total reward = 41.28
2022-01-26 14:17:08.598 | DEBUG    | __main__:trials:24 - Trial = 8998/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.599 | DEBUG    | __main__:trials:29 - Trial = 8998/30000 | Total reward = 35.34
2022-01-26 14:17:08.603 | DEBUG    | __main__:trials:24 - Trial = 8999/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.604 | DEBUG    | __main__:trials:29 - Trial = 8999/30000 | Total reward = 41.60
2022-01-26 14:17:08.608 | DEBUG    | __main__:trials:24 - Trial = 9000/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.609 | DEBUG    | __main__:trials:29 - Trial = 9000/30000 | Total reward = 47.67
2022-01-26 14:17:08.613 | DEBUG    | __main__:trials:24 - Trial = 9001/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.615 | DEBUG    | __main__:trials:29 - Trial = 9001/30000 | Total reward = 36.35
2022-01-26 14:17:08.618 | DEBUG    | __main__:trials:24 - Trial = 9002/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.619 | DEBUG    | __main__:trials:29 - Trial = 9002/30000 | Total reward = 39.30
2022-01-26 14:17:08.623 | DEBUG    | __main__:trials:24 - Trial = 9003/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.624 | DEBUG    | __main__:trials:29 - Trial = 9003/30000 | Total reward = 47.74
2022-01-26 14:17:08.628 | DEBUG    | __main__:trials:24 - Trial = 9004/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.630 | DEBUG    | __main__:trials:29 - Trial = 9004/30000 | Total reward = 40.58
2022-01-26 14:17:08.633 | DEBUG    | __main__:trials:24 - Trial = 9005/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.634 | DEBUG    | __main__:trials:29 - Trial = 9005/30000 | Total reward = 42.85
2022-01-26 14:17:08.638 | DEBUG    | __main__:trials:24 - Trial = 9006/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.638 | DEBUG    | __main__:trials:29 - Trial = 9006/30000 | Total reward = 51.03
2022-01-26 14:17:08.643 | DEBUG    | __main__:trials:24 - Trial = 9007/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.644 | DEBUG    | __main__:trials:29 - Trial = 9007/30000 | Total reward = 42.20
2022-01-26 14:17:08.648 | DEBUG    | __main__:trials:24 - Trial = 9008/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.648 | DEBUG    | __main__:trials:29 - Trial = 9008/30000 | Total reward = 41.82
2022-01-26 14:17:08.653 | DEBUG    | __main__:trials:24 - Trial = 9009/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.654 | DEBUG    | __main__:trials:29 - Trial = 9009/30000 | Total reward = 38.25
2022-01-26 14:17:08.657 | DEBUG    | __main__:trials:24 - Trial = 9010/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.658 | DEBUG    | __main__:trials:29 - Trial = 9010/30000 | Total reward = 41.23
2022-01-26 14:17:08.661 | DEBUG    | __main__:trials:24 - Trial = 9011/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.662 | DEBUG    | __main__:trials:29 - Trial = 9011/30000 | Total reward = 45.36
2022-01-26 14:17:08.665 | DEBUG    | __main__:trials:24 - Trial = 9012/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.667 | DEBUG    | __main__:trials:29 - Trial = 9012/30000 | Total reward = 41.56
2022-01-26 14:17:08.671 | DEBUG    | __main__:trials:24 - Trial = 9013/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.672 | DEBUG    | __main__:trials:29 - Trial = 9013/30000 | Total reward = 38.87
2022-01-26 14:17:08.676 | DEBUG    | __main__:trials:24 - Trial = 9014/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.676 | DEBUG    | __main__:trials:29 - Trial = 9014/30000 | Total reward = 44.24
2022-01-26 14:17:08.681 | DEBUG    | __main__:trials:24 - Trial = 9015/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.682 | DEBUG    | __main__:trials:29 - Trial = 9015/30000 | Total reward = 41.65
2022-01-26 14:17:08.686 | DEBUG    | __main__:trials:24 - Trial = 9016/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.688 | DEBUG    | __main__:trials:29 - Trial = 9016/30000 | Total reward = 41.28
2022-01-26 14:17:08.691 | DEBUG    | __main__:trials:24 - Trial = 9017/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.693 | DEBUG    | __main__:trials:29 - Trial = 9017/30000 | Total reward = 30.39
2022-01-26 14:17:08.696 | DEBUG    | __main__:trials:24 - Trial = 9018/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.697 | DEBUG    | __main__:trials:29 - Trial = 9018/30000 | Total reward = 38.67
2022-01-26 14:17:08.701 | DEBUG    | __main__:trials:24 - Trial = 9019/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.702 | DEBUG    | __main__:trials:29 - Trial = 9019/30000 | Total reward = 43.95
2022-01-26 14:17:08.706 | DEBUG    | __main__:trials:24 - Trial = 9020/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.706 | DEBUG    | __main__:trials:29 - Trial = 9020/30000 | Total reward = 43.96
2022-01-26 14:17:08.711 | DEBUG    | __main__:trials:24 - Trial = 9021/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.711 | DEBUG    | __main__:trials:29 - Trial = 9021/30000 | Total reward = 35.63
2022-01-26 14:17:08.716 | DEBUG    | __main__:trials:24 - Trial = 9022/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.717 | DEBUG    | __main__:trials:29 - Trial = 9022/30000 | Total reward = 44.74
2022-01-26 14:17:08.721 | DEBUG    | __main__:trials:24 - Trial = 9023/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.722 | DEBUG    | __main__:trials:29 - Trial = 9023/30000 | Total reward = 51.05
2022-01-26 14:17:08.726 | DEBUG    | __main__:trials:24 - Trial = 9024/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.728 | DEBUG    | __main__:trials:29 - Trial = 9024/30000 | Total reward = 36.41
2022-01-26 14:17:08.731 | DEBUG    | __main__:trials:24 - Trial = 9025/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.732 | DEBUG    | __main__:trials:29 - Trial = 9025/30000 | Total reward = 37.02
2022-01-26 14:17:08.736 | DEBUG    | __main__:trials:24 - Trial = 9026/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.737 | DEBUG    | __main__:trials:29 - Trial = 9026/30000 | Total reward = 33.63
2022-01-26 14:17:08.742 | DEBUG    | __main__:trials:24 - Trial = 9027/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.742 | DEBUG    | __main__:trials:29 - Trial = 9027/30000 | Total reward = 50.07
2022-01-26 14:17:08.746 | DEBUG    | __main__:trials:24 - Trial = 9028/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.748 | DEBUG    | __main__:trials:29 - Trial = 9028/30000 | Total reward = 36.40
2022-01-26 14:17:08.751 | DEBUG    | __main__:trials:24 - Trial = 9029/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.753 | DEBUG    | __main__:trials:29 - Trial = 9029/30000 | Total reward = 50.48
2022-01-26 14:17:08.756 | DEBUG    | __main__:trials:24 - Trial = 9030/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.757 | DEBUG    | __main__:trials:29 - Trial = 9030/30000 | Total reward = 51.46
2022-01-26 14:17:08.760 | DEBUG    | __main__:trials:24 - Trial = 9031/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.762 | DEBUG    | __main__:trials:29 - Trial = 9031/30000 | Total reward = 40.71
2022-01-26 14:17:08.765 | DEBUG    | __main__:trials:24 - Trial = 9032/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.766 | DEBUG    | __main__:trials:29 - Trial = 9032/30000 | Total reward = 32.07
2022-01-26 14:17:08.769 | DEBUG    | __main__:trials:24 - Trial = 9033/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.770 | DEBUG    | __main__:trials:29 - Trial = 9033/30000 | Total reward = 45.61
2022-01-26 14:17:08.773 | DEBUG    | __main__:trials:24 - Trial = 9034/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.774 | DEBUG    | __main__:trials:29 - Trial = 9034/30000 | Total reward = 36.82
2022-01-26 14:17:08.777 | DEBUG    | __main__:trials:24 - Trial = 9035/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.778 | DEBUG    | __main__:trials:29 - Trial = 9035/30000 | Total reward = 43.09
2022-01-26 14:17:08.781 | DEBUG    | __main__:trials:24 - Trial = 9036/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.784 | DEBUG    | __main__:trials:29 - Trial = 9036/30000 | Total reward = 31.97
2022-01-26 14:17:08.786 | DEBUG    | __main__:trials:24 - Trial = 9037/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.787 | DEBUG    | __main__:trials:29 - Trial = 9037/30000 | Total reward = 44.69
2022-01-26 14:17:08.790 | DEBUG    | __main__:trials:24 - Trial = 9038/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.792 | DEBUG    | __main__:trials:29 - Trial = 9038/30000 | Total reward = 46.02
2022-01-26 14:17:08.796 | DEBUG    | __main__:trials:24 - Trial = 9039/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.797 | DEBUG    | __main__:trials:29 - Trial = 9039/30000 | Total reward = 39.97
2022-01-26 14:17:08.800 | DEBUG    | __main__:trials:24 - Trial = 9040/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.801 | DEBUG    | __main__:trials:29 - Trial = 9040/30000 | Total reward = 41.59
2022-01-26 14:17:08.806 | DEBUG    | __main__:trials:24 - Trial = 9041/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.806 | DEBUG    | __main__:trials:29 - Trial = 9041/30000 | Total reward = 39.96
2022-01-26 14:17:08.810 | DEBUG    | __main__:trials:24 - Trial = 9042/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.812 | DEBUG    | __main__:trials:29 - Trial = 9042/30000 | Total reward = 39.54
2022-01-26 14:17:08.815 | DEBUG    | __main__:trials:24 - Trial = 9043/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.816 | DEBUG    | __main__:trials:29 - Trial = 9043/30000 | Total reward = 38.48
2022-01-26 14:17:08.821 | DEBUG    | __main__:trials:24 - Trial = 9044/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.822 | DEBUG    | __main__:trials:29 - Trial = 9044/30000 | Total reward = 47.33
2022-01-26 14:17:08.826 | DEBUG    | __main__:trials:24 - Trial = 9045/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.827 | DEBUG    | __main__:trials:29 - Trial = 9045/30000 | Total reward = 41.28
2022-01-26 14:17:08.830 | DEBUG    | __main__:trials:24 - Trial = 9046/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.831 | DEBUG    | __main__:trials:29 - Trial = 9046/30000 | Total reward = 31.73
2022-01-26 14:17:08.835 | DEBUG    | __main__:trials:24 - Trial = 9047/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.836 | DEBUG    | __main__:trials:29 - Trial = 9047/30000 | Total reward = 39.75
2022-01-26 14:17:08.840 | DEBUG    | __main__:trials:24 - Trial = 9048/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.842 | DEBUG    | __main__:trials:29 - Trial = 9048/30000 | Total reward = 44.09
2022-01-26 14:17:08.846 | DEBUG    | __main__:trials:24 - Trial = 9049/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.847 | DEBUG    | __main__:trials:29 - Trial = 9049/30000 | Total reward = 43.28
2022-01-26 14:17:08.851 | DEBUG    | __main__:trials:24 - Trial = 9050/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.852 | DEBUG    | __main__:trials:29 - Trial = 9050/30000 | Total reward = 42.58
2022-01-26 14:17:08.856 | DEBUG    | __main__:trials:24 - Trial = 9051/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.858 | DEBUG    | __main__:trials:29 - Trial = 9051/30000 | Total reward = 41.05
2022-01-26 14:17:08.861 | DEBUG    | __main__:trials:24 - Trial = 9052/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.863 | DEBUG    | __main__:trials:29 - Trial = 9052/30000 | Total reward = 37.65
2022-01-26 14:17:08.866 | DEBUG    | __main__:trials:24 - Trial = 9053/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.867 | DEBUG    | __main__:trials:29 - Trial = 9053/30000 | Total reward = 38.46
2022-01-26 14:17:08.872 | DEBUG    | __main__:trials:24 - Trial = 9054/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.873 | DEBUG    | __main__:trials:29 - Trial = 9054/30000 | Total reward = 31.96
2022-01-26 14:17:08.877 | DEBUG    | __main__:trials:24 - Trial = 9055/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.878 | DEBUG    | __main__:trials:29 - Trial = 9055/30000 | Total reward = 33.36
2022-01-26 14:17:08.881 | DEBUG    | __main__:trials:24 - Trial = 9056/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.882 | DEBUG    | __main__:trials:29 - Trial = 9056/30000 | Total reward = 32.58
2022-01-26 14:17:08.886 | DEBUG    | __main__:trials:24 - Trial = 9057/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.888 | DEBUG    | __main__:trials:29 - Trial = 9057/30000 | Total reward = 43.77
2022-01-26 14:17:08.891 | DEBUG    | __main__:trials:24 - Trial = 9058/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.892 | DEBUG    | __main__:trials:29 - Trial = 9058/30000 | Total reward = 33.36
2022-01-26 14:17:08.896 | DEBUG    | __main__:trials:24 - Trial = 9059/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.897 | DEBUG    | __main__:trials:29 - Trial = 9059/30000 | Total reward = 41.85
2022-01-26 14:17:08.900 | DEBUG    | __main__:trials:24 - Trial = 9060/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.901 | DEBUG    | __main__:trials:29 - Trial = 9060/30000 | Total reward = 34.31
2022-01-26 14:17:08.905 | DEBUG    | __main__:trials:24 - Trial = 9061/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.906 | DEBUG    | __main__:trials:29 - Trial = 9061/30000 | Total reward = 35.44
2022-01-26 14:17:08.908 | DEBUG    | __main__:trials:26 - Trial = 9062/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.909 | DEBUG    | __main__:trials:29 - Trial = 9062/30000 | Total reward = 6.70
2022-01-26 14:17:08.912 | DEBUG    | __main__:trials:24 - Trial = 9063/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.913 | DEBUG    | __main__:trials:29 - Trial = 9063/30000 | Total reward = 33.05
2022-01-26 14:17:08.916 | DEBUG    | __main__:trials:24 - Trial = 9064/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.917 | DEBUG    | __main__:trials:29 - Trial = 9064/30000 | Total reward = 44.59
2022-01-26 14:17:08.920 | DEBUG    | __main__:trials:26 - Trial = 9065/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.922 | DEBUG    | __main__:trials:29 - Trial = 9065/30000 | Total reward = 21.80
2022-01-26 14:17:08.925 | DEBUG    | __main__:trials:24 - Trial = 9066/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.926 | DEBUG    | __main__:trials:29 - Trial = 9066/30000 | Total reward = 37.38
2022-01-26 14:17:08.929 | DEBUG    | __main__:trials:26 - Trial = 9067/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.930 | DEBUG    | __main__:trials:29 - Trial = 9067/30000 | Total reward = 7.41
2022-01-26 14:17:08.933 | DEBUG    | __main__:trials:24 - Trial = 9068/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.934 | DEBUG    | __main__:trials:29 - Trial = 9068/30000 | Total reward = 38.64
2022-01-26 14:17:08.937 | DEBUG    | __main__:trials:24 - Trial = 9069/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.938 | DEBUG    | __main__:trials:29 - Trial = 9069/30000 | Total reward = 29.06
2022-01-26 14:17:08.941 | DEBUG    | __main__:trials:24 - Trial = 9070/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.942 | DEBUG    | __main__:trials:29 - Trial = 9070/30000 | Total reward = 45.75
2022-01-26 14:17:08.945 | DEBUG    | __main__:trials:24 - Trial = 9071/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.946 | DEBUG    | __main__:trials:29 - Trial = 9071/30000 | Total reward = 33.09
2022-01-26 14:17:08.949 | DEBUG    | __main__:trials:24 - Trial = 9072/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.951 | DEBUG    | __main__:trials:29 - Trial = 9072/30000 | Total reward = 41.39
2022-01-26 14:17:08.955 | DEBUG    | __main__:trials:24 - Trial = 9073/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.956 | DEBUG    | __main__:trials:29 - Trial = 9073/30000 | Total reward = 55.02
2022-01-26 14:17:08.959 | DEBUG    | __main__:trials:24 - Trial = 9074/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.961 | DEBUG    | __main__:trials:29 - Trial = 9074/30000 | Total reward = 38.16
2022-01-26 14:17:08.963 | DEBUG    | __main__:trials:26 - Trial = 9075/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:08.964 | DEBUG    | __main__:trials:29 - Trial = 9075/30000 | Total reward = 12.13
2022-01-26 14:17:08.968 | DEBUG    | __main__:trials:24 - Trial = 9076/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.969 | DEBUG    | __main__:trials:29 - Trial = 9076/30000 | Total reward = 62.22
2022-01-26 14:17:08.973 | DEBUG    | __main__:trials:24 - Trial = 9077/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.975 | DEBUG    | __main__:trials:29 - Trial = 9077/30000 | Total reward = 40.05
2022-01-26 14:17:08.978 | DEBUG    | __main__:trials:24 - Trial = 9078/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.979 | DEBUG    | __main__:trials:29 - Trial = 9078/30000 | Total reward = 46.05
2022-01-26 14:17:08.983 | DEBUG    | __main__:trials:24 - Trial = 9079/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.985 | DEBUG    | __main__:trials:29 - Trial = 9079/30000 | Total reward = 41.28
2022-01-26 14:17:08.988 | DEBUG    | __main__:trials:24 - Trial = 9080/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.989 | DEBUG    | __main__:trials:29 - Trial = 9080/30000 | Total reward = 41.85
2022-01-26 14:17:08.993 | DEBUG    | __main__:trials:24 - Trial = 9081/30000 | Max number of steps (20) reached
2022-01-26 14:17:08.994 | DEBUG    | __main__:trials:29 - Trial = 9081/30000 | Total reward = 38.44
2022-01-26 14:17:08.998 | DEBUG    | __main__:trials:24 - Trial = 9082/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.000 | DEBUG    | __main__:trials:29 - Trial = 9082/30000 | Total reward = 44.19
2022-01-26 14:17:09.003 | DEBUG    | __main__:trials:24 - Trial = 9083/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.004 | DEBUG    | __main__:trials:29 - Trial = 9083/30000 | Total reward = 42.20
2022-01-26 14:17:09.008 | DEBUG    | __main__:trials:24 - Trial = 9084/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.009 | DEBUG    | __main__:trials:29 - Trial = 9084/30000 | Total reward = 31.57
2022-01-26 14:17:09.013 | DEBUG    | __main__:trials:24 - Trial = 9085/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.015 | DEBUG    | __main__:trials:29 - Trial = 9085/30000 | Total reward = 44.19
2022-01-26 14:17:09.018 | DEBUG    | __main__:trials:24 - Trial = 9086/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.020 | DEBUG    | __main__:trials:29 - Trial = 9086/30000 | Total reward = 47.36
2022-01-26 14:17:09.023 | DEBUG    | __main__:trials:24 - Trial = 9087/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.024 | DEBUG    | __main__:trials:29 - Trial = 9087/30000 | Total reward = 44.27
2022-01-26 14:17:09.027 | DEBUG    | __main__:trials:24 - Trial = 9088/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.029 | DEBUG    | __main__:trials:29 - Trial = 9088/30000 | Total reward = 33.36
2022-01-26 14:17:09.032 | DEBUG    | __main__:trials:24 - Trial = 9089/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.034 | DEBUG    | __main__:trials:29 - Trial = 9089/30000 | Total reward = 30.27
2022-01-26 14:17:09.037 | DEBUG    | __main__:trials:24 - Trial = 9090/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.039 | DEBUG    | __main__:trials:29 - Trial = 9090/30000 | Total reward = 38.33
2022-01-26 14:17:09.042 | DEBUG    | __main__:trials:24 - Trial = 9091/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.043 | DEBUG    | __main__:trials:29 - Trial = 9091/30000 | Total reward = 26.67
2022-01-26 14:17:09.047 | DEBUG    | __main__:trials:24 - Trial = 9092/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.049 | DEBUG    | __main__:trials:29 - Trial = 9092/30000 | Total reward = 33.20
2022-01-26 14:17:09.052 | DEBUG    | __main__:trials:24 - Trial = 9093/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.054 | DEBUG    | __main__:trials:29 - Trial = 9093/30000 | Total reward = 41.78
2022-01-26 14:17:09.057 | DEBUG    | __main__:trials:24 - Trial = 9094/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.058 | DEBUG    | __main__:trials:29 - Trial = 9094/30000 | Total reward = 43.26
2022-01-26 14:17:09.062 | DEBUG    | __main__:trials:24 - Trial = 9095/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.063 | DEBUG    | __main__:trials:29 - Trial = 9095/30000 | Total reward = 37.08
2022-01-26 14:17:09.067 | DEBUG    | __main__:trials:24 - Trial = 9096/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.069 | DEBUG    | __main__:trials:29 - Trial = 9096/30000 | Total reward = 37.51
2022-01-26 14:17:09.072 | DEBUG    | __main__:trials:24 - Trial = 9097/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.074 | DEBUG    | __main__:trials:29 - Trial = 9097/30000 | Total reward = 39.52
2022-01-26 14:17:09.077 | DEBUG    | __main__:trials:24 - Trial = 9098/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.078 | DEBUG    | __main__:trials:29 - Trial = 9098/30000 | Total reward = 46.95
2022-01-26 14:17:09.082 | DEBUG    | __main__:trials:24 - Trial = 9099/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.084 | DEBUG    | __main__:trials:29 - Trial = 9099/30000 | Total reward = 47.29
2022-01-26 14:17:09.088 | DEBUG    | __main__:trials:24 - Trial = 9100/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.089 | DEBUG    | __main__:trials:29 - Trial = 9100/30000 | Total reward = 42.89
2022-01-26 14:17:09.093 | DEBUG    | __main__:trials:24 - Trial = 9101/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.093 | DEBUG    | __main__:trials:29 - Trial = 9101/30000 | Total reward = 52.29
2022-01-26 14:17:09.097 | DEBUG    | __main__:trials:24 - Trial = 9102/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.098 | DEBUG    | __main__:trials:29 - Trial = 9102/30000 | Total reward = 41.74
2022-01-26 14:17:09.102 | DEBUG    | __main__:trials:24 - Trial = 9103/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.102 | DEBUG    | __main__:trials:29 - Trial = 9103/30000 | Total reward = 38.09
2022-01-26 14:17:09.107 | DEBUG    | __main__:trials:24 - Trial = 9104/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.107 | DEBUG    | __main__:trials:29 - Trial = 9104/30000 | Total reward = 45.82
2022-01-26 14:17:09.112 | DEBUG    | __main__:trials:24 - Trial = 9105/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.114 | DEBUG    | __main__:trials:29 - Trial = 9105/30000 | Total reward = 50.59
2022-01-26 14:17:09.117 | DEBUG    | __main__:trials:24 - Trial = 9106/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.119 | DEBUG    | __main__:trials:29 - Trial = 9106/30000 | Total reward = 51.38
2022-01-26 14:17:09.122 | DEBUG    | __main__:trials:24 - Trial = 9107/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.124 | DEBUG    | __main__:trials:29 - Trial = 9107/30000 | Total reward = 54.11
2022-01-26 14:17:09.127 | DEBUG    | __main__:trials:24 - Trial = 9108/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.129 | DEBUG    | __main__:trials:29 - Trial = 9108/30000 | Total reward = 66.58
2022-01-26 14:17:09.132 | DEBUG    | __main__:trials:24 - Trial = 9109/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.133 | DEBUG    | __main__:trials:29 - Trial = 9109/30000 | Total reward = 31.24
2022-01-26 14:17:09.136 | DEBUG    | __main__:trials:24 - Trial = 9110/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.138 | DEBUG    | __main__:trials:29 - Trial = 9110/30000 | Total reward = 41.98
2022-01-26 14:17:09.142 | DEBUG    | __main__:trials:24 - Trial = 9111/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.143 | DEBUG    | __main__:trials:29 - Trial = 9111/30000 | Total reward = 40.46
2022-01-26 14:17:09.146 | DEBUG    | __main__:trials:24 - Trial = 9112/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.148 | DEBUG    | __main__:trials:29 - Trial = 9112/30000 | Total reward = 39.24
2022-01-26 14:17:09.151 | DEBUG    | __main__:trials:24 - Trial = 9113/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.152 | DEBUG    | __main__:trials:29 - Trial = 9113/30000 | Total reward = 43.23
2022-01-26 14:17:09.156 | DEBUG    | __main__:trials:24 - Trial = 9114/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.157 | DEBUG    | __main__:trials:29 - Trial = 9114/30000 | Total reward = 48.38
2022-01-26 14:17:09.161 | DEBUG    | __main__:trials:24 - Trial = 9115/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.162 | DEBUG    | __main__:trials:29 - Trial = 9115/30000 | Total reward = 42.32
2022-01-26 14:17:09.165 | DEBUG    | __main__:trials:24 - Trial = 9116/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.166 | DEBUG    | __main__:trials:29 - Trial = 9116/30000 | Total reward = 55.35
2022-01-26 14:17:09.169 | DEBUG    | __main__:trials:26 - Trial = 9117/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:09.170 | DEBUG    | __main__:trials:29 - Trial = 9117/30000 | Total reward = 36.58
2022-01-26 14:17:09.174 | DEBUG    | __main__:trials:24 - Trial = 9118/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.176 | DEBUG    | __main__:trials:29 - Trial = 9118/30000 | Total reward = 41.45
2022-01-26 14:17:09.179 | DEBUG    | __main__:trials:24 - Trial = 9119/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.181 | DEBUG    | __main__:trials:29 - Trial = 9119/30000 | Total reward = 51.65
2022-01-26 14:17:09.184 | DEBUG    | __main__:trials:24 - Trial = 9120/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.185 | DEBUG    | __main__:trials:29 - Trial = 9120/30000 | Total reward = 44.79
2022-01-26 14:17:09.188 | DEBUG    | __main__:trials:24 - Trial = 9121/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.190 | DEBUG    | __main__:trials:29 - Trial = 9121/30000 | Total reward = 51.55
2022-01-26 14:17:09.193 | DEBUG    | __main__:trials:24 - Trial = 9122/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.193 | DEBUG    | __main__:trials:29 - Trial = 9122/30000 | Total reward = 51.97
2022-01-26 14:17:09.197 | DEBUG    | __main__:trials:24 - Trial = 9123/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.198 | DEBUG    | __main__:trials:29 - Trial = 9123/30000 | Total reward = 51.11
2022-01-26 14:17:09.201 | DEBUG    | __main__:trials:24 - Trial = 9124/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.202 | DEBUG    | __main__:trials:29 - Trial = 9124/30000 | Total reward = 41.85
2022-01-26 14:17:09.205 | DEBUG    | __main__:trials:24 - Trial = 9125/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.207 | DEBUG    | __main__:trials:29 - Trial = 9125/30000 | Total reward = 57.98
2022-01-26 14:17:09.210 | DEBUG    | __main__:trials:24 - Trial = 9126/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.211 | DEBUG    | __main__:trials:29 - Trial = 9126/30000 | Total reward = 49.81
2022-01-26 14:17:09.214 | DEBUG    | __main__:trials:24 - Trial = 9127/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.216 | DEBUG    | __main__:trials:29 - Trial = 9127/30000 | Total reward = 41.55
2022-01-26 14:17:09.219 | DEBUG    | __main__:trials:24 - Trial = 9128/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.221 | DEBUG    | __main__:trials:29 - Trial = 9128/30000 | Total reward = 42.19
2022-01-26 14:17:09.225 | DEBUG    | __main__:trials:24 - Trial = 9129/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.226 | DEBUG    | __main__:trials:29 - Trial = 9129/30000 | Total reward = 38.57
2022-01-26 14:17:09.230 | DEBUG    | __main__:trials:26 - Trial = 9130/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:09.231 | DEBUG    | __main__:trials:29 - Trial = 9130/30000 | Total reward = 41.09
2022-01-26 14:17:09.235 | DEBUG    | __main__:trials:24 - Trial = 9131/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.236 | DEBUG    | __main__:trials:29 - Trial = 9131/30000 | Total reward = 54.45
2022-01-26 14:17:09.239 | DEBUG    | __main__:trials:24 - Trial = 9132/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.241 | DEBUG    | __main__:trials:29 - Trial = 9132/30000 | Total reward = 67.41
2022-01-26 14:17:09.245 | DEBUG    | __main__:trials:24 - Trial = 9133/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.246 | DEBUG    | __main__:trials:29 - Trial = 9133/30000 | Total reward = 47.21
2022-01-26 14:17:09.250 | DEBUG    | __main__:trials:24 - Trial = 9134/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.251 | DEBUG    | __main__:trials:29 - Trial = 9134/30000 | Total reward = 51.15
2022-01-26 14:17:09.255 | DEBUG    | __main__:trials:24 - Trial = 9135/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.256 | DEBUG    | __main__:trials:29 - Trial = 9135/30000 | Total reward = 47.21
2022-01-26 14:17:09.260 | DEBUG    | __main__:trials:24 - Trial = 9136/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.261 | DEBUG    | __main__:trials:29 - Trial = 9136/30000 | Total reward = 56.44
2022-01-26 14:17:09.265 | DEBUG    | __main__:trials:24 - Trial = 9137/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.266 | DEBUG    | __main__:trials:29 - Trial = 9137/30000 | Total reward = 34.16
2022-01-26 14:17:09.270 | DEBUG    | __main__:trials:24 - Trial = 9138/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.271 | DEBUG    | __main__:trials:29 - Trial = 9138/30000 | Total reward = 37.57
2022-01-26 14:17:09.274 | DEBUG    | __main__:trials:24 - Trial = 9139/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.276 | DEBUG    | __main__:trials:29 - Trial = 9139/30000 | Total reward = 48.62
2022-01-26 14:17:09.279 | DEBUG    | __main__:trials:24 - Trial = 9140/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.280 | DEBUG    | __main__:trials:29 - Trial = 9140/30000 | Total reward = 47.54
2022-01-26 14:17:09.284 | DEBUG    | __main__:trials:24 - Trial = 9141/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.286 | DEBUG    | __main__:trials:29 - Trial = 9141/30000 | Total reward = 45.68
2022-01-26 14:17:09.289 | DEBUG    | __main__:trials:24 - Trial = 9142/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.291 | DEBUG    | __main__:trials:29 - Trial = 9142/30000 | Total reward = 60.69
2022-01-26 14:17:09.295 | DEBUG    | __main__:trials:24 - Trial = 9143/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.295 | DEBUG    | __main__:trials:29 - Trial = 9143/30000 | Total reward = 50.93
2022-01-26 14:17:09.300 | DEBUG    | __main__:trials:24 - Trial = 9144/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.300 | DEBUG    | __main__:trials:29 - Trial = 9144/30000 | Total reward = 49.55
2022-01-26 14:17:09.304 | DEBUG    | __main__:trials:24 - Trial = 9145/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.305 | DEBUG    | __main__:trials:29 - Trial = 9145/30000 | Total reward = 53.41
2022-01-26 14:17:09.308 | DEBUG    | __main__:trials:24 - Trial = 9146/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.309 | DEBUG    | __main__:trials:29 - Trial = 9146/30000 | Total reward = 40.55
2022-01-26 14:17:09.313 | DEBUG    | __main__:trials:24 - Trial = 9147/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.313 | DEBUG    | __main__:trials:29 - Trial = 9147/30000 | Total reward = 61.35
2022-01-26 14:17:09.317 | DEBUG    | __main__:trials:24 - Trial = 9148/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.318 | DEBUG    | __main__:trials:29 - Trial = 9148/30000 | Total reward = 41.48
2022-01-26 14:17:09.321 | DEBUG    | __main__:trials:24 - Trial = 9149/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.323 | DEBUG    | __main__:trials:29 - Trial = 9149/30000 | Total reward = 63.93
2022-01-26 14:17:09.327 | DEBUG    | __main__:trials:24 - Trial = 9150/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.328 | DEBUG    | __main__:trials:29 - Trial = 9150/30000 | Total reward = 57.34
2022-01-26 14:17:09.332 | DEBUG    | __main__:trials:24 - Trial = 9151/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.333 | DEBUG    | __main__:trials:29 - Trial = 9151/30000 | Total reward = 56.86
2022-01-26 14:17:09.337 | DEBUG    | __main__:trials:24 - Trial = 9152/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.338 | DEBUG    | __main__:trials:29 - Trial = 9152/30000 | Total reward = 37.14
2022-01-26 14:17:09.342 | DEBUG    | __main__:trials:24 - Trial = 9153/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.343 | DEBUG    | __main__:trials:29 - Trial = 9153/30000 | Total reward = 46.24
2022-01-26 14:17:09.347 | DEBUG    | __main__:trials:24 - Trial = 9154/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.349 | DEBUG    | __main__:trials:29 - Trial = 9154/30000 | Total reward = 46.18
2022-01-26 14:17:09.352 | DEBUG    | __main__:trials:24 - Trial = 9155/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.353 | DEBUG    | __main__:trials:29 - Trial = 9155/30000 | Total reward = 44.82
2022-01-26 14:17:09.357 | DEBUG    | __main__:trials:24 - Trial = 9156/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.359 | DEBUG    | __main__:trials:29 - Trial = 9156/30000 | Total reward = 39.12
2022-01-26 14:17:09.362 | DEBUG    | __main__:trials:24 - Trial = 9157/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.364 | DEBUG    | __main__:trials:29 - Trial = 9157/30000 | Total reward = 44.83
2022-01-26 14:17:09.367 | DEBUG    | __main__:trials:24 - Trial = 9158/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.368 | DEBUG    | __main__:trials:29 - Trial = 9158/30000 | Total reward = 45.36
2022-01-26 14:17:09.372 | DEBUG    | __main__:trials:24 - Trial = 9159/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.373 | DEBUG    | __main__:trials:29 - Trial = 9159/30000 | Total reward = 48.23
2022-01-26 14:17:09.376 | DEBUG    | __main__:trials:24 - Trial = 9160/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.378 | DEBUG    | __main__:trials:29 - Trial = 9160/30000 | Total reward = 40.19
2022-01-26 14:17:09.382 | DEBUG    | __main__:trials:24 - Trial = 9161/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.383 | DEBUG    | __main__:trials:29 - Trial = 9161/30000 | Total reward = 46.37
2022-01-26 14:17:09.387 | DEBUG    | __main__:trials:24 - Trial = 9162/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.387 | DEBUG    | __main__:trials:29 - Trial = 9162/30000 | Total reward = 47.66
2022-01-26 14:17:09.392 | DEBUG    | __main__:trials:24 - Trial = 9163/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.393 | DEBUG    | __main__:trials:29 - Trial = 9163/30000 | Total reward = 44.80
2022-01-26 14:17:09.397 | DEBUG    | __main__:trials:24 - Trial = 9164/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.399 | DEBUG    | __main__:trials:29 - Trial = 9164/30000 | Total reward = 58.64
2022-01-26 14:17:09.401 | DEBUG    | __main__:trials:24 - Trial = 9165/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.403 | DEBUG    | __main__:trials:29 - Trial = 9165/30000 | Total reward = 37.93
2022-01-26 14:17:09.407 | DEBUG    | __main__:trials:24 - Trial = 9166/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.408 | DEBUG    | __main__:trials:29 - Trial = 9166/30000 | Total reward = 44.29
2022-01-26 14:17:09.412 | DEBUG    | __main__:trials:24 - Trial = 9167/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.414 | DEBUG    | __main__:trials:29 - Trial = 9167/30000 | Total reward = 53.08
2022-01-26 14:17:09.418 | DEBUG    | __main__:trials:24 - Trial = 9168/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.418 | DEBUG    | __main__:trials:29 - Trial = 9168/30000 | Total reward = 39.25
2022-01-26 14:17:09.422 | DEBUG    | __main__:trials:24 - Trial = 9169/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.423 | DEBUG    | __main__:trials:29 - Trial = 9169/30000 | Total reward = 51.63
2022-01-26 14:17:09.427 | DEBUG    | __main__:trials:24 - Trial = 9170/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.429 | DEBUG    | __main__:trials:29 - Trial = 9170/30000 | Total reward = 39.62
2022-01-26 14:17:09.432 | DEBUG    | __main__:trials:24 - Trial = 9171/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.433 | DEBUG    | __main__:trials:29 - Trial = 9171/30000 | Total reward = 47.99
2022-01-26 14:17:09.437 | DEBUG    | __main__:trials:24 - Trial = 9172/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.439 | DEBUG    | __main__:trials:29 - Trial = 9172/30000 | Total reward = 55.20
2022-01-26 14:17:09.442 | DEBUG    | __main__:trials:24 - Trial = 9173/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.444 | DEBUG    | __main__:trials:29 - Trial = 9173/30000 | Total reward = 52.37
2022-01-26 14:17:09.447 | DEBUG    | __main__:trials:24 - Trial = 9174/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.448 | DEBUG    | __main__:trials:29 - Trial = 9174/30000 | Total reward = 43.91
2022-01-26 14:17:09.452 | DEBUG    | __main__:trials:24 - Trial = 9175/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.453 | DEBUG    | __main__:trials:29 - Trial = 9175/30000 | Total reward = 44.06
2022-01-26 14:17:09.457 | DEBUG    | __main__:trials:24 - Trial = 9176/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.459 | DEBUG    | __main__:trials:29 - Trial = 9176/30000 | Total reward = 44.88
2022-01-26 14:17:09.462 | DEBUG    | __main__:trials:24 - Trial = 9177/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.464 | DEBUG    | __main__:trials:29 - Trial = 9177/30000 | Total reward = 45.60
2022-01-26 14:17:09.468 | DEBUG    | __main__:trials:24 - Trial = 9178/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.469 | DEBUG    | __main__:trials:29 - Trial = 9178/30000 | Total reward = 46.11
2022-01-26 14:17:09.472 | DEBUG    | __main__:trials:24 - Trial = 9179/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.474 | DEBUG    | __main__:trials:29 - Trial = 9179/30000 | Total reward = 46.19
2022-01-26 14:17:09.478 | DEBUG    | __main__:trials:24 - Trial = 9180/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.479 | DEBUG    | __main__:trials:29 - Trial = 9180/30000 | Total reward = 46.86
2022-01-26 14:17:09.483 | DEBUG    | __main__:trials:24 - Trial = 9181/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.484 | DEBUG    | __main__:trials:29 - Trial = 9181/30000 | Total reward = 46.64
2022-01-26 14:17:09.488 | DEBUG    | __main__:trials:24 - Trial = 9182/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.488 | DEBUG    | __main__:trials:29 - Trial = 9182/30000 | Total reward = 47.97
2022-01-26 14:17:09.493 | DEBUG    | __main__:trials:24 - Trial = 9183/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.494 | DEBUG    | __main__:trials:29 - Trial = 9183/30000 | Total reward = 37.54
2022-01-26 14:17:09.498 | DEBUG    | __main__:trials:24 - Trial = 9184/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.498 | DEBUG    | __main__:trials:29 - Trial = 9184/30000 | Total reward = 46.52
2022-01-26 14:17:09.502 | DEBUG    | __main__:trials:24 - Trial = 9185/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.504 | DEBUG    | __main__:trials:29 - Trial = 9185/30000 | Total reward = 39.28
2022-01-26 14:17:09.507 | DEBUG    | __main__:trials:24 - Trial = 9186/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.509 | DEBUG    | __main__:trials:29 - Trial = 9186/30000 | Total reward = 47.86
2022-01-26 14:17:09.512 | DEBUG    | __main__:trials:24 - Trial = 9187/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.514 | DEBUG    | __main__:trials:29 - Trial = 9187/30000 | Total reward = 43.47
2022-01-26 14:17:09.518 | DEBUG    | __main__:trials:24 - Trial = 9188/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.519 | DEBUG    | __main__:trials:29 - Trial = 9188/30000 | Total reward = 52.50
2022-01-26 14:17:09.523 | DEBUG    | __main__:trials:24 - Trial = 9189/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.523 | DEBUG    | __main__:trials:29 - Trial = 9189/30000 | Total reward = 43.50
2022-01-26 14:17:09.528 | DEBUG    | __main__:trials:24 - Trial = 9190/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.529 | DEBUG    | __main__:trials:29 - Trial = 9190/30000 | Total reward = 39.89
2022-01-26 14:17:09.532 | DEBUG    | __main__:trials:24 - Trial = 9191/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.534 | DEBUG    | __main__:trials:29 - Trial = 9191/30000 | Total reward = 56.39
2022-01-26 14:17:09.537 | DEBUG    | __main__:trials:24 - Trial = 9192/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.539 | DEBUG    | __main__:trials:29 - Trial = 9192/30000 | Total reward = 46.32
2022-01-26 14:17:09.542 | DEBUG    | __main__:trials:24 - Trial = 9193/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.544 | DEBUG    | __main__:trials:29 - Trial = 9193/30000 | Total reward = 46.96
2022-01-26 14:17:09.547 | DEBUG    | __main__:trials:24 - Trial = 9194/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.548 | DEBUG    | __main__:trials:29 - Trial = 9194/30000 | Total reward = 57.72
2022-01-26 14:17:09.552 | DEBUG    | __main__:trials:24 - Trial = 9195/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.553 | DEBUG    | __main__:trials:29 - Trial = 9195/30000 | Total reward = 45.01
2022-01-26 14:17:09.557 | DEBUG    | __main__:trials:24 - Trial = 9196/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.558 | DEBUG    | __main__:trials:29 - Trial = 9196/30000 | Total reward = 54.58
2022-01-26 14:17:09.561 | DEBUG    | __main__:trials:24 - Trial = 9197/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.562 | DEBUG    | __main__:trials:29 - Trial = 9197/30000 | Total reward = 46.84
2022-01-26 14:17:09.565 | DEBUG    | __main__:trials:24 - Trial = 9198/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.567 | DEBUG    | __main__:trials:29 - Trial = 9198/30000 | Total reward = 65.92
2022-01-26 14:17:09.570 | DEBUG    | __main__:trials:26 - Trial = 9199/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:09.571 | DEBUG    | __main__:trials:29 - Trial = 9199/30000 | Total reward = 25.04
2022-01-26 14:17:09.575 | DEBUG    | __main__:trials:24 - Trial = 9200/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.577 | DEBUG    | __main__:trials:29 - Trial = 9200/30000 | Total reward = 40.02
2022-01-26 14:17:09.580 | DEBUG    | __main__:trials:24 - Trial = 9201/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.582 | DEBUG    | __main__:trials:29 - Trial = 9201/30000 | Total reward = 59.83
2022-01-26 14:17:09.585 | DEBUG    | __main__:trials:24 - Trial = 9202/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.586 | DEBUG    | __main__:trials:29 - Trial = 9202/30000 | Total reward = 44.36
2022-01-26 14:17:09.591 | DEBUG    | __main__:trials:24 - Trial = 9203/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.591 | DEBUG    | __main__:trials:29 - Trial = 9203/30000 | Total reward = 44.40
2022-01-26 14:17:09.596 | DEBUG    | __main__:trials:24 - Trial = 9204/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.597 | DEBUG    | __main__:trials:29 - Trial = 9204/30000 | Total reward = 46.98
2022-01-26 14:17:09.601 | DEBUG    | __main__:trials:24 - Trial = 9205/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.602 | DEBUG    | __main__:trials:29 - Trial = 9205/30000 | Total reward = 50.80
2022-01-26 14:17:09.606 | DEBUG    | __main__:trials:24 - Trial = 9206/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.607 | DEBUG    | __main__:trials:29 - Trial = 9206/30000 | Total reward = 47.24
2022-01-26 14:17:09.611 | DEBUG    | __main__:trials:24 - Trial = 9207/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.612 | DEBUG    | __main__:trials:29 - Trial = 9207/30000 | Total reward = 47.69
2022-01-26 14:17:09.616 | DEBUG    | __main__:trials:24 - Trial = 9208/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.617 | DEBUG    | __main__:trials:29 - Trial = 9208/30000 | Total reward = 38.67
2022-01-26 14:17:09.620 | DEBUG    | __main__:trials:24 - Trial = 9209/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.622 | DEBUG    | __main__:trials:29 - Trial = 9209/30000 | Total reward = 41.76
2022-01-26 14:17:09.625 | DEBUG    | __main__:trials:24 - Trial = 9210/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.626 | DEBUG    | __main__:trials:29 - Trial = 9210/30000 | Total reward = 61.82
2022-01-26 14:17:09.630 | DEBUG    | __main__:trials:24 - Trial = 9211/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.631 | DEBUG    | __main__:trials:29 - Trial = 9211/30000 | Total reward = 45.85
2022-01-26 14:17:09.635 | DEBUG    | __main__:trials:24 - Trial = 9212/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.637 | DEBUG    | __main__:trials:29 - Trial = 9212/30000 | Total reward = 54.74
2022-01-26 14:17:09.640 | DEBUG    | __main__:trials:24 - Trial = 9213/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.641 | DEBUG    | __main__:trials:29 - Trial = 9213/30000 | Total reward = 57.45
2022-01-26 14:17:09.646 | DEBUG    | __main__:trials:24 - Trial = 9214/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.646 | DEBUG    | __main__:trials:29 - Trial = 9214/30000 | Total reward = 49.28
2022-01-26 14:17:09.651 | DEBUG    | __main__:trials:24 - Trial = 9215/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.651 | DEBUG    | __main__:trials:29 - Trial = 9215/30000 | Total reward = 50.93
2022-01-26 14:17:09.656 | DEBUG    | __main__:trials:24 - Trial = 9216/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.658 | DEBUG    | __main__:trials:29 - Trial = 9216/30000 | Total reward = 39.49
2022-01-26 14:17:09.661 | DEBUG    | __main__:trials:24 - Trial = 9217/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.663 | DEBUG    | __main__:trials:29 - Trial = 9217/30000 | Total reward = 38.82
2022-01-26 14:17:09.666 | DEBUG    | __main__:trials:24 - Trial = 9218/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.667 | DEBUG    | __main__:trials:29 - Trial = 9218/30000 | Total reward = 52.83
2022-01-26 14:17:09.671 | DEBUG    | __main__:trials:24 - Trial = 9219/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.672 | DEBUG    | __main__:trials:29 - Trial = 9219/30000 | Total reward = 48.03
2022-01-26 14:17:09.676 | DEBUG    | __main__:trials:24 - Trial = 9220/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.677 | DEBUG    | __main__:trials:29 - Trial = 9220/30000 | Total reward = 45.44
2022-01-26 14:17:09.681 | DEBUG    | __main__:trials:24 - Trial = 9221/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.683 | DEBUG    | __main__:trials:29 - Trial = 9221/30000 | Total reward = 47.38
2022-01-26 14:17:09.687 | DEBUG    | __main__:trials:24 - Trial = 9222/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.688 | DEBUG    | __main__:trials:29 - Trial = 9222/30000 | Total reward = 36.62
2022-01-26 14:17:09.692 | DEBUG    | __main__:trials:24 - Trial = 9223/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.692 | DEBUG    | __main__:trials:29 - Trial = 9223/30000 | Total reward = 52.02
2022-01-26 14:17:09.696 | DEBUG    | __main__:trials:24 - Trial = 9224/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.697 | DEBUG    | __main__:trials:29 - Trial = 9224/30000 | Total reward = 38.21
2022-01-26 14:17:09.700 | DEBUG    | __main__:trials:24 - Trial = 9225/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.702 | DEBUG    | __main__:trials:29 - Trial = 9225/30000 | Total reward = 45.04
2022-01-26 14:17:09.705 | DEBUG    | __main__:trials:24 - Trial = 9226/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.706 | DEBUG    | __main__:trials:29 - Trial = 9226/30000 | Total reward = 45.54
2022-01-26 14:17:09.710 | DEBUG    | __main__:trials:24 - Trial = 9227/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.711 | DEBUG    | __main__:trials:29 - Trial = 9227/30000 | Total reward = 42.71
2022-01-26 14:17:09.714 | DEBUG    | __main__:trials:24 - Trial = 9228/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.716 | DEBUG    | __main__:trials:29 - Trial = 9228/30000 | Total reward = 47.03
2022-01-26 14:17:09.720 | DEBUG    | __main__:trials:24 - Trial = 9229/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.720 | DEBUG    | __main__:trials:29 - Trial = 9229/30000 | Total reward = 43.23
2022-01-26 14:17:09.724 | DEBUG    | __main__:trials:24 - Trial = 9230/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.725 | DEBUG    | __main__:trials:29 - Trial = 9230/30000 | Total reward = 41.71
2022-01-26 14:17:09.729 | DEBUG    | __main__:trials:24 - Trial = 9231/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.731 | DEBUG    | __main__:trials:29 - Trial = 9231/30000 | Total reward = 52.59
2022-01-26 14:17:09.735 | DEBUG    | __main__:trials:24 - Trial = 9232/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.736 | DEBUG    | __main__:trials:29 - Trial = 9232/30000 | Total reward = 46.60
2022-01-26 14:17:09.739 | DEBUG    | __main__:trials:24 - Trial = 9233/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.741 | DEBUG    | __main__:trials:29 - Trial = 9233/30000 | Total reward = 33.11
2022-01-26 14:17:09.745 | DEBUG    | __main__:trials:24 - Trial = 9234/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.746 | DEBUG    | __main__:trials:29 - Trial = 9234/30000 | Total reward = 43.95
2022-01-26 14:17:09.749 | DEBUG    | __main__:trials:24 - Trial = 9235/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.750 | DEBUG    | __main__:trials:29 - Trial = 9235/30000 | Total reward = 47.24
2022-01-26 14:17:09.753 | DEBUG    | __main__:trials:24 - Trial = 9236/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.754 | DEBUG    | __main__:trials:29 - Trial = 9236/30000 | Total reward = 50.15
2022-01-26 14:17:09.757 | DEBUG    | __main__:trials:24 - Trial = 9237/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.759 | DEBUG    | __main__:trials:29 - Trial = 9237/30000 | Total reward = 66.29
2022-01-26 14:17:09.764 | DEBUG    | __main__:trials:24 - Trial = 9238/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.765 | DEBUG    | __main__:trials:29 - Trial = 9238/30000 | Total reward = 63.33
2022-01-26 14:17:09.769 | DEBUG    | __main__:trials:24 - Trial = 9239/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.770 | DEBUG    | __main__:trials:29 - Trial = 9239/30000 | Total reward = 48.94
2022-01-26 14:17:09.773 | DEBUG    | __main__:trials:24 - Trial = 9240/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.774 | DEBUG    | __main__:trials:29 - Trial = 9240/30000 | Total reward = 50.04
2022-01-26 14:17:09.778 | DEBUG    | __main__:trials:24 - Trial = 9241/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.779 | DEBUG    | __main__:trials:29 - Trial = 9241/30000 | Total reward = 48.84
2022-01-26 14:17:09.783 | DEBUG    | __main__:trials:24 - Trial = 9242/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.784 | DEBUG    | __main__:trials:29 - Trial = 9242/30000 | Total reward = 43.68
2022-01-26 14:17:09.788 | DEBUG    | __main__:trials:24 - Trial = 9243/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.790 | DEBUG    | __main__:trials:29 - Trial = 9243/30000 | Total reward = 46.51
2022-01-26 14:17:09.793 | DEBUG    | __main__:trials:24 - Trial = 9244/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.794 | DEBUG    | __main__:trials:29 - Trial = 9244/30000 | Total reward = 47.50
2022-01-26 14:17:09.798 | DEBUG    | __main__:trials:24 - Trial = 9245/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.800 | DEBUG    | __main__:trials:29 - Trial = 9245/30000 | Total reward = 51.77
2022-01-26 14:17:09.803 | DEBUG    | __main__:trials:24 - Trial = 9246/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.805 | DEBUG    | __main__:trials:29 - Trial = 9246/30000 | Total reward = 48.64
2022-01-26 14:17:09.808 | DEBUG    | __main__:trials:24 - Trial = 9247/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.809 | DEBUG    | __main__:trials:29 - Trial = 9247/30000 | Total reward = 44.68
2022-01-26 14:17:09.812 | DEBUG    | __main__:trials:24 - Trial = 9248/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.814 | DEBUG    | __main__:trials:29 - Trial = 9248/30000 | Total reward = 47.24
2022-01-26 14:17:09.817 | DEBUG    | __main__:trials:24 - Trial = 9249/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.819 | DEBUG    | __main__:trials:29 - Trial = 9249/30000 | Total reward = 44.32
2022-01-26 14:17:09.822 | DEBUG    | __main__:trials:24 - Trial = 9250/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.824 | DEBUG    | __main__:trials:29 - Trial = 9250/30000 | Total reward = 48.43
2022-01-26 14:17:09.827 | DEBUG    | __main__:trials:24 - Trial = 9251/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.829 | DEBUG    | __main__:trials:29 - Trial = 9251/30000 | Total reward = 46.09
2022-01-26 14:17:09.832 | DEBUG    | __main__:trials:24 - Trial = 9252/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.833 | DEBUG    | __main__:trials:29 - Trial = 9252/30000 | Total reward = 47.96
2022-01-26 14:17:09.838 | DEBUG    | __main__:trials:24 - Trial = 9253/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.839 | DEBUG    | __main__:trials:29 - Trial = 9253/30000 | Total reward = 55.47
2022-01-26 14:17:09.843 | DEBUG    | __main__:trials:24 - Trial = 9254/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.845 | DEBUG    | __main__:trials:29 - Trial = 9254/30000 | Total reward = 34.57
2022-01-26 14:17:09.849 | DEBUG    | __main__:trials:24 - Trial = 9255/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.850 | DEBUG    | __main__:trials:29 - Trial = 9255/30000 | Total reward = 49.25
2022-01-26 14:17:09.853 | DEBUG    | __main__:trials:26 - Trial = 9256/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:09.854 | DEBUG    | __main__:trials:29 - Trial = 9256/30000 | Total reward = 33.54
2022-01-26 14:17:09.857 | DEBUG    | __main__:trials:24 - Trial = 9257/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.859 | DEBUG    | __main__:trials:29 - Trial = 9257/30000 | Total reward = 46.02
2022-01-26 14:17:09.862 | DEBUG    | __main__:trials:24 - Trial = 9258/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.864 | DEBUG    | __main__:trials:29 - Trial = 9258/30000 | Total reward = 14.66
2022-01-26 14:17:09.867 | DEBUG    | __main__:trials:24 - Trial = 9259/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.868 | DEBUG    | __main__:trials:29 - Trial = 9259/30000 | Total reward = 45.32
2022-01-26 14:17:09.871 | DEBUG    | __main__:trials:24 - Trial = 9260/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.873 | DEBUG    | __main__:trials:29 - Trial = 9260/30000 | Total reward = 36.12
2022-01-26 14:17:09.876 | DEBUG    | __main__:trials:24 - Trial = 9261/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.877 | DEBUG    | __main__:trials:29 - Trial = 9261/30000 | Total reward = 57.90
2022-01-26 14:17:09.880 | DEBUG    | __main__:trials:24 - Trial = 9262/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.881 | DEBUG    | __main__:trials:29 - Trial = 9262/30000 | Total reward = 37.13
2022-01-26 14:17:09.884 | DEBUG    | __main__:trials:24 - Trial = 9263/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.885 | DEBUG    | __main__:trials:29 - Trial = 9263/30000 | Total reward = 55.41
2022-01-26 14:17:09.889 | DEBUG    | __main__:trials:24 - Trial = 9264/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.890 | DEBUG    | __main__:trials:29 - Trial = 9264/30000 | Total reward = 39.80
2022-01-26 14:17:09.893 | DEBUG    | __main__:trials:24 - Trial = 9265/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.894 | DEBUG    | __main__:trials:29 - Trial = 9265/30000 | Total reward = 47.24
2022-01-26 14:17:09.898 | DEBUG    | __main__:trials:24 - Trial = 9266/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.899 | DEBUG    | __main__:trials:29 - Trial = 9266/30000 | Total reward = 40.14
2022-01-26 14:17:09.903 | DEBUG    | __main__:trials:24 - Trial = 9267/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.903 | DEBUG    | __main__:trials:29 - Trial = 9267/30000 | Total reward = 46.91
2022-01-26 14:17:09.906 | DEBUG    | __main__:trials:24 - Trial = 9268/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.907 | DEBUG    | __main__:trials:29 - Trial = 9268/30000 | Total reward = 38.97
2022-01-26 14:17:09.910 | DEBUG    | __main__:trials:24 - Trial = 9269/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.912 | DEBUG    | __main__:trials:29 - Trial = 9269/30000 | Total reward = 46.60
2022-01-26 14:17:09.915 | DEBUG    | __main__:trials:24 - Trial = 9270/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.916 | DEBUG    | __main__:trials:29 - Trial = 9270/30000 | Total reward = 47.24
2022-01-26 14:17:09.919 | DEBUG    | __main__:trials:24 - Trial = 9271/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.920 | DEBUG    | __main__:trials:29 - Trial = 9271/30000 | Total reward = 31.03
2022-01-26 14:17:09.923 | DEBUG    | __main__:trials:24 - Trial = 9272/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.924 | DEBUG    | __main__:trials:29 - Trial = 9272/30000 | Total reward = 48.50
2022-01-26 14:17:09.927 | DEBUG    | __main__:trials:24 - Trial = 9273/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.928 | DEBUG    | __main__:trials:29 - Trial = 9273/30000 | Total reward = 55.40
2022-01-26 14:17:09.931 | DEBUG    | __main__:trials:24 - Trial = 9274/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.932 | DEBUG    | __main__:trials:29 - Trial = 9274/30000 | Total reward = 43.64
2022-01-26 14:17:09.936 | DEBUG    | __main__:trials:24 - Trial = 9275/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.938 | DEBUG    | __main__:trials:29 - Trial = 9275/30000 | Total reward = 44.23
2022-01-26 14:17:09.941 | DEBUG    | __main__:trials:24 - Trial = 9276/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.943 | DEBUG    | __main__:trials:29 - Trial = 9276/30000 | Total reward = 45.10
2022-01-26 14:17:09.946 | DEBUG    | __main__:trials:24 - Trial = 9277/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.947 | DEBUG    | __main__:trials:29 - Trial = 9277/30000 | Total reward = 39.60
2022-01-26 14:17:09.951 | DEBUG    | __main__:trials:24 - Trial = 9278/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.951 | DEBUG    | __main__:trials:29 - Trial = 9278/30000 | Total reward = 47.30
2022-01-26 14:17:09.955 | DEBUG    | __main__:trials:24 - Trial = 9279/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.957 | DEBUG    | __main__:trials:29 - Trial = 9279/30000 | Total reward = 46.00
2022-01-26 14:17:09.960 | DEBUG    | __main__:trials:24 - Trial = 9280/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.962 | DEBUG    | __main__:trials:29 - Trial = 9280/30000 | Total reward = 48.74
2022-01-26 14:17:09.966 | DEBUG    | __main__:trials:24 - Trial = 9281/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.967 | DEBUG    | __main__:trials:29 - Trial = 9281/30000 | Total reward = 37.06
2022-01-26 14:17:09.971 | DEBUG    | __main__:trials:24 - Trial = 9282/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.972 | DEBUG    | __main__:trials:29 - Trial = 9282/30000 | Total reward = 47.27
2022-01-26 14:17:09.976 | DEBUG    | __main__:trials:24 - Trial = 9283/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.977 | DEBUG    | __main__:trials:29 - Trial = 9283/30000 | Total reward = 51.65
2022-01-26 14:17:09.981 | DEBUG    | __main__:trials:24 - Trial = 9284/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.982 | DEBUG    | __main__:trials:29 - Trial = 9284/30000 | Total reward = 55.41
2022-01-26 14:17:09.986 | DEBUG    | __main__:trials:24 - Trial = 9285/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.987 | DEBUG    | __main__:trials:29 - Trial = 9285/30000 | Total reward = 57.89
2022-01-26 14:17:09.992 | DEBUG    | __main__:trials:24 - Trial = 9286/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.993 | DEBUG    | __main__:trials:29 - Trial = 9286/30000 | Total reward = 63.27
2022-01-26 14:17:09.997 | DEBUG    | __main__:trials:24 - Trial = 9287/30000 | Max number of steps (20) reached
2022-01-26 14:17:09.998 | DEBUG    | __main__:trials:29 - Trial = 9287/30000 | Total reward = 34.37
2022-01-26 14:17:10.002 | DEBUG    | __main__:trials:24 - Trial = 9288/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.002 | DEBUG    | __main__:trials:29 - Trial = 9288/30000 | Total reward = 43.32
2022-01-26 14:17:10.007 | DEBUG    | __main__:trials:24 - Trial = 9289/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.007 | DEBUG    | __main__:trials:29 - Trial = 9289/30000 | Total reward = 44.85
2022-01-26 14:17:10.011 | DEBUG    | __main__:trials:24 - Trial = 9290/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.012 | DEBUG    | __main__:trials:29 - Trial = 9290/30000 | Total reward = 47.43
2022-01-26 14:17:10.016 | DEBUG    | __main__:trials:24 - Trial = 9291/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.017 | DEBUG    | __main__:trials:29 - Trial = 9291/30000 | Total reward = 48.95
2022-01-26 14:17:10.021 | DEBUG    | __main__:trials:24 - Trial = 9292/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.023 | DEBUG    | __main__:trials:29 - Trial = 9292/30000 | Total reward = 53.69
2022-01-26 14:17:10.026 | DEBUG    | __main__:trials:24 - Trial = 9293/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.028 | DEBUG    | __main__:trials:29 - Trial = 9293/30000 | Total reward = 67.49
2022-01-26 14:17:10.031 | DEBUG    | __main__:trials:24 - Trial = 9294/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.032 | DEBUG    | __main__:trials:29 - Trial = 9294/30000 | Total reward = 58.77
2022-01-26 14:17:10.035 | DEBUG    | __main__:trials:24 - Trial = 9295/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.037 | DEBUG    | __main__:trials:29 - Trial = 9295/30000 | Total reward = 44.53
2022-01-26 14:17:10.041 | DEBUG    | __main__:trials:24 - Trial = 9296/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.042 | DEBUG    | __main__:trials:29 - Trial = 9296/30000 | Total reward = 45.98
2022-01-26 14:17:10.046 | DEBUG    | __main__:trials:24 - Trial = 9297/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.047 | DEBUG    | __main__:trials:29 - Trial = 9297/30000 | Total reward = 62.49
2022-01-26 14:17:10.051 | DEBUG    | __main__:trials:24 - Trial = 9298/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.052 | DEBUG    | __main__:trials:29 - Trial = 9298/30000 | Total reward = 52.69
2022-01-26 14:17:10.055 | DEBUG    | __main__:trials:24 - Trial = 9299/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.057 | DEBUG    | __main__:trials:29 - Trial = 9299/30000 | Total reward = 46.52
2022-01-26 14:17:10.061 | DEBUG    | __main__:trials:24 - Trial = 9300/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.062 | DEBUG    | __main__:trials:29 - Trial = 9300/30000 | Total reward = 45.33
2022-01-26 14:17:10.066 | DEBUG    | __main__:trials:24 - Trial = 9301/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.067 | DEBUG    | __main__:trials:29 - Trial = 9301/30000 | Total reward = 58.89
2022-01-26 14:17:10.071 | DEBUG    | __main__:trials:24 - Trial = 9302/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.072 | DEBUG    | __main__:trials:29 - Trial = 9302/30000 | Total reward = 38.01
2022-01-26 14:17:10.077 | DEBUG    | __main__:trials:24 - Trial = 9303/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.078 | DEBUG    | __main__:trials:29 - Trial = 9303/30000 | Total reward = 43.33
2022-01-26 14:17:10.082 | DEBUG    | __main__:trials:24 - Trial = 9304/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.082 | DEBUG    | __main__:trials:29 - Trial = 9304/30000 | Total reward = 38.92
2022-01-26 14:17:10.086 | DEBUG    | __main__:trials:24 - Trial = 9305/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.088 | DEBUG    | __main__:trials:29 - Trial = 9305/30000 | Total reward = 48.20
2022-01-26 14:17:10.092 | DEBUG    | __main__:trials:24 - Trial = 9306/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.093 | DEBUG    | __main__:trials:29 - Trial = 9306/30000 | Total reward = 49.02
2022-01-26 14:17:10.097 | DEBUG    | __main__:trials:24 - Trial = 9307/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.098 | DEBUG    | __main__:trials:29 - Trial = 9307/30000 | Total reward = 42.76
2022-01-26 14:17:10.101 | DEBUG    | __main__:trials:24 - Trial = 9308/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.102 | DEBUG    | __main__:trials:29 - Trial = 9308/30000 | Total reward = 49.58
2022-01-26 14:17:10.105 | DEBUG    | __main__:trials:24 - Trial = 9309/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.107 | DEBUG    | __main__:trials:29 - Trial = 9309/30000 | Total reward = 43.62
2022-01-26 14:17:10.109 | DEBUG    | __main__:trials:24 - Trial = 9310/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.110 | DEBUG    | __main__:trials:29 - Trial = 9310/30000 | Total reward = 44.61
2022-01-26 14:17:10.114 | DEBUG    | __main__:trials:24 - Trial = 9311/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.114 | DEBUG    | __main__:trials:29 - Trial = 9311/30000 | Total reward = 45.16
2022-01-26 14:17:10.118 | DEBUG    | __main__:trials:24 - Trial = 9312/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.119 | DEBUG    | __main__:trials:29 - Trial = 9312/30000 | Total reward = 60.99
2022-01-26 14:17:10.123 | DEBUG    | __main__:trials:24 - Trial = 9313/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.124 | DEBUG    | __main__:trials:29 - Trial = 9313/30000 | Total reward = 58.39
2022-01-26 14:17:10.128 | DEBUG    | __main__:trials:24 - Trial = 9314/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.130 | DEBUG    | __main__:trials:29 - Trial = 9314/30000 | Total reward = 39.50
2022-01-26 14:17:10.133 | DEBUG    | __main__:trials:24 - Trial = 9315/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.135 | DEBUG    | __main__:trials:29 - Trial = 9315/30000 | Total reward = 43.94
2022-01-26 14:17:10.138 | DEBUG    | __main__:trials:24 - Trial = 9316/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.140 | DEBUG    | __main__:trials:29 - Trial = 9316/30000 | Total reward = 56.95
2022-01-26 14:17:10.144 | DEBUG    | __main__:trials:24 - Trial = 9317/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.144 | DEBUG    | __main__:trials:29 - Trial = 9317/30000 | Total reward = 47.18
2022-01-26 14:17:10.148 | DEBUG    | __main__:trials:24 - Trial = 9318/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.149 | DEBUG    | __main__:trials:29 - Trial = 9318/30000 | Total reward = 43.19
2022-01-26 14:17:10.153 | DEBUG    | __main__:trials:24 - Trial = 9319/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.155 | DEBUG    | __main__:trials:29 - Trial = 9319/30000 | Total reward = 43.35
2022-01-26 14:17:10.159 | DEBUG    | __main__:trials:24 - Trial = 9320/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.160 | DEBUG    | __main__:trials:29 - Trial = 9320/30000 | Total reward = 38.78
2022-01-26 14:17:10.163 | DEBUG    | __main__:trials:24 - Trial = 9321/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.165 | DEBUG    | __main__:trials:29 - Trial = 9321/30000 | Total reward = 41.55
2022-01-26 14:17:10.168 | DEBUG    | __main__:trials:24 - Trial = 9322/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.170 | DEBUG    | __main__:trials:29 - Trial = 9322/30000 | Total reward = 36.43
2022-01-26 14:17:10.172 | DEBUG    | __main__:trials:24 - Trial = 9323/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.173 | DEBUG    | __main__:trials:29 - Trial = 9323/30000 | Total reward = 43.99
2022-01-26 14:17:10.177 | DEBUG    | __main__:trials:24 - Trial = 9324/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.177 | DEBUG    | __main__:trials:29 - Trial = 9324/30000 | Total reward = 54.55
2022-01-26 14:17:10.181 | DEBUG    | __main__:trials:24 - Trial = 9325/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.181 | DEBUG    | __main__:trials:29 - Trial = 9325/30000 | Total reward = 43.48
2022-01-26 14:17:10.185 | DEBUG    | __main__:trials:24 - Trial = 9326/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.186 | DEBUG    | __main__:trials:29 - Trial = 9326/30000 | Total reward = 48.03
2022-01-26 14:17:10.189 | DEBUG    | __main__:trials:24 - Trial = 9327/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.190 | DEBUG    | __main__:trials:29 - Trial = 9327/30000 | Total reward = 42.38
2022-01-26 14:17:10.193 | DEBUG    | __main__:trials:24 - Trial = 9328/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.195 | DEBUG    | __main__:trials:29 - Trial = 9328/30000 | Total reward = 47.80
2022-01-26 14:17:10.198 | DEBUG    | __main__:trials:24 - Trial = 9329/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.199 | DEBUG    | __main__:trials:29 - Trial = 9329/30000 | Total reward = 40.18
2022-01-26 14:17:10.202 | DEBUG    | __main__:trials:24 - Trial = 9330/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.204 | DEBUG    | __main__:trials:29 - Trial = 9330/30000 | Total reward = 48.18
2022-01-26 14:17:10.208 | DEBUG    | __main__:trials:24 - Trial = 9331/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.209 | DEBUG    | __main__:trials:29 - Trial = 9331/30000 | Total reward = 45.90
2022-01-26 14:17:10.212 | DEBUG    | __main__:trials:24 - Trial = 9332/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.214 | DEBUG    | __main__:trials:29 - Trial = 9332/30000 | Total reward = 49.24
2022-01-26 14:17:10.216 | DEBUG    | __main__:trials:26 - Trial = 9333/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.216 | DEBUG    | __main__:trials:29 - Trial = 9333/30000 | Total reward = 14.47
2022-01-26 14:17:10.220 | DEBUG    | __main__:trials:24 - Trial = 9334/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.222 | DEBUG    | __main__:trials:29 - Trial = 9334/30000 | Total reward = 47.21
2022-01-26 14:17:10.225 | DEBUG    | __main__:trials:24 - Trial = 9335/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.226 | DEBUG    | __main__:trials:29 - Trial = 9335/30000 | Total reward = 37.81
2022-01-26 14:17:10.229 | DEBUG    | __main__:trials:24 - Trial = 9336/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.230 | DEBUG    | __main__:trials:29 - Trial = 9336/30000 | Total reward = 41.68
2022-01-26 14:17:10.233 | DEBUG    | __main__:trials:24 - Trial = 9337/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.235 | DEBUG    | __main__:trials:29 - Trial = 9337/30000 | Total reward = 48.03
2022-01-26 14:17:10.238 | DEBUG    | __main__:trials:24 - Trial = 9338/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.239 | DEBUG    | __main__:trials:29 - Trial = 9338/30000 | Total reward = 48.33
2022-01-26 14:17:10.242 | DEBUG    | __main__:trials:24 - Trial = 9339/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.244 | DEBUG    | __main__:trials:29 - Trial = 9339/30000 | Total reward = 40.64
2022-01-26 14:17:10.247 | DEBUG    | __main__:trials:24 - Trial = 9340/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.248 | DEBUG    | __main__:trials:29 - Trial = 9340/30000 | Total reward = 46.84
2022-01-26 14:17:10.251 | DEBUG    | __main__:trials:24 - Trial = 9341/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.253 | DEBUG    | __main__:trials:29 - Trial = 9341/30000 | Total reward = 48.61
2022-01-26 14:17:10.256 | DEBUG    | __main__:trials:24 - Trial = 9342/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.258 | DEBUG    | __main__:trials:29 - Trial = 9342/30000 | Total reward = 50.05
2022-01-26 14:17:10.261 | DEBUG    | __main__:trials:24 - Trial = 9343/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.262 | DEBUG    | __main__:trials:29 - Trial = 9343/30000 | Total reward = 45.45
2022-01-26 14:17:10.266 | DEBUG    | __main__:trials:24 - Trial = 9344/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.267 | DEBUG    | __main__:trials:29 - Trial = 9344/30000 | Total reward = 52.11
2022-01-26 14:17:10.270 | DEBUG    | __main__:trials:24 - Trial = 9345/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.272 | DEBUG    | __main__:trials:29 - Trial = 9345/30000 | Total reward = 57.24
2022-01-26 14:17:10.276 | DEBUG    | __main__:trials:24 - Trial = 9346/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.277 | DEBUG    | __main__:trials:29 - Trial = 9346/30000 | Total reward = 56.06
2022-01-26 14:17:10.281 | DEBUG    | __main__:trials:24 - Trial = 9347/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.282 | DEBUG    | __main__:trials:29 - Trial = 9347/30000 | Total reward = 43.81
2022-01-26 14:17:10.286 | DEBUG    | __main__:trials:24 - Trial = 9348/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.288 | DEBUG    | __main__:trials:29 - Trial = 9348/30000 | Total reward = 64.12
2022-01-26 14:17:10.291 | DEBUG    | __main__:trials:24 - Trial = 9349/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.292 | DEBUG    | __main__:trials:29 - Trial = 9349/30000 | Total reward = 47.71
2022-01-26 14:17:10.296 | DEBUG    | __main__:trials:24 - Trial = 9350/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.298 | DEBUG    | __main__:trials:29 - Trial = 9350/30000 | Total reward = 44.30
2022-01-26 14:17:10.302 | DEBUG    | __main__:trials:24 - Trial = 9351/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.302 | DEBUG    | __main__:trials:29 - Trial = 9351/30000 | Total reward = 52.17
2022-01-26 14:17:10.307 | DEBUG    | __main__:trials:24 - Trial = 9352/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.308 | DEBUG    | __main__:trials:29 - Trial = 9352/30000 | Total reward = 35.97
2022-01-26 14:17:10.312 | DEBUG    | __main__:trials:24 - Trial = 9353/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.313 | DEBUG    | __main__:trials:29 - Trial = 9353/30000 | Total reward = 46.69
2022-01-26 14:17:10.317 | DEBUG    | __main__:trials:24 - Trial = 9354/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.317 | DEBUG    | __main__:trials:29 - Trial = 9354/30000 | Total reward = 48.73
2022-01-26 14:17:10.321 | DEBUG    | __main__:trials:24 - Trial = 9355/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.323 | DEBUG    | __main__:trials:29 - Trial = 9355/30000 | Total reward = 39.83
2022-01-26 14:17:10.326 | DEBUG    | __main__:trials:24 - Trial = 9356/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.328 | DEBUG    | __main__:trials:29 - Trial = 9356/30000 | Total reward = 46.20
2022-01-26 14:17:10.330 | DEBUG    | __main__:trials:24 - Trial = 9357/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.332 | DEBUG    | __main__:trials:29 - Trial = 9357/30000 | Total reward = 34.55
2022-01-26 14:17:10.335 | DEBUG    | __main__:trials:24 - Trial = 9358/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.337 | DEBUG    | __main__:trials:29 - Trial = 9358/30000 | Total reward = 48.51
2022-01-26 14:17:10.340 | DEBUG    | __main__:trials:24 - Trial = 9359/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.341 | DEBUG    | __main__:trials:29 - Trial = 9359/30000 | Total reward = 49.81
2022-01-26 14:17:10.345 | DEBUG    | __main__:trials:24 - Trial = 9360/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.346 | DEBUG    | __main__:trials:29 - Trial = 9360/30000 | Total reward = 40.88
2022-01-26 14:17:10.349 | DEBUG    | __main__:trials:24 - Trial = 9361/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.350 | DEBUG    | __main__:trials:29 - Trial = 9361/30000 | Total reward = 44.28
2022-01-26 14:17:10.355 | DEBUG    | __main__:trials:24 - Trial = 9362/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.356 | DEBUG    | __main__:trials:29 - Trial = 9362/30000 | Total reward = 54.13
2022-01-26 14:17:10.359 | DEBUG    | __main__:trials:26 - Trial = 9363/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.360 | DEBUG    | __main__:trials:29 - Trial = 9363/30000 | Total reward = 14.93
2022-01-26 14:17:10.363 | DEBUG    | __main__:trials:26 - Trial = 9364/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.364 | DEBUG    | __main__:trials:29 - Trial = 9364/30000 | Total reward = 17.19
2022-01-26 14:17:10.367 | DEBUG    | __main__:trials:26 - Trial = 9365/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.367 | DEBUG    | __main__:trials:29 - Trial = 9365/30000 | Total reward = 14.93
2022-01-26 14:17:10.371 | DEBUG    | __main__:trials:24 - Trial = 9366/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.372 | DEBUG    | __main__:trials:29 - Trial = 9366/30000 | Total reward = 49.25
2022-01-26 14:17:10.376 | DEBUG    | __main__:trials:24 - Trial = 9367/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.377 | DEBUG    | __main__:trials:29 - Trial = 9367/30000 | Total reward = 47.95
2022-01-26 14:17:10.381 | DEBUG    | __main__:trials:24 - Trial = 9368/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.381 | DEBUG    | __main__:trials:29 - Trial = 9368/30000 | Total reward = 62.97
2022-01-26 14:17:10.385 | DEBUG    | __main__:trials:24 - Trial = 9369/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.386 | DEBUG    | __main__:trials:29 - Trial = 9369/30000 | Total reward = 56.31
2022-01-26 14:17:10.390 | DEBUG    | __main__:trials:24 - Trial = 9370/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.391 | DEBUG    | __main__:trials:29 - Trial = 9370/30000 | Total reward = 58.69
2022-01-26 14:17:10.395 | DEBUG    | __main__:trials:24 - Trial = 9371/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.395 | DEBUG    | __main__:trials:29 - Trial = 9371/30000 | Total reward = 24.75
2022-01-26 14:17:10.399 | DEBUG    | __main__:trials:24 - Trial = 9372/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.400 | DEBUG    | __main__:trials:29 - Trial = 9372/30000 | Total reward = 49.58
2022-01-26 14:17:10.404 | DEBUG    | __main__:trials:24 - Trial = 9373/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.405 | DEBUG    | __main__:trials:29 - Trial = 9373/30000 | Total reward = 47.30
2022-01-26 14:17:10.408 | DEBUG    | __main__:trials:24 - Trial = 9374/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.410 | DEBUG    | __main__:trials:29 - Trial = 9374/30000 | Total reward = 40.10
2022-01-26 14:17:10.414 | DEBUG    | __main__:trials:24 - Trial = 9375/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.415 | DEBUG    | __main__:trials:29 - Trial = 9375/30000 | Total reward = 47.08
2022-01-26 14:17:10.418 | DEBUG    | __main__:trials:24 - Trial = 9376/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.420 | DEBUG    | __main__:trials:29 - Trial = 9376/30000 | Total reward = 46.57
2022-01-26 14:17:10.423 | DEBUG    | __main__:trials:24 - Trial = 9377/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.425 | DEBUG    | __main__:trials:29 - Trial = 9377/30000 | Total reward = 48.02
2022-01-26 14:17:10.428 | DEBUG    | __main__:trials:24 - Trial = 9378/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.430 | DEBUG    | __main__:trials:29 - Trial = 9378/30000 | Total reward = 53.56
2022-01-26 14:17:10.433 | DEBUG    | __main__:trials:24 - Trial = 9379/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.434 | DEBUG    | __main__:trials:29 - Trial = 9379/30000 | Total reward = 51.24
2022-01-26 14:17:10.438 | DEBUG    | __main__:trials:24 - Trial = 9380/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.439 | DEBUG    | __main__:trials:29 - Trial = 9380/30000 | Total reward = 41.84
2022-01-26 14:17:10.443 | DEBUG    | __main__:trials:24 - Trial = 9381/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.444 | DEBUG    | __main__:trials:29 - Trial = 9381/30000 | Total reward = 49.67
2022-01-26 14:17:10.448 | DEBUG    | __main__:trials:24 - Trial = 9382/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.449 | DEBUG    | __main__:trials:29 - Trial = 9382/30000 | Total reward = 55.41
2022-01-26 14:17:10.453 | DEBUG    | __main__:trials:24 - Trial = 9383/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.454 | DEBUG    | __main__:trials:29 - Trial = 9383/30000 | Total reward = 53.74
2022-01-26 14:17:10.457 | DEBUG    | __main__:trials:24 - Trial = 9384/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.459 | DEBUG    | __main__:trials:29 - Trial = 9384/30000 | Total reward = 52.85
2022-01-26 14:17:10.463 | DEBUG    | __main__:trials:24 - Trial = 9385/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.464 | DEBUG    | __main__:trials:29 - Trial = 9385/30000 | Total reward = 46.91
2022-01-26 14:17:10.468 | DEBUG    | __main__:trials:24 - Trial = 9386/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.469 | DEBUG    | __main__:trials:29 - Trial = 9386/30000 | Total reward = 47.50
2022-01-26 14:17:10.473 | DEBUG    | __main__:trials:24 - Trial = 9387/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.474 | DEBUG    | __main__:trials:29 - Trial = 9387/30000 | Total reward = 54.62
2022-01-26 14:17:10.478 | DEBUG    | __main__:trials:24 - Trial = 9388/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.478 | DEBUG    | __main__:trials:29 - Trial = 9388/30000 | Total reward = 41.70
2022-01-26 14:17:10.483 | DEBUG    | __main__:trials:24 - Trial = 9389/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.485 | DEBUG    | __main__:trials:29 - Trial = 9389/30000 | Total reward = 45.87
2022-01-26 14:17:10.488 | DEBUG    | __main__:trials:24 - Trial = 9390/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.489 | DEBUG    | __main__:trials:29 - Trial = 9390/30000 | Total reward = 45.15
2022-01-26 14:17:10.492 | DEBUG    | __main__:trials:24 - Trial = 9391/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.493 | DEBUG    | __main__:trials:29 - Trial = 9391/30000 | Total reward = 41.19
2022-01-26 14:17:10.497 | DEBUG    | __main__:trials:24 - Trial = 9392/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.498 | DEBUG    | __main__:trials:29 - Trial = 9392/30000 | Total reward = 49.30
2022-01-26 14:17:10.502 | DEBUG    | __main__:trials:24 - Trial = 9393/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.503 | DEBUG    | __main__:trials:29 - Trial = 9393/30000 | Total reward = 59.96
2022-01-26 14:17:10.507 | DEBUG    | __main__:trials:24 - Trial = 9394/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.508 | DEBUG    | __main__:trials:29 - Trial = 9394/30000 | Total reward = 46.99
2022-01-26 14:17:10.512 | DEBUG    | __main__:trials:24 - Trial = 9395/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.513 | DEBUG    | __main__:trials:29 - Trial = 9395/30000 | Total reward = 48.46
2022-01-26 14:17:10.516 | DEBUG    | __main__:trials:26 - Trial = 9396/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.517 | DEBUG    | __main__:trials:29 - Trial = 9396/30000 | Total reward = 17.60
2022-01-26 14:17:10.520 | DEBUG    | __main__:trials:24 - Trial = 9397/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.522 | DEBUG    | __main__:trials:29 - Trial = 9397/30000 | Total reward = 45.25
2022-01-26 14:17:10.526 | DEBUG    | __main__:trials:24 - Trial = 9398/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.526 | DEBUG    | __main__:trials:29 - Trial = 9398/30000 | Total reward = 47.91
2022-01-26 14:17:10.531 | DEBUG    | __main__:trials:24 - Trial = 9399/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.531 | DEBUG    | __main__:trials:29 - Trial = 9399/30000 | Total reward = 47.71
2022-01-26 14:17:10.536 | DEBUG    | __main__:trials:24 - Trial = 9400/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.537 | DEBUG    | __main__:trials:29 - Trial = 9400/30000 | Total reward = 41.88
2022-01-26 14:17:10.540 | DEBUG    | __main__:trials:24 - Trial = 9401/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.542 | DEBUG    | __main__:trials:29 - Trial = 9401/30000 | Total reward = 34.03
2022-01-26 14:17:10.545 | DEBUG    | __main__:trials:24 - Trial = 9402/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.547 | DEBUG    | __main__:trials:29 - Trial = 9402/30000 | Total reward = 51.07
2022-01-26 14:17:10.550 | DEBUG    | __main__:trials:24 - Trial = 9403/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.552 | DEBUG    | __main__:trials:29 - Trial = 9403/30000 | Total reward = 32.07
2022-01-26 14:17:10.556 | DEBUG    | __main__:trials:24 - Trial = 9404/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.557 | DEBUG    | __main__:trials:29 - Trial = 9404/30000 | Total reward = 32.11
2022-01-26 14:17:10.561 | DEBUG    | __main__:trials:24 - Trial = 9405/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.562 | DEBUG    | __main__:trials:29 - Trial = 9405/30000 | Total reward = 43.60
2022-01-26 14:17:10.566 | DEBUG    | __main__:trials:24 - Trial = 9406/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.567 | DEBUG    | __main__:trials:29 - Trial = 9406/30000 | Total reward = 48.01
2022-01-26 14:17:10.571 | DEBUG    | __main__:trials:24 - Trial = 9407/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.572 | DEBUG    | __main__:trials:29 - Trial = 9407/30000 | Total reward = 42.96
2022-01-26 14:17:10.576 | DEBUG    | __main__:trials:24 - Trial = 9408/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.578 | DEBUG    | __main__:trials:29 - Trial = 9408/30000 | Total reward = 36.87
2022-01-26 14:17:10.581 | DEBUG    | __main__:trials:24 - Trial = 9409/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.582 | DEBUG    | __main__:trials:29 - Trial = 9409/30000 | Total reward = 44.93
2022-01-26 14:17:10.585 | DEBUG    | __main__:trials:24 - Trial = 9410/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.587 | DEBUG    | __main__:trials:29 - Trial = 9410/30000 | Total reward = 49.55
2022-01-26 14:17:10.590 | DEBUG    | __main__:trials:24 - Trial = 9411/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.592 | DEBUG    | __main__:trials:29 - Trial = 9411/30000 | Total reward = 47.03
2022-01-26 14:17:10.595 | DEBUG    | __main__:trials:24 - Trial = 9412/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.597 | DEBUG    | __main__:trials:29 - Trial = 9412/30000 | Total reward = 44.78
2022-01-26 14:17:10.600 | DEBUG    | __main__:trials:24 - Trial = 9413/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.602 | DEBUG    | __main__:trials:29 - Trial = 9413/30000 | Total reward = 47.50
2022-01-26 14:17:10.605 | DEBUG    | __main__:trials:24 - Trial = 9414/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.607 | DEBUG    | __main__:trials:29 - Trial = 9414/30000 | Total reward = 52.48
2022-01-26 14:17:10.610 | DEBUG    | __main__:trials:24 - Trial = 9415/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.612 | DEBUG    | __main__:trials:29 - Trial = 9415/30000 | Total reward = 46.67
2022-01-26 14:17:10.615 | DEBUG    | __main__:trials:24 - Trial = 9416/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.616 | DEBUG    | __main__:trials:29 - Trial = 9416/30000 | Total reward = 52.20
2022-01-26 14:17:10.620 | DEBUG    | __main__:trials:24 - Trial = 9417/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.621 | DEBUG    | __main__:trials:29 - Trial = 9417/30000 | Total reward = 48.14
2022-01-26 14:17:10.624 | DEBUG    | __main__:trials:24 - Trial = 9418/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.625 | DEBUG    | __main__:trials:29 - Trial = 9418/30000 | Total reward = 46.24
2022-01-26 14:17:10.629 | DEBUG    | __main__:trials:24 - Trial = 9419/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.630 | DEBUG    | __main__:trials:29 - Trial = 9419/30000 | Total reward = 50.13
2022-01-26 14:17:10.634 | DEBUG    | __main__:trials:24 - Trial = 9420/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.635 | DEBUG    | __main__:trials:29 - Trial = 9420/30000 | Total reward = 45.97
2022-01-26 14:17:10.638 | DEBUG    | __main__:trials:24 - Trial = 9421/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.640 | DEBUG    | __main__:trials:29 - Trial = 9421/30000 | Total reward = 46.78
2022-01-26 14:17:10.643 | DEBUG    | __main__:trials:24 - Trial = 9422/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.644 | DEBUG    | __main__:trials:29 - Trial = 9422/30000 | Total reward = 47.24
2022-01-26 14:17:10.648 | DEBUG    | __main__:trials:24 - Trial = 9423/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.649 | DEBUG    | __main__:trials:29 - Trial = 9423/30000 | Total reward = 45.95
2022-01-26 14:17:10.653 | DEBUG    | __main__:trials:24 - Trial = 9424/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.654 | DEBUG    | __main__:trials:29 - Trial = 9424/30000 | Total reward = 43.82
2022-01-26 14:17:10.658 | DEBUG    | __main__:trials:24 - Trial = 9425/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.659 | DEBUG    | __main__:trials:29 - Trial = 9425/30000 | Total reward = 53.89
2022-01-26 14:17:10.663 | DEBUG    | __main__:trials:24 - Trial = 9426/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.664 | DEBUG    | __main__:trials:29 - Trial = 9426/30000 | Total reward = 54.05
2022-01-26 14:17:10.667 | DEBUG    | __main__:trials:24 - Trial = 9427/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.669 | DEBUG    | __main__:trials:29 - Trial = 9427/30000 | Total reward = 44.93
2022-01-26 14:17:10.672 | DEBUG    | __main__:trials:24 - Trial = 9428/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.673 | DEBUG    | __main__:trials:29 - Trial = 9428/30000 | Total reward = 46.54
2022-01-26 14:17:10.676 | DEBUG    | __main__:trials:24 - Trial = 9429/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.678 | DEBUG    | __main__:trials:29 - Trial = 9429/30000 | Total reward = 46.98
2022-01-26 14:17:10.681 | DEBUG    | __main__:trials:24 - Trial = 9430/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.682 | DEBUG    | __main__:trials:29 - Trial = 9430/30000 | Total reward = 61.32
2022-01-26 14:17:10.685 | DEBUG    | __main__:trials:24 - Trial = 9431/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.686 | DEBUG    | __main__:trials:29 - Trial = 9431/30000 | Total reward = 33.34
2022-01-26 14:17:10.689 | DEBUG    | __main__:trials:24 - Trial = 9432/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.690 | DEBUG    | __main__:trials:29 - Trial = 9432/30000 | Total reward = 48.03
2022-01-26 14:17:10.694 | DEBUG    | __main__:trials:24 - Trial = 9433/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.695 | DEBUG    | __main__:trials:29 - Trial = 9433/30000 | Total reward = 40.81
2022-01-26 14:17:10.698 | DEBUG    | __main__:trials:24 - Trial = 9434/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.700 | DEBUG    | __main__:trials:29 - Trial = 9434/30000 | Total reward = 45.95
2022-01-26 14:17:10.704 | DEBUG    | __main__:trials:24 - Trial = 9435/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.704 | DEBUG    | __main__:trials:29 - Trial = 9435/30000 | Total reward = 33.74
2022-01-26 14:17:10.708 | DEBUG    | __main__:trials:24 - Trial = 9436/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.709 | DEBUG    | __main__:trials:29 - Trial = 9436/30000 | Total reward = 40.40
2022-01-26 14:17:10.714 | DEBUG    | __main__:trials:24 - Trial = 9437/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.715 | DEBUG    | __main__:trials:29 - Trial = 9437/30000 | Total reward = 47.32
2022-01-26 14:17:10.719 | DEBUG    | __main__:trials:24 - Trial = 9438/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.720 | DEBUG    | __main__:trials:29 - Trial = 9438/30000 | Total reward = 51.23
2022-01-26 14:17:10.724 | DEBUG    | __main__:trials:24 - Trial = 9439/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.726 | DEBUG    | __main__:trials:29 - Trial = 9439/30000 | Total reward = 42.87
2022-01-26 14:17:10.729 | DEBUG    | __main__:trials:24 - Trial = 9440/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.731 | DEBUG    | __main__:trials:29 - Trial = 9440/30000 | Total reward = 45.53
2022-01-26 14:17:10.735 | DEBUG    | __main__:trials:24 - Trial = 9441/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.735 | DEBUG    | __main__:trials:29 - Trial = 9441/30000 | Total reward = 59.43
2022-01-26 14:17:10.739 | DEBUG    | __main__:trials:24 - Trial = 9442/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.740 | DEBUG    | __main__:trials:29 - Trial = 9442/30000 | Total reward = 43.48
2022-01-26 14:17:10.744 | DEBUG    | __main__:trials:24 - Trial = 9443/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.745 | DEBUG    | __main__:trials:29 - Trial = 9443/30000 | Total reward = 51.24
2022-01-26 14:17:10.748 | DEBUG    | __main__:trials:24 - Trial = 9444/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.750 | DEBUG    | __main__:trials:29 - Trial = 9444/30000 | Total reward = 63.18
2022-01-26 14:17:10.754 | DEBUG    | __main__:trials:24 - Trial = 9445/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.755 | DEBUG    | __main__:trials:29 - Trial = 9445/30000 | Total reward = 40.53
2022-01-26 14:17:10.758 | DEBUG    | __main__:trials:24 - Trial = 9446/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.760 | DEBUG    | __main__:trials:29 - Trial = 9446/30000 | Total reward = 40.68
2022-01-26 14:17:10.764 | DEBUG    | __main__:trials:24 - Trial = 9447/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.765 | DEBUG    | __main__:trials:29 - Trial = 9447/30000 | Total reward = 48.68
2022-01-26 14:17:10.768 | DEBUG    | __main__:trials:24 - Trial = 9448/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.770 | DEBUG    | __main__:trials:29 - Trial = 9448/30000 | Total reward = 34.30
2022-01-26 14:17:10.774 | DEBUG    | __main__:trials:24 - Trial = 9449/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.775 | DEBUG    | __main__:trials:29 - Trial = 9449/30000 | Total reward = 47.75
2022-01-26 14:17:10.779 | DEBUG    | __main__:trials:24 - Trial = 9450/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.781 | DEBUG    | __main__:trials:29 - Trial = 9450/30000 | Total reward = 44.53
2022-01-26 14:17:10.784 | DEBUG    | __main__:trials:24 - Trial = 9451/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.786 | DEBUG    | __main__:trials:29 - Trial = 9451/30000 | Total reward = 48.03
2022-01-26 14:17:10.789 | DEBUG    | __main__:trials:24 - Trial = 9452/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.791 | DEBUG    | __main__:trials:29 - Trial = 9452/30000 | Total reward = 58.64
2022-01-26 14:17:10.794 | DEBUG    | __main__:trials:24 - Trial = 9453/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.796 | DEBUG    | __main__:trials:29 - Trial = 9453/30000 | Total reward = 46.65
2022-01-26 14:17:10.800 | DEBUG    | __main__:trials:24 - Trial = 9454/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.800 | DEBUG    | __main__:trials:29 - Trial = 9454/30000 | Total reward = 41.26
2022-01-26 14:17:10.805 | DEBUG    | __main__:trials:24 - Trial = 9455/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.806 | DEBUG    | __main__:trials:29 - Trial = 9455/30000 | Total reward = 63.57
2022-01-26 14:17:10.809 | DEBUG    | __main__:trials:24 - Trial = 9456/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.811 | DEBUG    | __main__:trials:29 - Trial = 9456/30000 | Total reward = 51.30
2022-01-26 14:17:10.815 | DEBUG    | __main__:trials:26 - Trial = 9457/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.815 | DEBUG    | __main__:trials:29 - Trial = 9457/30000 | Total reward = 39.76
2022-01-26 14:17:10.819 | DEBUG    | __main__:trials:24 - Trial = 9458/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.821 | DEBUG    | __main__:trials:29 - Trial = 9458/30000 | Total reward = 41.21
2022-01-26 14:17:10.824 | DEBUG    | __main__:trials:24 - Trial = 9459/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.825 | DEBUG    | __main__:trials:29 - Trial = 9459/30000 | Total reward = 55.59
2022-01-26 14:17:10.829 | DEBUG    | __main__:trials:24 - Trial = 9460/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.830 | DEBUG    | __main__:trials:29 - Trial = 9460/30000 | Total reward = 45.24
2022-01-26 14:17:10.835 | DEBUG    | __main__:trials:24 - Trial = 9461/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.836 | DEBUG    | __main__:trials:29 - Trial = 9461/30000 | Total reward = 43.79
2022-01-26 14:17:10.839 | DEBUG    | __main__:trials:24 - Trial = 9462/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.841 | DEBUG    | __main__:trials:29 - Trial = 9462/30000 | Total reward = 47.03
2022-01-26 14:17:10.844 | DEBUG    | __main__:trials:24 - Trial = 9463/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.846 | DEBUG    | __main__:trials:29 - Trial = 9463/30000 | Total reward = 34.34
2022-01-26 14:17:10.849 | DEBUG    | __main__:trials:24 - Trial = 9464/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.850 | DEBUG    | __main__:trials:29 - Trial = 9464/30000 | Total reward = 55.46
2022-01-26 14:17:10.853 | DEBUG    | __main__:trials:26 - Trial = 9465/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.854 | DEBUG    | __main__:trials:29 - Trial = 9465/30000 | Total reward = 22.44
2022-01-26 14:17:10.858 | DEBUG    | __main__:trials:24 - Trial = 9466/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.858 | DEBUG    | __main__:trials:29 - Trial = 9466/30000 | Total reward = 36.46
2022-01-26 14:17:10.863 | DEBUG    | __main__:trials:24 - Trial = 9467/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.865 | DEBUG    | __main__:trials:29 - Trial = 9467/30000 | Total reward = 42.38
2022-01-26 14:17:10.868 | DEBUG    | __main__:trials:24 - Trial = 9468/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.870 | DEBUG    | __main__:trials:29 - Trial = 9468/30000 | Total reward = 46.91
2022-01-26 14:17:10.873 | DEBUG    | __main__:trials:26 - Trial = 9469/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:10.874 | DEBUG    | __main__:trials:29 - Trial = 9469/30000 | Total reward = 26.54
2022-01-26 14:17:10.877 | DEBUG    | __main__:trials:24 - Trial = 9470/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.879 | DEBUG    | __main__:trials:29 - Trial = 9470/30000 | Total reward = 41.37
2022-01-26 14:17:10.882 | DEBUG    | __main__:trials:24 - Trial = 9471/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.884 | DEBUG    | __main__:trials:29 - Trial = 9471/30000 | Total reward = 47.22
2022-01-26 14:17:10.888 | DEBUG    | __main__:trials:24 - Trial = 9472/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.888 | DEBUG    | __main__:trials:29 - Trial = 9472/30000 | Total reward = 46.55
2022-01-26 14:17:10.893 | DEBUG    | __main__:trials:24 - Trial = 9473/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.894 | DEBUG    | __main__:trials:29 - Trial = 9473/30000 | Total reward = 37.04
2022-01-26 14:17:10.898 | DEBUG    | __main__:trials:24 - Trial = 9474/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.898 | DEBUG    | __main__:trials:29 - Trial = 9474/30000 | Total reward = 41.22
2022-01-26 14:17:10.903 | DEBUG    | __main__:trials:24 - Trial = 9475/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.904 | DEBUG    | __main__:trials:29 - Trial = 9475/30000 | Total reward = 47.80
2022-01-26 14:17:10.908 | DEBUG    | __main__:trials:24 - Trial = 9476/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.910 | DEBUG    | __main__:trials:29 - Trial = 9476/30000 | Total reward = 47.83
2022-01-26 14:17:10.913 | DEBUG    | __main__:trials:24 - Trial = 9477/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.915 | DEBUG    | __main__:trials:29 - Trial = 9477/30000 | Total reward = 45.07
2022-01-26 14:17:10.918 | DEBUG    | __main__:trials:24 - Trial = 9478/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.919 | DEBUG    | __main__:trials:29 - Trial = 9478/30000 | Total reward = 47.68
2022-01-26 14:17:10.923 | DEBUG    | __main__:trials:24 - Trial = 9479/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.925 | DEBUG    | __main__:trials:29 - Trial = 9479/30000 | Total reward = 43.70
2022-01-26 14:17:10.927 | DEBUG    | __main__:trials:24 - Trial = 9480/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.929 | DEBUG    | __main__:trials:29 - Trial = 9480/30000 | Total reward = 43.04
2022-01-26 14:17:10.932 | DEBUG    | __main__:trials:24 - Trial = 9481/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.933 | DEBUG    | __main__:trials:29 - Trial = 9481/30000 | Total reward = 31.68
2022-01-26 14:17:10.936 | DEBUG    | __main__:trials:24 - Trial = 9482/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.937 | DEBUG    | __main__:trials:29 - Trial = 9482/30000 | Total reward = 45.05
2022-01-26 14:17:10.941 | DEBUG    | __main__:trials:24 - Trial = 9483/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.942 | DEBUG    | __main__:trials:29 - Trial = 9483/30000 | Total reward = 49.85
2022-01-26 14:17:10.946 | DEBUG    | __main__:trials:24 - Trial = 9484/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.947 | DEBUG    | __main__:trials:29 - Trial = 9484/30000 | Total reward = 48.15
2022-01-26 14:17:10.951 | DEBUG    | __main__:trials:24 - Trial = 9485/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.951 | DEBUG    | __main__:trials:29 - Trial = 9485/30000 | Total reward = 47.15
2022-01-26 14:17:10.956 | DEBUG    | __main__:trials:24 - Trial = 9486/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.956 | DEBUG    | __main__:trials:29 - Trial = 9486/30000 | Total reward = 45.56
2022-01-26 14:17:10.961 | DEBUG    | __main__:trials:24 - Trial = 9487/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.962 | DEBUG    | __main__:trials:29 - Trial = 9487/30000 | Total reward = 43.66
2022-01-26 14:17:10.965 | DEBUG    | __main__:trials:24 - Trial = 9488/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.967 | DEBUG    | __main__:trials:29 - Trial = 9488/30000 | Total reward = 45.45
2022-01-26 14:17:10.970 | DEBUG    | __main__:trials:24 - Trial = 9489/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.972 | DEBUG    | __main__:trials:29 - Trial = 9489/30000 | Total reward = 34.86
2022-01-26 14:17:10.976 | DEBUG    | __main__:trials:24 - Trial = 9490/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.976 | DEBUG    | __main__:trials:29 - Trial = 9490/30000 | Total reward = 47.03
2022-01-26 14:17:10.981 | DEBUG    | __main__:trials:24 - Trial = 9491/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.983 | DEBUG    | __main__:trials:29 - Trial = 9491/30000 | Total reward = 47.03
2022-01-26 14:17:10.986 | DEBUG    | __main__:trials:24 - Trial = 9492/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.988 | DEBUG    | __main__:trials:29 - Trial = 9492/30000 | Total reward = 38.75
2022-01-26 14:17:10.991 | DEBUG    | __main__:trials:24 - Trial = 9493/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.993 | DEBUG    | __main__:trials:29 - Trial = 9493/30000 | Total reward = 49.30
2022-01-26 14:17:10.996 | DEBUG    | __main__:trials:24 - Trial = 9494/30000 | Max number of steps (20) reached
2022-01-26 14:17:10.998 | DEBUG    | __main__:trials:29 - Trial = 9494/30000 | Total reward = 48.58
2022-01-26 14:17:11.002 | DEBUG    | __main__:trials:24 - Trial = 9495/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.002 | DEBUG    | __main__:trials:29 - Trial = 9495/30000 | Total reward = 59.42
2022-01-26 14:17:11.007 | DEBUG    | __main__:trials:24 - Trial = 9496/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.008 | DEBUG    | __main__:trials:29 - Trial = 9496/30000 | Total reward = 47.21
2022-01-26 14:17:11.011 | DEBUG    | __main__:trials:24 - Trial = 9497/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.013 | DEBUG    | __main__:trials:29 - Trial = 9497/30000 | Total reward = 45.51
2022-01-26 14:17:11.016 | DEBUG    | __main__:trials:24 - Trial = 9498/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.018 | DEBUG    | __main__:trials:29 - Trial = 9498/30000 | Total reward = 47.86
2022-01-26 14:17:11.022 | DEBUG    | __main__:trials:24 - Trial = 9499/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.022 | DEBUG    | __main__:trials:29 - Trial = 9499/30000 | Total reward = 62.21
2022-01-26 14:17:11.027 | DEBUG    | __main__:trials:24 - Trial = 9500/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.028 | DEBUG    | __main__:trials:29 - Trial = 9500/30000 | Total reward = 53.32
2022-01-26 14:17:11.031 | DEBUG    | __main__:trials:24 - Trial = 9501/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.033 | DEBUG    | __main__:trials:29 - Trial = 9501/30000 | Total reward = 48.27
2022-01-26 14:17:11.036 | DEBUG    | __main__:trials:24 - Trial = 9502/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.037 | DEBUG    | __main__:trials:29 - Trial = 9502/30000 | Total reward = 33.86
2022-01-26 14:17:11.040 | DEBUG    | __main__:trials:24 - Trial = 9503/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.042 | DEBUG    | __main__:trials:29 - Trial = 9503/30000 | Total reward = 41.22
2022-01-26 14:17:11.045 | DEBUG    | __main__:trials:24 - Trial = 9504/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.045 | DEBUG    | __main__:trials:29 - Trial = 9504/30000 | Total reward = 57.64
2022-01-26 14:17:11.050 | DEBUG    | __main__:trials:24 - Trial = 9505/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.050 | DEBUG    | __main__:trials:29 - Trial = 9505/30000 | Total reward = 45.48
2022-01-26 14:17:11.055 | DEBUG    | __main__:trials:24 - Trial = 9506/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.057 | DEBUG    | __main__:trials:29 - Trial = 9506/30000 | Total reward = 62.30
2022-01-26 14:17:11.060 | DEBUG    | __main__:trials:24 - Trial = 9507/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.062 | DEBUG    | __main__:trials:29 - Trial = 9507/30000 | Total reward = 41.99
2022-01-26 14:17:11.066 | DEBUG    | __main__:trials:24 - Trial = 9508/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.067 | DEBUG    | __main__:trials:29 - Trial = 9508/30000 | Total reward = 48.31
2022-01-26 14:17:11.070 | DEBUG    | __main__:trials:24 - Trial = 9509/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.072 | DEBUG    | __main__:trials:29 - Trial = 9509/30000 | Total reward = 46.33
2022-01-26 14:17:11.075 | DEBUG    | __main__:trials:24 - Trial = 9510/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.077 | DEBUG    | __main__:trials:29 - Trial = 9510/30000 | Total reward = 46.91
2022-01-26 14:17:11.079 | DEBUG    | __main__:trials:24 - Trial = 9511/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.081 | DEBUG    | __main__:trials:29 - Trial = 9511/30000 | Total reward = 47.06
2022-01-26 14:17:11.084 | DEBUG    | __main__:trials:24 - Trial = 9512/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.086 | DEBUG    | __main__:trials:29 - Trial = 9512/30000 | Total reward = 40.74
2022-01-26 14:17:11.089 | DEBUG    | __main__:trials:24 - Trial = 9513/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.091 | DEBUG    | __main__:trials:29 - Trial = 9513/30000 | Total reward = 50.99
2022-01-26 14:17:11.095 | DEBUG    | __main__:trials:24 - Trial = 9514/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.095 | DEBUG    | __main__:trials:29 - Trial = 9514/30000 | Total reward = 41.10
2022-01-26 14:17:11.100 | DEBUG    | __main__:trials:24 - Trial = 9515/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.100 | DEBUG    | __main__:trials:29 - Trial = 9515/30000 | Total reward = 40.20
2022-01-26 14:17:11.104 | DEBUG    | __main__:trials:26 - Trial = 9516/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:11.106 | DEBUG    | __main__:trials:29 - Trial = 9516/30000 | Total reward = 22.18
2022-01-26 14:17:11.108 | DEBUG    | __main__:trials:24 - Trial = 9517/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.109 | DEBUG    | __main__:trials:29 - Trial = 9517/30000 | Total reward = 62.18
2022-01-26 14:17:11.113 | DEBUG    | __main__:trials:24 - Trial = 9518/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.113 | DEBUG    | __main__:trials:29 - Trial = 9518/30000 | Total reward = 53.04
2022-01-26 14:17:11.117 | DEBUG    | __main__:trials:24 - Trial = 9519/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.118 | DEBUG    | __main__:trials:29 - Trial = 9519/30000 | Total reward = 47.15
2022-01-26 14:17:11.122 | DEBUG    | __main__:trials:24 - Trial = 9520/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.123 | DEBUG    | __main__:trials:29 - Trial = 9520/30000 | Total reward = 47.03
2022-01-26 14:17:11.126 | DEBUG    | __main__:trials:24 - Trial = 9521/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.128 | DEBUG    | __main__:trials:29 - Trial = 9521/30000 | Total reward = 39.61
2022-01-26 14:17:11.131 | DEBUG    | __main__:trials:24 - Trial = 9522/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.133 | DEBUG    | __main__:trials:29 - Trial = 9522/30000 | Total reward = 63.78
2022-01-26 14:17:11.136 | DEBUG    | __main__:trials:24 - Trial = 9523/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.137 | DEBUG    | __main__:trials:29 - Trial = 9523/30000 | Total reward = 50.28
2022-01-26 14:17:11.140 | DEBUG    | __main__:trials:24 - Trial = 9524/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.141 | DEBUG    | __main__:trials:29 - Trial = 9524/30000 | Total reward = 42.23
2022-01-26 14:17:11.145 | DEBUG    | __main__:trials:24 - Trial = 9525/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.146 | DEBUG    | __main__:trials:29 - Trial = 9525/30000 | Total reward = 44.51
2022-01-26 14:17:11.149 | DEBUG    | __main__:trials:24 - Trial = 9526/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.151 | DEBUG    | __main__:trials:29 - Trial = 9526/30000 | Total reward = 47.39
2022-01-26 14:17:11.153 | DEBUG    | __main__:trials:24 - Trial = 9527/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.154 | DEBUG    | __main__:trials:29 - Trial = 9527/30000 | Total reward = 47.03
2022-01-26 14:17:11.157 | DEBUG    | __main__:trials:24 - Trial = 9528/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.158 | DEBUG    | __main__:trials:29 - Trial = 9528/30000 | Total reward = 30.26
2022-01-26 14:17:11.162 | DEBUG    | __main__:trials:24 - Trial = 9529/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.163 | DEBUG    | __main__:trials:29 - Trial = 9529/30000 | Total reward = 39.11
2022-01-26 14:17:11.166 | DEBUG    | __main__:trials:24 - Trial = 9530/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.167 | DEBUG    | __main__:trials:29 - Trial = 9530/30000 | Total reward = 47.21
2022-01-26 14:17:11.171 | DEBUG    | __main__:trials:24 - Trial = 9531/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.171 | DEBUG    | __main__:trials:29 - Trial = 9531/30000 | Total reward = 46.77
2022-01-26 14:17:11.175 | DEBUG    | __main__:trials:24 - Trial = 9532/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.175 | DEBUG    | __main__:trials:29 - Trial = 9532/30000 | Total reward = 50.38
2022-01-26 14:17:11.178 | DEBUG    | __main__:trials:24 - Trial = 9533/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.179 | DEBUG    | __main__:trials:29 - Trial = 9533/30000 | Total reward = 40.41
2022-01-26 14:17:11.183 | DEBUG    | __main__:trials:24 - Trial = 9534/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.184 | DEBUG    | __main__:trials:29 - Trial = 9534/30000 | Total reward = 47.03
2022-01-26 14:17:11.188 | DEBUG    | __main__:trials:24 - Trial = 9535/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.188 | DEBUG    | __main__:trials:29 - Trial = 9535/30000 | Total reward = 51.68
2022-01-26 14:17:11.192 | DEBUG    | __main__:trials:24 - Trial = 9536/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.193 | DEBUG    | __main__:trials:29 - Trial = 9536/30000 | Total reward = 43.89
2022-01-26 14:17:11.197 | DEBUG    | __main__:trials:24 - Trial = 9537/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.198 | DEBUG    | __main__:trials:29 - Trial = 9537/30000 | Total reward = 36.04
2022-01-26 14:17:11.201 | DEBUG    | __main__:trials:24 - Trial = 9538/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.202 | DEBUG    | __main__:trials:29 - Trial = 9538/30000 | Total reward = 40.66
2022-01-26 14:17:11.205 | DEBUG    | __main__:trials:24 - Trial = 9539/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.207 | DEBUG    | __main__:trials:29 - Trial = 9539/30000 | Total reward = 35.87
2022-01-26 14:17:11.210 | DEBUG    | __main__:trials:24 - Trial = 9540/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.211 | DEBUG    | __main__:trials:29 - Trial = 9540/30000 | Total reward = 54.52
2022-01-26 14:17:11.214 | DEBUG    | __main__:trials:24 - Trial = 9541/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.215 | DEBUG    | __main__:trials:29 - Trial = 9541/30000 | Total reward = 50.54
2022-01-26 14:17:11.219 | DEBUG    | __main__:trials:24 - Trial = 9542/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.220 | DEBUG    | __main__:trials:29 - Trial = 9542/30000 | Total reward = 48.76
2022-01-26 14:17:11.223 | DEBUG    | __main__:trials:24 - Trial = 9543/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.224 | DEBUG    | __main__:trials:29 - Trial = 9543/30000 | Total reward = 39.25
2022-01-26 14:17:11.227 | DEBUG    | __main__:trials:24 - Trial = 9544/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.229 | DEBUG    | __main__:trials:29 - Trial = 9544/30000 | Total reward = 41.59
2022-01-26 14:17:11.233 | DEBUG    | __main__:trials:24 - Trial = 9545/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.233 | DEBUG    | __main__:trials:29 - Trial = 9545/30000 | Total reward = 61.13
2022-01-26 14:17:11.237 | DEBUG    | __main__:trials:24 - Trial = 9546/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.238 | DEBUG    | __main__:trials:29 - Trial = 9546/30000 | Total reward = 40.10
2022-01-26 14:17:11.242 | DEBUG    | __main__:trials:24 - Trial = 9547/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.243 | DEBUG    | __main__:trials:29 - Trial = 9547/30000 | Total reward = 41.40
2022-01-26 14:17:11.247 | DEBUG    | __main__:trials:24 - Trial = 9548/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.248 | DEBUG    | __main__:trials:29 - Trial = 9548/30000 | Total reward = 44.03
2022-01-26 14:17:11.252 | DEBUG    | __main__:trials:24 - Trial = 9549/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.252 | DEBUG    | __main__:trials:29 - Trial = 9549/30000 | Total reward = 39.13
2022-01-26 14:17:11.257 | DEBUG    | __main__:trials:24 - Trial = 9550/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.258 | DEBUG    | __main__:trials:29 - Trial = 9550/30000 | Total reward = 64.54
2022-01-26 14:17:11.261 | DEBUG    | __main__:trials:24 - Trial = 9551/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.263 | DEBUG    | __main__:trials:29 - Trial = 9551/30000 | Total reward = 46.34
2022-01-26 14:17:11.266 | DEBUG    | __main__:trials:24 - Trial = 9552/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.268 | DEBUG    | __main__:trials:29 - Trial = 9552/30000 | Total reward = 47.03
2022-01-26 14:17:11.271 | DEBUG    | __main__:trials:24 - Trial = 9553/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.273 | DEBUG    | __main__:trials:29 - Trial = 9553/30000 | Total reward = 41.98
2022-01-26 14:17:11.276 | DEBUG    | __main__:trials:24 - Trial = 9554/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.278 | DEBUG    | __main__:trials:29 - Trial = 9554/30000 | Total reward = 41.93
2022-01-26 14:17:11.282 | DEBUG    | __main__:trials:24 - Trial = 9555/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.283 | DEBUG    | __main__:trials:29 - Trial = 9555/30000 | Total reward = 40.64
2022-01-26 14:17:11.287 | DEBUG    | __main__:trials:24 - Trial = 9556/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.288 | DEBUG    | __main__:trials:29 - Trial = 9556/30000 | Total reward = 45.97
2022-01-26 14:17:11.292 | DEBUG    | __main__:trials:24 - Trial = 9557/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.294 | DEBUG    | __main__:trials:29 - Trial = 9557/30000 | Total reward = 53.64
2022-01-26 14:17:11.297 | DEBUG    | __main__:trials:24 - Trial = 9558/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.299 | DEBUG    | __main__:trials:29 - Trial = 9558/30000 | Total reward = 42.54
2022-01-26 14:17:11.302 | DEBUG    | __main__:trials:24 - Trial = 9559/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.303 | DEBUG    | __main__:trials:29 - Trial = 9559/30000 | Total reward = 53.47
2022-01-26 14:17:11.307 | DEBUG    | __main__:trials:24 - Trial = 9560/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.308 | DEBUG    | __main__:trials:29 - Trial = 9560/30000 | Total reward = 48.41
2022-01-26 14:17:11.312 | DEBUG    | __main__:trials:24 - Trial = 9561/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.313 | DEBUG    | __main__:trials:29 - Trial = 9561/30000 | Total reward = 47.87
2022-01-26 14:17:11.317 | DEBUG    | __main__:trials:24 - Trial = 9562/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.319 | DEBUG    | __main__:trials:29 - Trial = 9562/30000 | Total reward = 47.03
2022-01-26 14:17:11.323 | DEBUG    | __main__:trials:24 - Trial = 9563/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.324 | DEBUG    | __main__:trials:29 - Trial = 9563/30000 | Total reward = 45.16
2022-01-26 14:17:11.328 | DEBUG    | __main__:trials:24 - Trial = 9564/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.329 | DEBUG    | __main__:trials:29 - Trial = 9564/30000 | Total reward = 40.65
2022-01-26 14:17:11.332 | DEBUG    | __main__:trials:24 - Trial = 9565/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.334 | DEBUG    | __main__:trials:29 - Trial = 9565/30000 | Total reward = 42.85
2022-01-26 14:17:11.337 | DEBUG    | __main__:trials:24 - Trial = 9566/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.339 | DEBUG    | __main__:trials:29 - Trial = 9566/30000 | Total reward = 46.91
2022-01-26 14:17:11.342 | DEBUG    | __main__:trials:24 - Trial = 9567/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.342 | DEBUG    | __main__:trials:29 - Trial = 9567/30000 | Total reward = 45.68
2022-01-26 14:17:11.346 | DEBUG    | __main__:trials:24 - Trial = 9568/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.347 | DEBUG    | __main__:trials:29 - Trial = 9568/30000 | Total reward = 37.10
2022-01-26 14:17:11.351 | DEBUG    | __main__:trials:24 - Trial = 9569/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.352 | DEBUG    | __main__:trials:29 - Trial = 9569/30000 | Total reward = 50.05
2022-01-26 14:17:11.356 | DEBUG    | __main__:trials:24 - Trial = 9570/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.357 | DEBUG    | __main__:trials:29 - Trial = 9570/30000 | Total reward = 44.65
2022-01-26 14:17:11.364 | DEBUG    | __main__:trials:24 - Trial = 9571/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.365 | DEBUG    | __main__:trials:29 - Trial = 9571/30000 | Total reward = 35.23
2022-01-26 14:17:11.368 | DEBUG    | __main__:trials:24 - Trial = 9572/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.369 | DEBUG    | __main__:trials:29 - Trial = 9572/30000 | Total reward = 68.01
2022-01-26 14:17:11.372 | DEBUG    | __main__:trials:24 - Trial = 9573/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.373 | DEBUG    | __main__:trials:29 - Trial = 9573/30000 | Total reward = 50.38
2022-01-26 14:17:11.376 | DEBUG    | __main__:trials:24 - Trial = 9574/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.376 | DEBUG    | __main__:trials:29 - Trial = 9574/30000 | Total reward = 32.62
2022-01-26 14:17:11.379 | DEBUG    | __main__:trials:26 - Trial = 9575/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:11.379 | DEBUG    | __main__:trials:29 - Trial = 9575/30000 | Total reward = 12.87
2022-01-26 14:17:11.382 | DEBUG    | __main__:trials:24 - Trial = 9576/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.383 | DEBUG    | __main__:trials:29 - Trial = 9576/30000 | Total reward = 53.14
2022-01-26 14:17:11.386 | DEBUG    | __main__:trials:24 - Trial = 9577/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.387 | DEBUG    | __main__:trials:29 - Trial = 9577/30000 | Total reward = 43.53
2022-01-26 14:17:11.390 | DEBUG    | __main__:trials:24 - Trial = 9578/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.391 | DEBUG    | __main__:trials:29 - Trial = 9578/30000 | Total reward = 39.36
2022-01-26 14:17:11.394 | DEBUG    | __main__:trials:24 - Trial = 9579/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.394 | DEBUG    | __main__:trials:29 - Trial = 9579/30000 | Total reward = 47.62
2022-01-26 14:17:11.397 | DEBUG    | __main__:trials:24 - Trial = 9580/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.398 | DEBUG    | __main__:trials:29 - Trial = 9580/30000 | Total reward = 60.05
2022-01-26 14:17:11.401 | DEBUG    | __main__:trials:24 - Trial = 9581/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.402 | DEBUG    | __main__:trials:29 - Trial = 9581/30000 | Total reward = 48.20
2022-01-26 14:17:11.405 | DEBUG    | __main__:trials:24 - Trial = 9582/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.406 | DEBUG    | __main__:trials:29 - Trial = 9582/30000 | Total reward = 58.47
2022-01-26 14:17:11.409 | DEBUG    | __main__:trials:24 - Trial = 9583/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.409 | DEBUG    | __main__:trials:29 - Trial = 9583/30000 | Total reward = 40.74
2022-01-26 14:17:11.412 | DEBUG    | __main__:trials:24 - Trial = 9584/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.413 | DEBUG    | __main__:trials:29 - Trial = 9584/30000 | Total reward = 48.69
2022-01-26 14:17:11.417 | DEBUG    | __main__:trials:24 - Trial = 9585/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.417 | DEBUG    | __main__:trials:29 - Trial = 9585/30000 | Total reward = 39.71
2022-01-26 14:17:11.420 | DEBUG    | __main__:trials:24 - Trial = 9586/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.421 | DEBUG    | __main__:trials:29 - Trial = 9586/30000 | Total reward = 54.48
2022-01-26 14:17:11.424 | DEBUG    | __main__:trials:24 - Trial = 9587/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.425 | DEBUG    | __main__:trials:29 - Trial = 9587/30000 | Total reward = 52.95
2022-01-26 14:17:11.428 | DEBUG    | __main__:trials:24 - Trial = 9588/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.428 | DEBUG    | __main__:trials:29 - Trial = 9588/30000 | Total reward = 52.95
2022-01-26 14:17:11.431 | DEBUG    | __main__:trials:24 - Trial = 9589/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.432 | DEBUG    | __main__:trials:29 - Trial = 9589/30000 | Total reward = 58.58
2022-01-26 14:17:11.435 | DEBUG    | __main__:trials:24 - Trial = 9590/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.436 | DEBUG    | __main__:trials:29 - Trial = 9590/30000 | Total reward = 46.09
2022-01-26 14:17:11.439 | DEBUG    | __main__:trials:24 - Trial = 9591/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.440 | DEBUG    | __main__:trials:29 - Trial = 9591/30000 | Total reward = 47.34
2022-01-26 14:17:11.443 | DEBUG    | __main__:trials:24 - Trial = 9592/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.443 | DEBUG    | __main__:trials:29 - Trial = 9592/30000 | Total reward = 44.39
2022-01-26 14:17:11.446 | DEBUG    | __main__:trials:24 - Trial = 9593/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.447 | DEBUG    | __main__:trials:29 - Trial = 9593/30000 | Total reward = 44.28
2022-01-26 14:17:11.450 | DEBUG    | __main__:trials:24 - Trial = 9594/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.451 | DEBUG    | __main__:trials:29 - Trial = 9594/30000 | Total reward = 43.66
2022-01-26 14:17:11.454 | DEBUG    | __main__:trials:24 - Trial = 9595/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.455 | DEBUG    | __main__:trials:29 - Trial = 9595/30000 | Total reward = 48.03
2022-01-26 14:17:11.458 | DEBUG    | __main__:trials:24 - Trial = 9596/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.458 | DEBUG    | __main__:trials:29 - Trial = 9596/30000 | Total reward = 41.02
2022-01-26 14:17:11.461 | DEBUG    | __main__:trials:24 - Trial = 9597/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.462 | DEBUG    | __main__:trials:29 - Trial = 9597/30000 | Total reward = 58.64
2022-01-26 14:17:11.465 | DEBUG    | __main__:trials:24 - Trial = 9598/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.466 | DEBUG    | __main__:trials:29 - Trial = 9598/30000 | Total reward = 30.82
2022-01-26 14:17:11.469 | DEBUG    | __main__:trials:24 - Trial = 9599/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.470 | DEBUG    | __main__:trials:29 - Trial = 9599/30000 | Total reward = 49.75
2022-01-26 14:17:11.473 | DEBUG    | __main__:trials:24 - Trial = 9600/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.474 | DEBUG    | __main__:trials:29 - Trial = 9600/30000 | Total reward = 66.95
2022-01-26 14:17:11.477 | DEBUG    | __main__:trials:24 - Trial = 9601/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.479 | DEBUG    | __main__:trials:29 - Trial = 9601/30000 | Total reward = 46.93
2022-01-26 14:17:11.482 | DEBUG    | __main__:trials:24 - Trial = 9602/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.484 | DEBUG    | __main__:trials:29 - Trial = 9602/30000 | Total reward = 46.87
2022-01-26 14:17:11.487 | DEBUG    | __main__:trials:24 - Trial = 9603/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.489 | DEBUG    | __main__:trials:29 - Trial = 9603/30000 | Total reward = 47.66
2022-01-26 14:17:11.493 | DEBUG    | __main__:trials:24 - Trial = 9604/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.494 | DEBUG    | __main__:trials:29 - Trial = 9604/30000 | Total reward = 44.85
2022-01-26 14:17:11.497 | DEBUG    | __main__:trials:24 - Trial = 9605/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.498 | DEBUG    | __main__:trials:29 - Trial = 9605/30000 | Total reward = 47.86
2022-01-26 14:17:11.501 | DEBUG    | __main__:trials:24 - Trial = 9606/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.503 | DEBUG    | __main__:trials:29 - Trial = 9606/30000 | Total reward = 61.89
2022-01-26 14:17:11.506 | DEBUG    | __main__:trials:24 - Trial = 9607/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.507 | DEBUG    | __main__:trials:29 - Trial = 9607/30000 | Total reward = 58.64
2022-01-26 14:17:11.510 | DEBUG    | __main__:trials:24 - Trial = 9608/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.511 | DEBUG    | __main__:trials:29 - Trial = 9608/30000 | Total reward = 37.77
2022-01-26 14:17:11.514 | DEBUG    | __main__:trials:24 - Trial = 9609/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.516 | DEBUG    | __main__:trials:29 - Trial = 9609/30000 | Total reward = 33.16
2022-01-26 14:17:11.519 | DEBUG    | __main__:trials:24 - Trial = 9610/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.521 | DEBUG    | __main__:trials:29 - Trial = 9610/30000 | Total reward = 58.81
2022-01-26 14:17:11.524 | DEBUG    | __main__:trials:24 - Trial = 9611/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.527 | DEBUG    | __main__:trials:29 - Trial = 9611/30000 | Total reward = 35.78
2022-01-26 14:17:11.530 | DEBUG    | __main__:trials:24 - Trial = 9612/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.532 | DEBUG    | __main__:trials:29 - Trial = 9612/30000 | Total reward = 42.75
2022-01-26 14:17:11.536 | DEBUG    | __main__:trials:24 - Trial = 9613/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.536 | DEBUG    | __main__:trials:29 - Trial = 9613/30000 | Total reward = 39.74
2022-01-26 14:17:11.541 | DEBUG    | __main__:trials:24 - Trial = 9614/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.541 | DEBUG    | __main__:trials:29 - Trial = 9614/30000 | Total reward = 48.03
2022-01-26 14:17:11.545 | DEBUG    | __main__:trials:24 - Trial = 9615/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.548 | DEBUG    | __main__:trials:29 - Trial = 9615/30000 | Total reward = 41.45
2022-01-26 14:17:11.551 | DEBUG    | __main__:trials:24 - Trial = 9616/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.552 | DEBUG    | __main__:trials:29 - Trial = 9616/30000 | Total reward = 37.98
2022-01-26 14:17:11.556 | DEBUG    | __main__:trials:24 - Trial = 9617/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.557 | DEBUG    | __main__:trials:29 - Trial = 9617/30000 | Total reward = 43.54
2022-01-26 14:17:11.561 | DEBUG    | __main__:trials:24 - Trial = 9618/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.562 | DEBUG    | __main__:trials:29 - Trial = 9618/30000 | Total reward = 48.03
2022-01-26 14:17:11.566 | DEBUG    | __main__:trials:24 - Trial = 9619/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.568 | DEBUG    | __main__:trials:29 - Trial = 9619/30000 | Total reward = 49.50
2022-01-26 14:17:11.571 | DEBUG    | __main__:trials:24 - Trial = 9620/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.573 | DEBUG    | __main__:trials:29 - Trial = 9620/30000 | Total reward = 46.25
2022-01-26 14:17:11.576 | DEBUG    | __main__:trials:24 - Trial = 9621/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.578 | DEBUG    | __main__:trials:29 - Trial = 9621/30000 | Total reward = 32.32
2022-01-26 14:17:11.581 | DEBUG    | __main__:trials:24 - Trial = 9622/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.583 | DEBUG    | __main__:trials:29 - Trial = 9622/30000 | Total reward = 39.57
2022-01-26 14:17:11.587 | DEBUG    | __main__:trials:24 - Trial = 9623/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.588 | DEBUG    | __main__:trials:29 - Trial = 9623/30000 | Total reward = 61.89
2022-01-26 14:17:11.592 | DEBUG    | __main__:trials:24 - Trial = 9624/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.592 | DEBUG    | __main__:trials:29 - Trial = 9624/30000 | Total reward = 64.90
2022-01-26 14:17:11.596 | DEBUG    | __main__:trials:24 - Trial = 9625/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.598 | DEBUG    | __main__:trials:29 - Trial = 9625/30000 | Total reward = 60.68
2022-01-26 14:17:11.601 | DEBUG    | __main__:trials:24 - Trial = 9626/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.602 | DEBUG    | __main__:trials:29 - Trial = 9626/30000 | Total reward = 28.38
2022-01-26 14:17:11.606 | DEBUG    | __main__:trials:24 - Trial = 9627/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.607 | DEBUG    | __main__:trials:29 - Trial = 9627/30000 | Total reward = 47.03
2022-01-26 14:17:11.611 | DEBUG    | __main__:trials:24 - Trial = 9628/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.612 | DEBUG    | __main__:trials:29 - Trial = 9628/30000 | Total reward = 37.95
2022-01-26 14:17:11.616 | DEBUG    | __main__:trials:24 - Trial = 9629/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.617 | DEBUG    | __main__:trials:29 - Trial = 9629/30000 | Total reward = 50.49
2022-01-26 14:17:11.621 | DEBUG    | __main__:trials:24 - Trial = 9630/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.622 | DEBUG    | __main__:trials:29 - Trial = 9630/30000 | Total reward = 46.89
2022-01-26 14:17:11.626 | DEBUG    | __main__:trials:24 - Trial = 9631/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.628 | DEBUG    | __main__:trials:29 - Trial = 9631/30000 | Total reward = 49.80
2022-01-26 14:17:11.631 | DEBUG    | __main__:trials:24 - Trial = 9632/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.631 | DEBUG    | __main__:trials:29 - Trial = 9632/30000 | Total reward = 43.37
2022-01-26 14:17:11.635 | DEBUG    | __main__:trials:24 - Trial = 9633/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.635 | DEBUG    | __main__:trials:29 - Trial = 9633/30000 | Total reward = 39.95
2022-01-26 14:17:11.639 | DEBUG    | __main__:trials:24 - Trial = 9634/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.640 | DEBUG    | __main__:trials:29 - Trial = 9634/30000 | Total reward = 44.41
2022-01-26 14:17:11.644 | DEBUG    | __main__:trials:24 - Trial = 9635/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.645 | DEBUG    | __main__:trials:29 - Trial = 9635/30000 | Total reward = 46.04
2022-01-26 14:17:11.648 | DEBUG    | __main__:trials:24 - Trial = 9636/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.650 | DEBUG    | __main__:trials:29 - Trial = 9636/30000 | Total reward = 60.21
2022-01-26 14:17:11.653 | DEBUG    | __main__:trials:24 - Trial = 9637/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.654 | DEBUG    | __main__:trials:29 - Trial = 9637/30000 | Total reward = 46.57
2022-01-26 14:17:11.657 | DEBUG    | __main__:trials:24 - Trial = 9638/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.659 | DEBUG    | __main__:trials:29 - Trial = 9638/30000 | Total reward = 46.19
2022-01-26 14:17:11.662 | DEBUG    | __main__:trials:24 - Trial = 9639/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.663 | DEBUG    | __main__:trials:29 - Trial = 9639/30000 | Total reward = 41.13
2022-01-26 14:17:11.667 | DEBUG    | __main__:trials:24 - Trial = 9640/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.668 | DEBUG    | __main__:trials:29 - Trial = 9640/30000 | Total reward = 51.08
2022-01-26 14:17:11.672 | DEBUG    | __main__:trials:24 - Trial = 9641/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.673 | DEBUG    | __main__:trials:29 - Trial = 9641/30000 | Total reward = 50.99
2022-01-26 14:17:11.677 | DEBUG    | __main__:trials:24 - Trial = 9642/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.679 | DEBUG    | __main__:trials:29 - Trial = 9642/30000 | Total reward = 48.93
2022-01-26 14:17:11.682 | DEBUG    | __main__:trials:24 - Trial = 9643/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.684 | DEBUG    | __main__:trials:29 - Trial = 9643/30000 | Total reward = 65.55
2022-01-26 14:17:11.689 | DEBUG    | __main__:trials:24 - Trial = 9644/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.690 | DEBUG    | __main__:trials:29 - Trial = 9644/30000 | Total reward = 50.87
2022-01-26 14:17:11.695 | DEBUG    | __main__:trials:24 - Trial = 9645/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.695 | DEBUG    | __main__:trials:29 - Trial = 9645/30000 | Total reward = 41.01
2022-01-26 14:17:11.700 | DEBUG    | __main__:trials:24 - Trial = 9646/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.701 | DEBUG    | __main__:trials:29 - Trial = 9646/30000 | Total reward = 44.54
2022-01-26 14:17:11.705 | DEBUG    | __main__:trials:24 - Trial = 9647/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.706 | DEBUG    | __main__:trials:29 - Trial = 9647/30000 | Total reward = 41.11
2022-01-26 14:17:11.709 | DEBUG    | __main__:trials:24 - Trial = 9648/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.710 | DEBUG    | __main__:trials:29 - Trial = 9648/30000 | Total reward = 43.78
2022-01-26 14:17:11.713 | DEBUG    | __main__:trials:24 - Trial = 9649/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.715 | DEBUG    | __main__:trials:29 - Trial = 9649/30000 | Total reward = 40.15
2022-01-26 14:17:11.718 | DEBUG    | __main__:trials:24 - Trial = 9650/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.719 | DEBUG    | __main__:trials:29 - Trial = 9650/30000 | Total reward = 64.79
2022-01-26 14:17:11.723 | DEBUG    | __main__:trials:24 - Trial = 9651/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.724 | DEBUG    | __main__:trials:29 - Trial = 9651/30000 | Total reward = 47.70
2022-01-26 14:17:11.728 | DEBUG    | __main__:trials:24 - Trial = 9652/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.729 | DEBUG    | __main__:trials:29 - Trial = 9652/30000 | Total reward = 50.93
2022-01-26 14:17:11.733 | DEBUG    | __main__:trials:24 - Trial = 9653/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.734 | DEBUG    | __main__:trials:29 - Trial = 9653/30000 | Total reward = 62.59
2022-01-26 14:17:11.738 | DEBUG    | __main__:trials:24 - Trial = 9654/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.739 | DEBUG    | __main__:trials:29 - Trial = 9654/30000 | Total reward = 35.71
2022-01-26 14:17:11.743 | DEBUG    | __main__:trials:24 - Trial = 9655/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.744 | DEBUG    | __main__:trials:29 - Trial = 9655/30000 | Total reward = 58.20
2022-01-26 14:17:11.747 | DEBUG    | __main__:trials:24 - Trial = 9656/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.749 | DEBUG    | __main__:trials:29 - Trial = 9656/30000 | Total reward = 42.81
2022-01-26 14:17:11.752 | DEBUG    | __main__:trials:24 - Trial = 9657/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.753 | DEBUG    | __main__:trials:29 - Trial = 9657/30000 | Total reward = 47.74
2022-01-26 14:17:11.757 | DEBUG    | __main__:trials:24 - Trial = 9658/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.758 | DEBUG    | __main__:trials:29 - Trial = 9658/30000 | Total reward = 47.30
2022-01-26 14:17:11.762 | DEBUG    | __main__:trials:24 - Trial = 9659/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.764 | DEBUG    | __main__:trials:29 - Trial = 9659/30000 | Total reward = 43.56
2022-01-26 14:17:11.767 | DEBUG    | __main__:trials:24 - Trial = 9660/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.769 | DEBUG    | __main__:trials:29 - Trial = 9660/30000 | Total reward = 45.25
2022-01-26 14:17:11.772 | DEBUG    | __main__:trials:24 - Trial = 9661/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.774 | DEBUG    | __main__:trials:29 - Trial = 9661/30000 | Total reward = 51.43
2022-01-26 14:17:11.778 | DEBUG    | __main__:trials:24 - Trial = 9662/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.779 | DEBUG    | __main__:trials:29 - Trial = 9662/30000 | Total reward = 50.06
2022-01-26 14:17:11.783 | DEBUG    | __main__:trials:24 - Trial = 9663/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.784 | DEBUG    | __main__:trials:29 - Trial = 9663/30000 | Total reward = 58.11
2022-01-26 14:17:11.788 | DEBUG    | __main__:trials:24 - Trial = 9664/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.790 | DEBUG    | __main__:trials:29 - Trial = 9664/30000 | Total reward = 67.49
2022-01-26 14:17:11.793 | DEBUG    | __main__:trials:24 - Trial = 9665/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.794 | DEBUG    | __main__:trials:29 - Trial = 9665/30000 | Total reward = 46.91
2022-01-26 14:17:11.798 | DEBUG    | __main__:trials:24 - Trial = 9666/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.799 | DEBUG    | __main__:trials:29 - Trial = 9666/30000 | Total reward = 45.45
2022-01-26 14:17:11.802 | DEBUG    | __main__:trials:24 - Trial = 9667/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.804 | DEBUG    | __main__:trials:29 - Trial = 9667/30000 | Total reward = 40.44
2022-01-26 14:17:11.807 | DEBUG    | __main__:trials:24 - Trial = 9668/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.808 | DEBUG    | __main__:trials:29 - Trial = 9668/30000 | Total reward = 39.66
2022-01-26 14:17:11.811 | DEBUG    | __main__:trials:24 - Trial = 9669/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.813 | DEBUG    | __main__:trials:29 - Trial = 9669/30000 | Total reward = 34.98
2022-01-26 14:17:11.816 | DEBUG    | __main__:trials:24 - Trial = 9670/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.818 | DEBUG    | __main__:trials:29 - Trial = 9670/30000 | Total reward = 55.26
2022-01-26 14:17:11.821 | DEBUG    | __main__:trials:24 - Trial = 9671/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.822 | DEBUG    | __main__:trials:29 - Trial = 9671/30000 | Total reward = 46.31
2022-01-26 14:17:11.826 | DEBUG    | __main__:trials:24 - Trial = 9672/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.827 | DEBUG    | __main__:trials:29 - Trial = 9672/30000 | Total reward = 41.45
2022-01-26 14:17:11.831 | DEBUG    | __main__:trials:24 - Trial = 9673/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.832 | DEBUG    | __main__:trials:29 - Trial = 9673/30000 | Total reward = 40.50
2022-01-26 14:17:11.835 | DEBUG    | __main__:trials:24 - Trial = 9674/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.837 | DEBUG    | __main__:trials:29 - Trial = 9674/30000 | Total reward = 35.06
2022-01-26 14:17:11.840 | DEBUG    | __main__:trials:24 - Trial = 9675/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.842 | DEBUG    | __main__:trials:29 - Trial = 9675/30000 | Total reward = 49.63
2022-01-26 14:17:11.845 | DEBUG    | __main__:trials:24 - Trial = 9676/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.847 | DEBUG    | __main__:trials:29 - Trial = 9676/30000 | Total reward = 41.47
2022-01-26 14:17:11.850 | DEBUG    | __main__:trials:24 - Trial = 9677/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.851 | DEBUG    | __main__:trials:29 - Trial = 9677/30000 | Total reward = 45.25
2022-01-26 14:17:11.855 | DEBUG    | __main__:trials:24 - Trial = 9678/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.857 | DEBUG    | __main__:trials:29 - Trial = 9678/30000 | Total reward = 47.48
2022-01-26 14:17:11.860 | DEBUG    | __main__:trials:24 - Trial = 9679/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.862 | DEBUG    | __main__:trials:29 - Trial = 9679/30000 | Total reward = 45.58
2022-01-26 14:17:11.865 | DEBUG    | __main__:trials:24 - Trial = 9680/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.866 | DEBUG    | __main__:trials:29 - Trial = 9680/30000 | Total reward = 47.48
2022-01-26 14:17:11.870 | DEBUG    | __main__:trials:24 - Trial = 9681/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.871 | DEBUG    | __main__:trials:29 - Trial = 9681/30000 | Total reward = 38.12
2022-01-26 14:17:11.875 | DEBUG    | __main__:trials:24 - Trial = 9682/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.876 | DEBUG    | __main__:trials:29 - Trial = 9682/30000 | Total reward = 66.16
2022-01-26 14:17:11.880 | DEBUG    | __main__:trials:24 - Trial = 9683/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.880 | DEBUG    | __main__:trials:29 - Trial = 9683/30000 | Total reward = 41.43
2022-01-26 14:17:11.885 | DEBUG    | __main__:trials:24 - Trial = 9684/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.886 | DEBUG    | __main__:trials:29 - Trial = 9684/30000 | Total reward = 38.39
2022-01-26 14:17:11.890 | DEBUG    | __main__:trials:24 - Trial = 9685/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.891 | DEBUG    | __main__:trials:29 - Trial = 9685/30000 | Total reward = 45.24
2022-01-26 14:17:11.895 | DEBUG    | __main__:trials:24 - Trial = 9686/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.895 | DEBUG    | __main__:trials:29 - Trial = 9686/30000 | Total reward = 62.47
2022-01-26 14:17:11.899 | DEBUG    | __main__:trials:24 - Trial = 9687/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.901 | DEBUG    | __main__:trials:29 - Trial = 9687/30000 | Total reward = 45.11
2022-01-26 14:17:11.904 | DEBUG    | __main__:trials:24 - Trial = 9688/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.905 | DEBUG    | __main__:trials:29 - Trial = 9688/30000 | Total reward = 38.43
2022-01-26 14:17:11.909 | DEBUG    | __main__:trials:24 - Trial = 9689/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.911 | DEBUG    | __main__:trials:29 - Trial = 9689/30000 | Total reward = 46.81
2022-01-26 14:17:11.914 | DEBUG    | __main__:trials:24 - Trial = 9690/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.915 | DEBUG    | __main__:trials:29 - Trial = 9690/30000 | Total reward = 47.03
2022-01-26 14:17:11.919 | DEBUG    | __main__:trials:24 - Trial = 9691/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.920 | DEBUG    | __main__:trials:29 - Trial = 9691/30000 | Total reward = 42.81
2022-01-26 14:17:11.924 | DEBUG    | __main__:trials:24 - Trial = 9692/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.926 | DEBUG    | __main__:trials:29 - Trial = 9692/30000 | Total reward = 50.60
2022-01-26 14:17:11.929 | DEBUG    | __main__:trials:24 - Trial = 9693/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.930 | DEBUG    | __main__:trials:29 - Trial = 9693/30000 | Total reward = 42.76
2022-01-26 14:17:11.934 | DEBUG    | __main__:trials:24 - Trial = 9694/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.936 | DEBUG    | __main__:trials:29 - Trial = 9694/30000 | Total reward = 50.42
2022-01-26 14:17:11.939 | DEBUG    | __main__:trials:24 - Trial = 9695/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.941 | DEBUG    | __main__:trials:29 - Trial = 9695/30000 | Total reward = 35.65
2022-01-26 14:17:11.944 | DEBUG    | __main__:trials:24 - Trial = 9696/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.946 | DEBUG    | __main__:trials:29 - Trial = 9696/30000 | Total reward = 35.10
2022-01-26 14:17:11.950 | DEBUG    | __main__:trials:24 - Trial = 9697/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.951 | DEBUG    | __main__:trials:29 - Trial = 9697/30000 | Total reward = 45.08
2022-01-26 14:17:11.955 | DEBUG    | __main__:trials:24 - Trial = 9698/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.956 | DEBUG    | __main__:trials:29 - Trial = 9698/30000 | Total reward = 47.93
2022-01-26 14:17:11.960 | DEBUG    | __main__:trials:24 - Trial = 9699/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.962 | DEBUG    | __main__:trials:29 - Trial = 9699/30000 | Total reward = 47.45
2022-01-26 14:17:11.965 | DEBUG    | __main__:trials:24 - Trial = 9700/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.967 | DEBUG    | __main__:trials:29 - Trial = 9700/30000 | Total reward = 50.69
2022-01-26 14:17:11.970 | DEBUG    | __main__:trials:24 - Trial = 9701/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.971 | DEBUG    | __main__:trials:29 - Trial = 9701/30000 | Total reward = 45.05
2022-01-26 14:17:11.976 | DEBUG    | __main__:trials:24 - Trial = 9702/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.977 | DEBUG    | __main__:trials:29 - Trial = 9702/30000 | Total reward = 46.40
2022-01-26 14:17:11.981 | DEBUG    | __main__:trials:24 - Trial = 9703/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.981 | DEBUG    | __main__:trials:29 - Trial = 9703/30000 | Total reward = 49.00
2022-01-26 14:17:11.985 | DEBUG    | __main__:trials:24 - Trial = 9704/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.986 | DEBUG    | __main__:trials:29 - Trial = 9704/30000 | Total reward = 44.24
2022-01-26 14:17:11.990 | DEBUG    | __main__:trials:24 - Trial = 9705/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.991 | DEBUG    | __main__:trials:29 - Trial = 9705/30000 | Total reward = 27.89
2022-01-26 14:17:11.995 | DEBUG    | __main__:trials:24 - Trial = 9706/30000 | Max number of steps (20) reached
2022-01-26 14:17:11.997 | DEBUG    | __main__:trials:29 - Trial = 9706/30000 | Total reward = 46.78
2022-01-26 14:17:12.000 | DEBUG    | __main__:trials:24 - Trial = 9707/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.002 | DEBUG    | __main__:trials:29 - Trial = 9707/30000 | Total reward = 44.05
2022-01-26 14:17:12.006 | DEBUG    | __main__:trials:24 - Trial = 9708/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.007 | DEBUG    | __main__:trials:29 - Trial = 9708/30000 | Total reward = 44.65
2022-01-26 14:17:12.011 | DEBUG    | __main__:trials:24 - Trial = 9709/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.011 | DEBUG    | __main__:trials:29 - Trial = 9709/30000 | Total reward = 36.21
2022-01-26 14:17:12.016 | DEBUG    | __main__:trials:24 - Trial = 9710/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.017 | DEBUG    | __main__:trials:29 - Trial = 9710/30000 | Total reward = 53.79
2022-01-26 14:17:12.021 | DEBUG    | __main__:trials:24 - Trial = 9711/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.021 | DEBUG    | __main__:trials:29 - Trial = 9711/30000 | Total reward = 47.56
2022-01-26 14:17:12.025 | DEBUG    | __main__:trials:24 - Trial = 9712/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.027 | DEBUG    | __main__:trials:29 - Trial = 9712/30000 | Total reward = 58.00
2022-01-26 14:17:12.030 | DEBUG    | __main__:trials:24 - Trial = 9713/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.032 | DEBUG    | __main__:trials:29 - Trial = 9713/30000 | Total reward = 40.33
2022-01-26 14:17:12.036 | DEBUG    | __main__:trials:24 - Trial = 9714/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.037 | DEBUG    | __main__:trials:29 - Trial = 9714/30000 | Total reward = 46.38
2022-01-26 14:17:12.041 | DEBUG    | __main__:trials:24 - Trial = 9715/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.042 | DEBUG    | __main__:trials:29 - Trial = 9715/30000 | Total reward = 49.14
2022-01-26 14:17:12.046 | DEBUG    | __main__:trials:24 - Trial = 9716/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.046 | DEBUG    | __main__:trials:29 - Trial = 9716/30000 | Total reward = 47.50
2022-01-26 14:17:12.050 | DEBUG    | __main__:trials:24 - Trial = 9717/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.051 | DEBUG    | __main__:trials:29 - Trial = 9717/30000 | Total reward = 47.54
2022-01-26 14:17:12.055 | DEBUG    | __main__:trials:24 - Trial = 9718/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.057 | DEBUG    | __main__:trials:29 - Trial = 9718/30000 | Total reward = 42.37
2022-01-26 14:17:12.060 | DEBUG    | __main__:trials:24 - Trial = 9719/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.062 | DEBUG    | __main__:trials:29 - Trial = 9719/30000 | Total reward = 45.55
2022-01-26 14:17:12.065 | DEBUG    | __main__:trials:24 - Trial = 9720/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.066 | DEBUG    | __main__:trials:29 - Trial = 9720/30000 | Total reward = 44.89
2022-01-26 14:17:12.070 | DEBUG    | __main__:trials:24 - Trial = 9721/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.072 | DEBUG    | __main__:trials:29 - Trial = 9721/30000 | Total reward = 66.05
2022-01-26 14:17:12.075 | DEBUG    | __main__:trials:24 - Trial = 9722/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.076 | DEBUG    | __main__:trials:29 - Trial = 9722/30000 | Total reward = 62.46
2022-01-26 14:17:12.080 | DEBUG    | __main__:trials:24 - Trial = 9723/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.081 | DEBUG    | __main__:trials:29 - Trial = 9723/30000 | Total reward = 40.83
2022-01-26 14:17:12.085 | DEBUG    | __main__:trials:24 - Trial = 9724/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.086 | DEBUG    | __main__:trials:29 - Trial = 9724/30000 | Total reward = 45.40
2022-01-26 14:17:12.090 | DEBUG    | __main__:trials:24 - Trial = 9725/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.091 | DEBUG    | __main__:trials:29 - Trial = 9725/30000 | Total reward = 50.13
2022-01-26 14:17:12.094 | DEBUG    | __main__:trials:24 - Trial = 9726/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.094 | DEBUG    | __main__:trials:29 - Trial = 9726/30000 | Total reward = 38.68
2022-01-26 14:17:12.098 | DEBUG    | __main__:trials:24 - Trial = 9727/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.100 | DEBUG    | __main__:trials:29 - Trial = 9727/30000 | Total reward = 39.08
2022-01-26 14:17:12.102 | DEBUG    | __main__:trials:24 - Trial = 9728/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.104 | DEBUG    | __main__:trials:29 - Trial = 9728/30000 | Total reward = 55.43
2022-01-26 14:17:12.107 | DEBUG    | __main__:trials:24 - Trial = 9729/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.109 | DEBUG    | __main__:trials:29 - Trial = 9729/30000 | Total reward = 47.93
2022-01-26 14:17:12.112 | DEBUG    | __main__:trials:24 - Trial = 9730/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.114 | DEBUG    | __main__:trials:29 - Trial = 9730/30000 | Total reward = 60.82
2022-01-26 14:17:12.118 | DEBUG    | __main__:trials:24 - Trial = 9731/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.118 | DEBUG    | __main__:trials:29 - Trial = 9731/30000 | Total reward = 40.76
2022-01-26 14:17:12.122 | DEBUG    | __main__:trials:24 - Trial = 9732/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.124 | DEBUG    | __main__:trials:29 - Trial = 9732/30000 | Total reward = 28.11
2022-01-26 14:17:12.128 | DEBUG    | __main__:trials:24 - Trial = 9733/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.129 | DEBUG    | __main__:trials:29 - Trial = 9733/30000 | Total reward = 47.87
2022-01-26 14:17:12.132 | DEBUG    | __main__:trials:24 - Trial = 9734/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.134 | DEBUG    | __main__:trials:29 - Trial = 9734/30000 | Total reward = 48.68
2022-01-26 14:17:12.138 | DEBUG    | __main__:trials:24 - Trial = 9735/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.139 | DEBUG    | __main__:trials:29 - Trial = 9735/30000 | Total reward = 53.64
2022-01-26 14:17:12.143 | DEBUG    | __main__:trials:24 - Trial = 9736/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.144 | DEBUG    | __main__:trials:29 - Trial = 9736/30000 | Total reward = 45.84
2022-01-26 14:17:12.148 | DEBUG    | __main__:trials:24 - Trial = 9737/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.149 | DEBUG    | __main__:trials:29 - Trial = 9737/30000 | Total reward = 64.49
2022-01-26 14:17:12.152 | DEBUG    | __main__:trials:24 - Trial = 9738/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.154 | DEBUG    | __main__:trials:29 - Trial = 9738/30000 | Total reward = 40.97
2022-01-26 14:17:12.157 | DEBUG    | __main__:trials:24 - Trial = 9739/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.158 | DEBUG    | __main__:trials:29 - Trial = 9739/30000 | Total reward = 38.26
2022-01-26 14:17:12.162 | DEBUG    | __main__:trials:24 - Trial = 9740/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.163 | DEBUG    | __main__:trials:29 - Trial = 9740/30000 | Total reward = 43.53
2022-01-26 14:17:12.167 | DEBUG    | __main__:trials:24 - Trial = 9741/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.168 | DEBUG    | __main__:trials:29 - Trial = 9741/30000 | Total reward = 47.50
2022-01-26 14:17:12.171 | DEBUG    | __main__:trials:24 - Trial = 9742/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.173 | DEBUG    | __main__:trials:29 - Trial = 9742/30000 | Total reward = 35.26
2022-01-26 14:17:12.176 | DEBUG    | __main__:trials:24 - Trial = 9743/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.178 | DEBUG    | __main__:trials:29 - Trial = 9743/30000 | Total reward = 32.97
2022-01-26 14:17:12.181 | DEBUG    | __main__:trials:24 - Trial = 9744/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.183 | DEBUG    | __main__:trials:29 - Trial = 9744/30000 | Total reward = 46.43
2022-01-26 14:17:12.187 | DEBUG    | __main__:trials:24 - Trial = 9745/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.187 | DEBUG    | __main__:trials:29 - Trial = 9745/30000 | Total reward = 61.97
2022-01-26 14:17:12.192 | DEBUG    | __main__:trials:24 - Trial = 9746/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.192 | DEBUG    | __main__:trials:29 - Trial = 9746/30000 | Total reward = 35.44
2022-01-26 14:17:12.196 | DEBUG    | __main__:trials:24 - Trial = 9747/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.197 | DEBUG    | __main__:trials:29 - Trial = 9747/30000 | Total reward = 55.70
2022-01-26 14:17:12.201 | DEBUG    | __main__:trials:24 - Trial = 9748/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.202 | DEBUG    | __main__:trials:29 - Trial = 9748/30000 | Total reward = 40.97
2022-01-26 14:17:12.206 | DEBUG    | __main__:trials:24 - Trial = 9749/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.208 | DEBUG    | __main__:trials:29 - Trial = 9749/30000 | Total reward = 49.63
2022-01-26 14:17:12.211 | DEBUG    | __main__:trials:24 - Trial = 9750/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.213 | DEBUG    | __main__:trials:29 - Trial = 9750/30000 | Total reward = 34.79
2022-01-26 14:17:12.216 | DEBUG    | __main__:trials:24 - Trial = 9751/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.217 | DEBUG    | __main__:trials:29 - Trial = 9751/30000 | Total reward = 55.18
2022-01-26 14:17:12.220 | DEBUG    | __main__:trials:24 - Trial = 9752/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.221 | DEBUG    | __main__:trials:29 - Trial = 9752/30000 | Total reward = 44.74
2022-01-26 14:17:12.226 | DEBUG    | __main__:trials:24 - Trial = 9753/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.226 | DEBUG    | __main__:trials:29 - Trial = 9753/30000 | Total reward = 46.41
2022-01-26 14:17:12.231 | DEBUG    | __main__:trials:24 - Trial = 9754/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.231 | DEBUG    | __main__:trials:29 - Trial = 9754/30000 | Total reward = 42.84
2022-01-26 14:17:12.236 | DEBUG    | __main__:trials:24 - Trial = 9755/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.237 | DEBUG    | __main__:trials:29 - Trial = 9755/30000 | Total reward = 48.50
2022-01-26 14:17:12.241 | DEBUG    | __main__:trials:24 - Trial = 9756/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.242 | DEBUG    | __main__:trials:29 - Trial = 9756/30000 | Total reward = 42.27
2022-01-26 14:17:12.246 | DEBUG    | __main__:trials:24 - Trial = 9757/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.248 | DEBUG    | __main__:trials:29 - Trial = 9757/30000 | Total reward = 39.52
2022-01-26 14:17:12.251 | DEBUG    | __main__:trials:24 - Trial = 9758/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.253 | DEBUG    | __main__:trials:29 - Trial = 9758/30000 | Total reward = 45.73
2022-01-26 14:17:12.256 | DEBUG    | __main__:trials:24 - Trial = 9759/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.257 | DEBUG    | __main__:trials:29 - Trial = 9759/30000 | Total reward = 41.37
2022-01-26 14:17:12.260 | DEBUG    | __main__:trials:24 - Trial = 9760/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.262 | DEBUG    | __main__:trials:29 - Trial = 9760/30000 | Total reward = 43.18
2022-01-26 14:17:12.266 | DEBUG    | __main__:trials:24 - Trial = 9761/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.266 | DEBUG    | __main__:trials:29 - Trial = 9761/30000 | Total reward = 58.47
2022-01-26 14:17:12.270 | DEBUG    | __main__:trials:24 - Trial = 9762/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.271 | DEBUG    | __main__:trials:29 - Trial = 9762/30000 | Total reward = 39.46
2022-01-26 14:17:12.275 | DEBUG    | __main__:trials:24 - Trial = 9763/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.277 | DEBUG    | __main__:trials:29 - Trial = 9763/30000 | Total reward = 41.47
2022-01-26 14:17:12.280 | DEBUG    | __main__:trials:24 - Trial = 9764/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.282 | DEBUG    | __main__:trials:29 - Trial = 9764/30000 | Total reward = 66.07
2022-01-26 14:17:12.285 | DEBUG    | __main__:trials:24 - Trial = 9765/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.286 | DEBUG    | __main__:trials:29 - Trial = 9765/30000 | Total reward = 46.15
2022-01-26 14:17:12.291 | DEBUG    | __main__:trials:24 - Trial = 9766/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.291 | DEBUG    | __main__:trials:29 - Trial = 9766/30000 | Total reward = 46.73
2022-01-26 14:17:12.295 | DEBUG    | __main__:trials:24 - Trial = 9767/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.297 | DEBUG    | __main__:trials:29 - Trial = 9767/30000 | Total reward = 65.00
2022-01-26 14:17:12.301 | DEBUG    | __main__:trials:24 - Trial = 9768/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.301 | DEBUG    | __main__:trials:29 - Trial = 9768/30000 | Total reward = 40.03
2022-01-26 14:17:12.305 | DEBUG    | __main__:trials:24 - Trial = 9769/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.306 | DEBUG    | __main__:trials:29 - Trial = 9769/30000 | Total reward = 49.06
2022-01-26 14:17:12.309 | DEBUG    | __main__:trials:24 - Trial = 9770/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.311 | DEBUG    | __main__:trials:29 - Trial = 9770/30000 | Total reward = 36.85
2022-01-26 14:17:12.315 | DEBUG    | __main__:trials:24 - Trial = 9771/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.315 | DEBUG    | __main__:trials:29 - Trial = 9771/30000 | Total reward = 49.56
2022-01-26 14:17:12.320 | DEBUG    | __main__:trials:24 - Trial = 9772/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.321 | DEBUG    | __main__:trials:29 - Trial = 9772/30000 | Total reward = 45.16
2022-01-26 14:17:12.325 | DEBUG    | __main__:trials:24 - Trial = 9773/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.326 | DEBUG    | __main__:trials:29 - Trial = 9773/30000 | Total reward = 39.44
2022-01-26 14:17:12.330 | DEBUG    | __main__:trials:24 - Trial = 9774/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.332 | DEBUG    | __main__:trials:29 - Trial = 9774/30000 | Total reward = 41.06
2022-01-26 14:17:12.335 | DEBUG    | __main__:trials:24 - Trial = 9775/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.337 | DEBUG    | __main__:trials:29 - Trial = 9775/30000 | Total reward = 43.47
2022-01-26 14:17:12.340 | DEBUG    | __main__:trials:24 - Trial = 9776/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.342 | DEBUG    | __main__:trials:29 - Trial = 9776/30000 | Total reward = 46.41
2022-01-26 14:17:12.345 | DEBUG    | __main__:trials:24 - Trial = 9777/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.346 | DEBUG    | __main__:trials:29 - Trial = 9777/30000 | Total reward = 43.33
2022-01-26 14:17:12.350 | DEBUG    | __main__:trials:24 - Trial = 9778/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.352 | DEBUG    | __main__:trials:29 - Trial = 9778/30000 | Total reward = 64.37
2022-01-26 14:17:12.355 | DEBUG    | __main__:trials:24 - Trial = 9779/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.356 | DEBUG    | __main__:trials:29 - Trial = 9779/30000 | Total reward = 49.93
2022-01-26 14:17:12.360 | DEBUG    | __main__:trials:24 - Trial = 9780/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.362 | DEBUG    | __main__:trials:29 - Trial = 9780/30000 | Total reward = 43.13
2022-01-26 14:17:12.365 | DEBUG    | __main__:trials:24 - Trial = 9781/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.366 | DEBUG    | __main__:trials:29 - Trial = 9781/30000 | Total reward = 40.44
2022-01-26 14:17:12.370 | DEBUG    | __main__:trials:24 - Trial = 9782/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.372 | DEBUG    | __main__:trials:29 - Trial = 9782/30000 | Total reward = 42.66
2022-01-26 14:17:12.375 | DEBUG    | __main__:trials:24 - Trial = 9783/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.376 | DEBUG    | __main__:trials:29 - Trial = 9783/30000 | Total reward = 42.65
2022-01-26 14:17:12.380 | DEBUG    | __main__:trials:24 - Trial = 9784/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.381 | DEBUG    | __main__:trials:29 - Trial = 9784/30000 | Total reward = 29.25
2022-01-26 14:17:12.385 | DEBUG    | __main__:trials:24 - Trial = 9785/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.386 | DEBUG    | __main__:trials:29 - Trial = 9785/30000 | Total reward = 29.14
2022-01-26 14:17:12.390 | DEBUG    | __main__:trials:24 - Trial = 9786/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.391 | DEBUG    | __main__:trials:29 - Trial = 9786/30000 | Total reward = 47.66
2022-01-26 14:17:12.395 | DEBUG    | __main__:trials:24 - Trial = 9787/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.397 | DEBUG    | __main__:trials:29 - Trial = 9787/30000 | Total reward = 47.28
2022-01-26 14:17:12.400 | DEBUG    | __main__:trials:24 - Trial = 9788/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.402 | DEBUG    | __main__:trials:29 - Trial = 9788/30000 | Total reward = 46.95
2022-01-26 14:17:12.405 | DEBUG    | __main__:trials:24 - Trial = 9789/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.406 | DEBUG    | __main__:trials:29 - Trial = 9789/30000 | Total reward = 50.07
2022-01-26 14:17:12.409 | DEBUG    | __main__:trials:24 - Trial = 9790/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.411 | DEBUG    | __main__:trials:29 - Trial = 9790/30000 | Total reward = 57.66
2022-01-26 14:17:12.413 | DEBUG    | __main__:trials:24 - Trial = 9791/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.415 | DEBUG    | __main__:trials:29 - Trial = 9791/30000 | Total reward = 51.52
2022-01-26 14:17:12.418 | DEBUG    | __main__:trials:24 - Trial = 9792/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.420 | DEBUG    | __main__:trials:29 - Trial = 9792/30000 | Total reward = 50.86
2022-01-26 14:17:12.424 | DEBUG    | __main__:trials:24 - Trial = 9793/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.425 | DEBUG    | __main__:trials:29 - Trial = 9793/30000 | Total reward = 43.04
2022-01-26 14:17:12.428 | DEBUG    | __main__:trials:24 - Trial = 9794/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.430 | DEBUG    | __main__:trials:29 - Trial = 9794/30000 | Total reward = 41.58
2022-01-26 14:17:12.433 | DEBUG    | __main__:trials:24 - Trial = 9795/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.434 | DEBUG    | __main__:trials:29 - Trial = 9795/30000 | Total reward = 56.52
2022-01-26 14:17:12.437 | DEBUG    | __main__:trials:24 - Trial = 9796/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.438 | DEBUG    | __main__:trials:29 - Trial = 9796/30000 | Total reward = 54.75
2022-01-26 14:17:12.442 | DEBUG    | __main__:trials:24 - Trial = 9797/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.443 | DEBUG    | __main__:trials:29 - Trial = 9797/30000 | Total reward = 49.11
2022-01-26 14:17:12.446 | DEBUG    | __main__:trials:24 - Trial = 9798/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.448 | DEBUG    | __main__:trials:29 - Trial = 9798/30000 | Total reward = 46.54
2022-01-26 14:17:12.452 | DEBUG    | __main__:trials:24 - Trial = 9799/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.453 | DEBUG    | __main__:trials:29 - Trial = 9799/30000 | Total reward = 23.74
2022-01-26 14:17:12.457 | DEBUG    | __main__:trials:24 - Trial = 9800/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.458 | DEBUG    | __main__:trials:29 - Trial = 9800/30000 | Total reward = 35.74
2022-01-26 14:17:12.461 | DEBUG    | __main__:trials:24 - Trial = 9801/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.462 | DEBUG    | __main__:trials:29 - Trial = 9801/30000 | Total reward = 47.39
2022-01-26 14:17:12.465 | DEBUG    | __main__:trials:24 - Trial = 9802/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.467 | DEBUG    | __main__:trials:29 - Trial = 9802/30000 | Total reward = 49.82
2022-01-26 14:17:12.470 | DEBUG    | __main__:trials:24 - Trial = 9803/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.470 | DEBUG    | __main__:trials:29 - Trial = 9803/30000 | Total reward = 48.03
2022-01-26 14:17:12.474 | DEBUG    | __main__:trials:24 - Trial = 9804/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.474 | DEBUG    | __main__:trials:29 - Trial = 9804/30000 | Total reward = 51.23
2022-01-26 14:17:12.478 | DEBUG    | __main__:trials:24 - Trial = 9805/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.479 | DEBUG    | __main__:trials:29 - Trial = 9805/30000 | Total reward = 41.87
2022-01-26 14:17:12.482 | DEBUG    | __main__:trials:24 - Trial = 9806/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.483 | DEBUG    | __main__:trials:29 - Trial = 9806/30000 | Total reward = 45.43
2022-01-26 14:17:12.486 | DEBUG    | __main__:trials:24 - Trial = 9807/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.487 | DEBUG    | __main__:trials:29 - Trial = 9807/30000 | Total reward = 47.02
2022-01-26 14:17:12.490 | DEBUG    | __main__:trials:24 - Trial = 9808/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.491 | DEBUG    | __main__:trials:29 - Trial = 9808/30000 | Total reward = 43.78
2022-01-26 14:17:12.494 | DEBUG    | __main__:trials:24 - Trial = 9809/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.496 | DEBUG    | __main__:trials:29 - Trial = 9809/30000 | Total reward = 44.59
2022-01-26 14:17:12.499 | DEBUG    | __main__:trials:24 - Trial = 9810/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.499 | DEBUG    | __main__:trials:29 - Trial = 9810/30000 | Total reward = 48.45
2022-01-26 14:17:12.503 | DEBUG    | __main__:trials:24 - Trial = 9811/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.505 | DEBUG    | __main__:trials:29 - Trial = 9811/30000 | Total reward = 45.79
2022-01-26 14:17:12.508 | DEBUG    | __main__:trials:24 - Trial = 9812/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.508 | DEBUG    | __main__:trials:29 - Trial = 9812/30000 | Total reward = 45.69
2022-01-26 14:17:12.511 | DEBUG    | __main__:trials:24 - Trial = 9813/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.512 | DEBUG    | __main__:trials:29 - Trial = 9813/30000 | Total reward = 64.17
2022-01-26 14:17:12.515 | DEBUG    | __main__:trials:24 - Trial = 9814/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.515 | DEBUG    | __main__:trials:29 - Trial = 9814/30000 | Total reward = 39.82
2022-01-26 14:17:12.519 | DEBUG    | __main__:trials:24 - Trial = 9815/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.520 | DEBUG    | __main__:trials:29 - Trial = 9815/30000 | Total reward = 47.58
2022-01-26 14:17:12.523 | DEBUG    | __main__:trials:24 - Trial = 9816/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.525 | DEBUG    | __main__:trials:29 - Trial = 9816/30000 | Total reward = 46.99
2022-01-26 14:17:12.527 | DEBUG    | __main__:trials:24 - Trial = 9817/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.528 | DEBUG    | __main__:trials:29 - Trial = 9817/30000 | Total reward = 51.74
2022-01-26 14:17:12.531 | DEBUG    | __main__:trials:24 - Trial = 9818/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.531 | DEBUG    | __main__:trials:29 - Trial = 9818/30000 | Total reward = 59.35
2022-01-26 14:17:12.535 | DEBUG    | __main__:trials:24 - Trial = 9819/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.535 | DEBUG    | __main__:trials:29 - Trial = 9819/30000 | Total reward = 49.55
2022-01-26 14:17:12.539 | DEBUG    | __main__:trials:24 - Trial = 9820/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.541 | DEBUG    | __main__:trials:29 - Trial = 9820/30000 | Total reward = 33.89
2022-01-26 14:17:12.544 | DEBUG    | __main__:trials:24 - Trial = 9821/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.545 | DEBUG    | __main__:trials:29 - Trial = 9821/30000 | Total reward = 47.50
2022-01-26 14:17:12.548 | DEBUG    | __main__:trials:24 - Trial = 9822/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.549 | DEBUG    | __main__:trials:29 - Trial = 9822/30000 | Total reward = 61.48
2022-01-26 14:17:12.552 | DEBUG    | __main__:trials:24 - Trial = 9823/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.553 | DEBUG    | __main__:trials:29 - Trial = 9823/30000 | Total reward = 47.74
2022-01-26 14:17:12.557 | DEBUG    | __main__:trials:24 - Trial = 9824/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.557 | DEBUG    | __main__:trials:29 - Trial = 9824/30000 | Total reward = 58.17
2022-01-26 14:17:12.561 | DEBUG    | __main__:trials:24 - Trial = 9825/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.562 | DEBUG    | __main__:trials:29 - Trial = 9825/30000 | Total reward = 64.99
2022-01-26 14:17:12.565 | DEBUG    | __main__:trials:24 - Trial = 9826/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.566 | DEBUG    | __main__:trials:29 - Trial = 9826/30000 | Total reward = 48.96
2022-01-26 14:17:12.570 | DEBUG    | __main__:trials:24 - Trial = 9827/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.571 | DEBUG    | __main__:trials:29 - Trial = 9827/30000 | Total reward = 66.12
2022-01-26 14:17:12.574 | DEBUG    | __main__:trials:24 - Trial = 9828/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.575 | DEBUG    | __main__:trials:29 - Trial = 9828/30000 | Total reward = 47.62
2022-01-26 14:17:12.578 | DEBUG    | __main__:trials:24 - Trial = 9829/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.579 | DEBUG    | __main__:trials:29 - Trial = 9829/30000 | Total reward = 56.89
2022-01-26 14:17:12.582 | DEBUG    | __main__:trials:24 - Trial = 9830/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.583 | DEBUG    | __main__:trials:29 - Trial = 9830/30000 | Total reward = 46.82
2022-01-26 14:17:12.586 | DEBUG    | __main__:trials:24 - Trial = 9831/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.588 | DEBUG    | __main__:trials:29 - Trial = 9831/30000 | Total reward = 45.20
2022-01-26 14:17:12.591 | DEBUG    | __main__:trials:24 - Trial = 9832/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.592 | DEBUG    | __main__:trials:29 - Trial = 9832/30000 | Total reward = 50.59
2022-01-26 14:17:12.595 | DEBUG    | __main__:trials:24 - Trial = 9833/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.596 | DEBUG    | __main__:trials:29 - Trial = 9833/30000 | Total reward = 47.50
2022-01-26 14:17:12.599 | DEBUG    | __main__:trials:24 - Trial = 9834/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.600 | DEBUG    | __main__:trials:29 - Trial = 9834/30000 | Total reward = 40.68
2022-01-26 14:17:12.603 | DEBUG    | __main__:trials:24 - Trial = 9835/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.604 | DEBUG    | __main__:trials:29 - Trial = 9835/30000 | Total reward = 46.52
2022-01-26 14:17:12.608 | DEBUG    | __main__:trials:24 - Trial = 9836/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.608 | DEBUG    | __main__:trials:29 - Trial = 9836/30000 | Total reward = 67.31
2022-01-26 14:17:12.612 | DEBUG    | __main__:trials:24 - Trial = 9837/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.614 | DEBUG    | __main__:trials:29 - Trial = 9837/30000 | Total reward = 44.66
2022-01-26 14:17:12.617 | DEBUG    | __main__:trials:24 - Trial = 9838/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.618 | DEBUG    | __main__:trials:29 - Trial = 9838/30000 | Total reward = 44.00
2022-01-26 14:17:12.621 | DEBUG    | __main__:trials:24 - Trial = 9839/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.622 | DEBUG    | __main__:trials:29 - Trial = 9839/30000 | Total reward = 64.37
2022-01-26 14:17:12.625 | DEBUG    | __main__:trials:24 - Trial = 9840/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.626 | DEBUG    | __main__:trials:29 - Trial = 9840/30000 | Total reward = 52.11
2022-01-26 14:17:12.630 | DEBUG    | __main__:trials:24 - Trial = 9841/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.632 | DEBUG    | __main__:trials:29 - Trial = 9841/30000 | Total reward = 54.30
2022-01-26 14:17:12.635 | DEBUG    | __main__:trials:24 - Trial = 9842/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.637 | DEBUG    | __main__:trials:29 - Trial = 9842/30000 | Total reward = 43.83
2022-01-26 14:17:12.640 | DEBUG    | __main__:trials:24 - Trial = 9843/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.641 | DEBUG    | __main__:trials:29 - Trial = 9843/30000 | Total reward = 47.69
2022-01-26 14:17:12.646 | DEBUG    | __main__:trials:24 - Trial = 9844/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.646 | DEBUG    | __main__:trials:29 - Trial = 9844/30000 | Total reward = 41.69
2022-01-26 14:17:12.651 | DEBUG    | __main__:trials:24 - Trial = 9845/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.652 | DEBUG    | __main__:trials:29 - Trial = 9845/30000 | Total reward = 59.66
2022-01-26 14:17:12.656 | DEBUG    | __main__:trials:24 - Trial = 9846/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.658 | DEBUG    | __main__:trials:29 - Trial = 9846/30000 | Total reward = 42.02
2022-01-26 14:17:12.661 | DEBUG    | __main__:trials:24 - Trial = 9847/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.662 | DEBUG    | __main__:trials:29 - Trial = 9847/30000 | Total reward = 42.23
2022-01-26 14:17:12.666 | DEBUG    | __main__:trials:24 - Trial = 9848/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.666 | DEBUG    | __main__:trials:29 - Trial = 9848/30000 | Total reward = 47.29
2022-01-26 14:17:12.671 | DEBUG    | __main__:trials:24 - Trial = 9849/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.672 | DEBUG    | __main__:trials:29 - Trial = 9849/30000 | Total reward = 43.01
2022-01-26 14:17:12.676 | DEBUG    | __main__:trials:24 - Trial = 9850/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.677 | DEBUG    | __main__:trials:29 - Trial = 9850/30000 | Total reward = 43.21
2022-01-26 14:17:12.681 | DEBUG    | __main__:trials:24 - Trial = 9851/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.683 | DEBUG    | __main__:trials:29 - Trial = 9851/30000 | Total reward = 31.71
2022-01-26 14:17:12.686 | DEBUG    | __main__:trials:24 - Trial = 9852/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.688 | DEBUG    | __main__:trials:29 - Trial = 9852/30000 | Total reward = 42.67
2022-01-26 14:17:12.691 | DEBUG    | __main__:trials:24 - Trial = 9853/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.692 | DEBUG    | __main__:trials:29 - Trial = 9853/30000 | Total reward = 63.02
2022-01-26 14:17:12.695 | DEBUG    | __main__:trials:24 - Trial = 9854/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.697 | DEBUG    | __main__:trials:29 - Trial = 9854/30000 | Total reward = 47.68
2022-01-26 14:17:12.701 | DEBUG    | __main__:trials:24 - Trial = 9855/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.702 | DEBUG    | __main__:trials:29 - Trial = 9855/30000 | Total reward = 60.72
2022-01-26 14:17:12.705 | DEBUG    | __main__:trials:24 - Trial = 9856/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.706 | DEBUG    | __main__:trials:29 - Trial = 9856/30000 | Total reward = 49.55
2022-01-26 14:17:12.709 | DEBUG    | __main__:trials:24 - Trial = 9857/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.711 | DEBUG    | __main__:trials:29 - Trial = 9857/30000 | Total reward = 62.94
2022-01-26 14:17:12.713 | DEBUG    | __main__:trials:24 - Trial = 9858/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.714 | DEBUG    | __main__:trials:29 - Trial = 9858/30000 | Total reward = 45.08
2022-01-26 14:17:12.718 | DEBUG    | __main__:trials:24 - Trial = 9859/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.719 | DEBUG    | __main__:trials:29 - Trial = 9859/30000 | Total reward = 47.57
2022-01-26 14:17:12.723 | DEBUG    | __main__:trials:24 - Trial = 9860/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.724 | DEBUG    | __main__:trials:29 - Trial = 9860/30000 | Total reward = 43.34
2022-01-26 14:17:12.728 | DEBUG    | __main__:trials:24 - Trial = 9861/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.729 | DEBUG    | __main__:trials:29 - Trial = 9861/30000 | Total reward = 42.94
2022-01-26 14:17:12.732 | DEBUG    | __main__:trials:24 - Trial = 9862/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.734 | DEBUG    | __main__:trials:29 - Trial = 9862/30000 | Total reward = 49.63
2022-01-26 14:17:12.737 | DEBUG    | __main__:trials:24 - Trial = 9863/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.738 | DEBUG    | __main__:trials:29 - Trial = 9863/30000 | Total reward = 43.49
2022-01-26 14:17:12.742 | DEBUG    | __main__:trials:24 - Trial = 9864/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.743 | DEBUG    | __main__:trials:29 - Trial = 9864/30000 | Total reward = 48.03
2022-01-26 14:17:12.747 | DEBUG    | __main__:trials:24 - Trial = 9865/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.749 | DEBUG    | __main__:trials:29 - Trial = 9865/30000 | Total reward = 44.93
2022-01-26 14:17:12.752 | DEBUG    | __main__:trials:24 - Trial = 9866/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.754 | DEBUG    | __main__:trials:29 - Trial = 9866/30000 | Total reward = 32.86
2022-01-26 14:17:12.757 | DEBUG    | __main__:trials:24 - Trial = 9867/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.758 | DEBUG    | __main__:trials:29 - Trial = 9867/30000 | Total reward = 61.15
2022-01-26 14:17:12.762 | DEBUG    | __main__:trials:24 - Trial = 9868/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.763 | DEBUG    | __main__:trials:29 - Trial = 9868/30000 | Total reward = 55.92
2022-01-26 14:17:12.767 | DEBUG    | __main__:trials:24 - Trial = 9869/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.769 | DEBUG    | __main__:trials:29 - Trial = 9869/30000 | Total reward = 49.96
2022-01-26 14:17:12.772 | DEBUG    | __main__:trials:24 - Trial = 9870/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.774 | DEBUG    | __main__:trials:29 - Trial = 9870/30000 | Total reward = 57.06
2022-01-26 14:17:12.777 | DEBUG    | __main__:trials:24 - Trial = 9871/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.779 | DEBUG    | __main__:trials:29 - Trial = 9871/30000 | Total reward = 45.47
2022-01-26 14:17:12.782 | DEBUG    | __main__:trials:24 - Trial = 9872/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.783 | DEBUG    | __main__:trials:29 - Trial = 9872/30000 | Total reward = 46.43
2022-01-26 14:17:12.787 | DEBUG    | __main__:trials:24 - Trial = 9873/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.789 | DEBUG    | __main__:trials:29 - Trial = 9873/30000 | Total reward = 48.03
2022-01-26 14:17:12.793 | DEBUG    | __main__:trials:24 - Trial = 9874/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.793 | DEBUG    | __main__:trials:29 - Trial = 9874/30000 | Total reward = 44.69
2022-01-26 14:17:12.798 | DEBUG    | __main__:trials:24 - Trial = 9875/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.799 | DEBUG    | __main__:trials:29 - Trial = 9875/30000 | Total reward = 37.20
2022-01-26 14:17:12.803 | DEBUG    | __main__:trials:24 - Trial = 9876/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.804 | DEBUG    | __main__:trials:29 - Trial = 9876/30000 | Total reward = 58.77
2022-01-26 14:17:12.808 | DEBUG    | __main__:trials:24 - Trial = 9877/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.809 | DEBUG    | __main__:trials:29 - Trial = 9877/30000 | Total reward = 47.50
2022-01-26 14:17:12.813 | DEBUG    | __main__:trials:24 - Trial = 9878/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.814 | DEBUG    | __main__:trials:29 - Trial = 9878/30000 | Total reward = 47.51
2022-01-26 14:17:12.817 | DEBUG    | __main__:trials:24 - Trial = 9879/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.818 | DEBUG    | __main__:trials:29 - Trial = 9879/30000 | Total reward = 46.03
2022-01-26 14:17:12.821 | DEBUG    | __main__:trials:24 - Trial = 9880/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.822 | DEBUG    | __main__:trials:29 - Trial = 9880/30000 | Total reward = 42.29
2022-01-26 14:17:12.825 | DEBUG    | __main__:trials:24 - Trial = 9881/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.827 | DEBUG    | __main__:trials:29 - Trial = 9881/30000 | Total reward = 56.43
2022-01-26 14:17:12.830 | DEBUG    | __main__:trials:24 - Trial = 9882/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.832 | DEBUG    | __main__:trials:29 - Trial = 9882/30000 | Total reward = 48.33
2022-01-26 14:17:12.835 | DEBUG    | __main__:trials:24 - Trial = 9883/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.837 | DEBUG    | __main__:trials:29 - Trial = 9883/30000 | Total reward = 46.84
2022-01-26 14:17:12.840 | DEBUG    | __main__:trials:24 - Trial = 9884/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.841 | DEBUG    | __main__:trials:29 - Trial = 9884/30000 | Total reward = 53.06
2022-01-26 14:17:12.845 | DEBUG    | __main__:trials:24 - Trial = 9885/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.846 | DEBUG    | __main__:trials:29 - Trial = 9885/30000 | Total reward = 39.15
2022-01-26 14:17:12.850 | DEBUG    | __main__:trials:24 - Trial = 9886/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.852 | DEBUG    | __main__:trials:29 - Trial = 9886/30000 | Total reward = 43.88
2022-01-26 14:17:12.855 | DEBUG    | __main__:trials:24 - Trial = 9887/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.856 | DEBUG    | __main__:trials:29 - Trial = 9887/30000 | Total reward = 39.55
2022-01-26 14:17:12.860 | DEBUG    | __main__:trials:24 - Trial = 9888/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.862 | DEBUG    | __main__:trials:29 - Trial = 9888/30000 | Total reward = 55.48
2022-01-26 14:17:12.865 | DEBUG    | __main__:trials:24 - Trial = 9889/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.867 | DEBUG    | __main__:trials:29 - Trial = 9889/30000 | Total reward = 58.65
2022-01-26 14:17:12.871 | DEBUG    | __main__:trials:24 - Trial = 9890/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.872 | DEBUG    | __main__:trials:29 - Trial = 9890/30000 | Total reward = 46.84
2022-01-26 14:17:12.876 | DEBUG    | __main__:trials:24 - Trial = 9891/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.877 | DEBUG    | __main__:trials:29 - Trial = 9891/30000 | Total reward = 50.54
2022-01-26 14:17:12.881 | DEBUG    | __main__:trials:24 - Trial = 9892/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.881 | DEBUG    | __main__:trials:29 - Trial = 9892/30000 | Total reward = 42.73
2022-01-26 14:17:12.885 | DEBUG    | __main__:trials:24 - Trial = 9893/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.885 | DEBUG    | __main__:trials:29 - Trial = 9893/30000 | Total reward = 51.16
2022-01-26 14:17:12.889 | DEBUG    | __main__:trials:24 - Trial = 9894/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.892 | DEBUG    | __main__:trials:29 - Trial = 9894/30000 | Total reward = 44.36
2022-01-26 14:17:12.895 | DEBUG    | __main__:trials:24 - Trial = 9895/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.896 | DEBUG    | __main__:trials:29 - Trial = 9895/30000 | Total reward = 64.14
2022-01-26 14:17:12.899 | DEBUG    | __main__:trials:24 - Trial = 9896/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.901 | DEBUG    | __main__:trials:29 - Trial = 9896/30000 | Total reward = 46.46
2022-01-26 14:17:12.905 | DEBUG    | __main__:trials:24 - Trial = 9897/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.906 | DEBUG    | __main__:trials:29 - Trial = 9897/30000 | Total reward = 47.05
2022-01-26 14:17:12.909 | DEBUG    | __main__:trials:24 - Trial = 9898/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.909 | DEBUG    | __main__:trials:29 - Trial = 9898/30000 | Total reward = 57.74
2022-01-26 14:17:12.914 | DEBUG    | __main__:trials:24 - Trial = 9899/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.915 | DEBUG    | __main__:trials:29 - Trial = 9899/30000 | Total reward = 48.93
2022-01-26 14:17:12.919 | DEBUG    | __main__:trials:24 - Trial = 9900/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.921 | DEBUG    | __main__:trials:29 - Trial = 9900/30000 | Total reward = 46.95
2022-01-26 14:17:12.924 | DEBUG    | __main__:trials:24 - Trial = 9901/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.928 | DEBUG    | __main__:trials:29 - Trial = 9901/30000 | Total reward = 46.61
2022-01-26 14:17:12.933 | DEBUG    | __main__:trials:24 - Trial = 9902/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.934 | DEBUG    | __main__:trials:29 - Trial = 9902/30000 | Total reward = 41.23
2022-01-26 14:17:12.938 | DEBUG    | __main__:trials:24 - Trial = 9903/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.940 | DEBUG    | __main__:trials:29 - Trial = 9903/30000 | Total reward = 47.66
2022-01-26 14:17:12.943 | DEBUG    | __main__:trials:24 - Trial = 9904/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.945 | DEBUG    | __main__:trials:29 - Trial = 9904/30000 | Total reward = 44.83
2022-01-26 14:17:12.948 | DEBUG    | __main__:trials:24 - Trial = 9905/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.950 | DEBUG    | __main__:trials:29 - Trial = 9905/30000 | Total reward = 46.75
2022-01-26 14:17:12.953 | DEBUG    | __main__:trials:24 - Trial = 9906/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.955 | DEBUG    | __main__:trials:29 - Trial = 9906/30000 | Total reward = 46.39
2022-01-26 14:17:12.958 | DEBUG    | __main__:trials:24 - Trial = 9907/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.959 | DEBUG    | __main__:trials:29 - Trial = 9907/30000 | Total reward = 48.67
2022-01-26 14:17:12.962 | DEBUG    | __main__:trials:24 - Trial = 9908/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.964 | DEBUG    | __main__:trials:29 - Trial = 9908/30000 | Total reward = 48.03
2022-01-26 14:17:12.967 | DEBUG    | __main__:trials:24 - Trial = 9909/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.969 | DEBUG    | __main__:trials:29 - Trial = 9909/30000 | Total reward = 44.12
2022-01-26 14:17:12.972 | DEBUG    | __main__:trials:24 - Trial = 9910/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.973 | DEBUG    | __main__:trials:29 - Trial = 9910/30000 | Total reward = 45.26
2022-01-26 14:17:12.976 | DEBUG    | __main__:trials:24 - Trial = 9911/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.978 | DEBUG    | __main__:trials:29 - Trial = 9911/30000 | Total reward = 43.09
2022-01-26 14:17:12.981 | DEBUG    | __main__:trials:24 - Trial = 9912/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.982 | DEBUG    | __main__:trials:29 - Trial = 9912/30000 | Total reward = 65.45
2022-01-26 14:17:12.985 | DEBUG    | __main__:trials:24 - Trial = 9913/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.986 | DEBUG    | __main__:trials:29 - Trial = 9913/30000 | Total reward = 47.81
2022-01-26 14:17:12.989 | DEBUG    | __main__:trials:24 - Trial = 9914/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.991 | DEBUG    | __main__:trials:29 - Trial = 9914/30000 | Total reward = 41.40
2022-01-26 14:17:12.995 | DEBUG    | __main__:trials:24 - Trial = 9915/30000 | Max number of steps (20) reached
2022-01-26 14:17:12.996 | DEBUG    | __main__:trials:29 - Trial = 9915/30000 | Total reward = 54.78
2022-01-26 14:17:13.000 | DEBUG    | __main__:trials:24 - Trial = 9916/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.001 | DEBUG    | __main__:trials:29 - Trial = 9916/30000 | Total reward = 48.03
2022-01-26 14:17:13.005 | DEBUG    | __main__:trials:24 - Trial = 9917/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.007 | DEBUG    | __main__:trials:29 - Trial = 9917/30000 | Total reward = 44.03
2022-01-26 14:17:13.009 | DEBUG    | __main__:trials:24 - Trial = 9918/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.011 | DEBUG    | __main__:trials:29 - Trial = 9918/30000 | Total reward = 40.43
2022-01-26 14:17:13.014 | DEBUG    | __main__:trials:24 - Trial = 9919/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.016 | DEBUG    | __main__:trials:29 - Trial = 9919/30000 | Total reward = 42.85
2022-01-26 14:17:13.019 | DEBUG    | __main__:trials:24 - Trial = 9920/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.020 | DEBUG    | __main__:trials:29 - Trial = 9920/30000 | Total reward = 50.71
2022-01-26 14:17:13.023 | DEBUG    | __main__:trials:24 - Trial = 9921/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.025 | DEBUG    | __main__:trials:29 - Trial = 9921/30000 | Total reward = 57.48
2022-01-26 14:17:13.028 | DEBUG    | __main__:trials:24 - Trial = 9922/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.029 | DEBUG    | __main__:trials:29 - Trial = 9922/30000 | Total reward = 43.97
2022-01-26 14:17:13.034 | DEBUG    | __main__:trials:24 - Trial = 9923/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.034 | DEBUG    | __main__:trials:29 - Trial = 9923/30000 | Total reward = 56.29
2022-01-26 14:17:13.039 | DEBUG    | __main__:trials:24 - Trial = 9924/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.040 | DEBUG    | __main__:trials:29 - Trial = 9924/30000 | Total reward = 46.84
2022-01-26 14:17:13.044 | DEBUG    | __main__:trials:24 - Trial = 9925/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.044 | DEBUG    | __main__:trials:29 - Trial = 9925/30000 | Total reward = 48.09
2022-01-26 14:17:13.049 | DEBUG    | __main__:trials:24 - Trial = 9926/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.050 | DEBUG    | __main__:trials:29 - Trial = 9926/30000 | Total reward = 55.62
2022-01-26 14:17:13.054 | DEBUG    | __main__:trials:24 - Trial = 9927/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.055 | DEBUG    | __main__:trials:29 - Trial = 9927/30000 | Total reward = 45.31
2022-01-26 14:17:13.058 | DEBUG    | __main__:trials:24 - Trial = 9928/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.059 | DEBUG    | __main__:trials:29 - Trial = 9928/30000 | Total reward = 49.89
2022-01-26 14:17:13.063 | DEBUG    | __main__:trials:24 - Trial = 9929/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.065 | DEBUG    | __main__:trials:29 - Trial = 9929/30000 | Total reward = 48.34
2022-01-26 14:17:13.067 | DEBUG    | __main__:trials:24 - Trial = 9930/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.069 | DEBUG    | __main__:trials:29 - Trial = 9930/30000 | Total reward = 54.42
2022-01-26 14:17:13.072 | DEBUG    | __main__:trials:24 - Trial = 9931/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.074 | DEBUG    | __main__:trials:29 - Trial = 9931/30000 | Total reward = 41.80
2022-01-26 14:17:13.077 | DEBUG    | __main__:trials:24 - Trial = 9932/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.078 | DEBUG    | __main__:trials:29 - Trial = 9932/30000 | Total reward = 50.55
2022-01-26 14:17:13.083 | DEBUG    | __main__:trials:24 - Trial = 9933/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.083 | DEBUG    | __main__:trials:29 - Trial = 9933/30000 | Total reward = 53.21
2022-01-26 14:17:13.088 | DEBUG    | __main__:trials:24 - Trial = 9934/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.090 | DEBUG    | __main__:trials:29 - Trial = 9934/30000 | Total reward = 47.42
2022-01-26 14:17:13.094 | DEBUG    | __main__:trials:24 - Trial = 9935/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.095 | DEBUG    | __main__:trials:29 - Trial = 9935/30000 | Total reward = 42.50
2022-01-26 14:17:13.099 | DEBUG    | __main__:trials:24 - Trial = 9936/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.101 | DEBUG    | __main__:trials:29 - Trial = 9936/30000 | Total reward = 44.96
2022-01-26 14:17:13.104 | DEBUG    | __main__:trials:24 - Trial = 9937/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.105 | DEBUG    | __main__:trials:29 - Trial = 9937/30000 | Total reward = 41.36
2022-01-26 14:17:13.109 | DEBUG    | __main__:trials:24 - Trial = 9938/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.110 | DEBUG    | __main__:trials:29 - Trial = 9938/30000 | Total reward = 37.81
2022-01-26 14:17:13.114 | DEBUG    | __main__:trials:24 - Trial = 9939/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.115 | DEBUG    | __main__:trials:29 - Trial = 9939/30000 | Total reward = 35.67
2022-01-26 14:17:13.119 | DEBUG    | __main__:trials:24 - Trial = 9940/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.121 | DEBUG    | __main__:trials:29 - Trial = 9940/30000 | Total reward = 46.11
2022-01-26 14:17:13.124 | DEBUG    | __main__:trials:24 - Trial = 9941/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.126 | DEBUG    | __main__:trials:29 - Trial = 9941/30000 | Total reward = 47.86
2022-01-26 14:17:13.129 | DEBUG    | __main__:trials:24 - Trial = 9942/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.130 | DEBUG    | __main__:trials:29 - Trial = 9942/30000 | Total reward = 59.91
2022-01-26 14:17:13.134 | DEBUG    | __main__:trials:24 - Trial = 9943/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.136 | DEBUG    | __main__:trials:29 - Trial = 9943/30000 | Total reward = 50.69
2022-01-26 14:17:13.139 | DEBUG    | __main__:trials:24 - Trial = 9944/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.140 | DEBUG    | __main__:trials:29 - Trial = 9944/30000 | Total reward = 40.75
2022-01-26 14:17:13.144 | DEBUG    | __main__:trials:24 - Trial = 9945/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.145 | DEBUG    | __main__:trials:29 - Trial = 9945/30000 | Total reward = 47.28
2022-01-26 14:17:13.149 | DEBUG    | __main__:trials:24 - Trial = 9946/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.151 | DEBUG    | __main__:trials:29 - Trial = 9946/30000 | Total reward = 43.47
2022-01-26 14:17:13.155 | DEBUG    | __main__:trials:24 - Trial = 9947/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.156 | DEBUG    | __main__:trials:29 - Trial = 9947/30000 | Total reward = 53.45
2022-01-26 14:17:13.159 | DEBUG    | __main__:trials:24 - Trial = 9948/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.161 | DEBUG    | __main__:trials:29 - Trial = 9948/30000 | Total reward = 54.40
2022-01-26 14:17:13.164 | DEBUG    | __main__:trials:24 - Trial = 9949/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.165 | DEBUG    | __main__:trials:29 - Trial = 9949/30000 | Total reward = 46.90
2022-01-26 14:17:13.169 | DEBUG    | __main__:trials:24 - Trial = 9950/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.170 | DEBUG    | __main__:trials:29 - Trial = 9950/30000 | Total reward = 39.13
2022-01-26 14:17:13.173 | DEBUG    | __main__:trials:24 - Trial = 9951/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.174 | DEBUG    | __main__:trials:29 - Trial = 9951/30000 | Total reward = 40.96
2022-01-26 14:17:13.177 | DEBUG    | __main__:trials:24 - Trial = 9952/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.179 | DEBUG    | __main__:trials:29 - Trial = 9952/30000 | Total reward = 40.72
2022-01-26 14:17:13.182 | DEBUG    | __main__:trials:24 - Trial = 9953/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.183 | DEBUG    | __main__:trials:29 - Trial = 9953/30000 | Total reward = 47.14
2022-01-26 14:17:13.186 | DEBUG    | __main__:trials:24 - Trial = 9954/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.187 | DEBUG    | __main__:trials:29 - Trial = 9954/30000 | Total reward = 44.74
2022-01-26 14:17:13.190 | DEBUG    | __main__:trials:24 - Trial = 9955/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.192 | DEBUG    | __main__:trials:29 - Trial = 9955/30000 | Total reward = 42.96
2022-01-26 14:17:13.195 | DEBUG    | __main__:trials:24 - Trial = 9956/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.196 | DEBUG    | __main__:trials:29 - Trial = 9956/30000 | Total reward = 47.53
2022-01-26 14:17:13.199 | DEBUG    | __main__:trials:24 - Trial = 9957/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.201 | DEBUG    | __main__:trials:29 - Trial = 9957/30000 | Total reward = 65.30
2022-01-26 14:17:13.204 | DEBUG    | __main__:trials:24 - Trial = 9958/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.204 | DEBUG    | __main__:trials:29 - Trial = 9958/30000 | Total reward = 44.19
2022-01-26 14:17:13.208 | DEBUG    | __main__:trials:24 - Trial = 9959/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.209 | DEBUG    | __main__:trials:29 - Trial = 9959/30000 | Total reward = 33.74
2022-01-26 14:17:13.213 | DEBUG    | __main__:trials:24 - Trial = 9960/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.215 | DEBUG    | __main__:trials:29 - Trial = 9960/30000 | Total reward = 44.18
2022-01-26 14:17:13.218 | DEBUG    | __main__:trials:24 - Trial = 9961/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.218 | DEBUG    | __main__:trials:29 - Trial = 9961/30000 | Total reward = 67.02
2022-01-26 14:17:13.222 | DEBUG    | __main__:trials:24 - Trial = 9962/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.223 | DEBUG    | __main__:trials:29 - Trial = 9962/30000 | Total reward = 42.35
2022-01-26 14:17:13.226 | DEBUG    | __main__:trials:24 - Trial = 9963/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.228 | DEBUG    | __main__:trials:29 - Trial = 9963/30000 | Total reward = 37.98
2022-01-26 14:17:13.231 | DEBUG    | __main__:trials:24 - Trial = 9964/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.233 | DEBUG    | __main__:trials:29 - Trial = 9964/30000 | Total reward = 48.60
2022-01-26 14:17:13.236 | DEBUG    | __main__:trials:24 - Trial = 9965/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.237 | DEBUG    | __main__:trials:29 - Trial = 9965/30000 | Total reward = 44.04
2022-01-26 14:17:13.240 | DEBUG    | __main__:trials:24 - Trial = 9966/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.241 | DEBUG    | __main__:trials:29 - Trial = 9966/30000 | Total reward = 46.91
2022-01-26 14:17:13.244 | DEBUG    | __main__:trials:24 - Trial = 9967/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.245 | DEBUG    | __main__:trials:29 - Trial = 9967/30000 | Total reward = 44.47
2022-01-26 14:17:13.248 | DEBUG    | __main__:trials:24 - Trial = 9968/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.250 | DEBUG    | __main__:trials:29 - Trial = 9968/30000 | Total reward = 51.83
2022-01-26 14:17:13.254 | DEBUG    | __main__:trials:24 - Trial = 9969/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.255 | DEBUG    | __main__:trials:29 - Trial = 9969/30000 | Total reward = 44.69
2022-01-26 14:17:13.259 | DEBUG    | __main__:trials:24 - Trial = 9970/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.261 | DEBUG    | __main__:trials:29 - Trial = 9970/30000 | Total reward = 47.48
2022-01-26 14:17:13.264 | DEBUG    | __main__:trials:24 - Trial = 9971/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.265 | DEBUG    | __main__:trials:29 - Trial = 9971/30000 | Total reward = 42.32
2022-01-26 14:17:13.270 | DEBUG    | __main__:trials:24 - Trial = 9972/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.271 | DEBUG    | __main__:trials:29 - Trial = 9972/30000 | Total reward = 44.80
2022-01-26 14:17:13.275 | DEBUG    | __main__:trials:24 - Trial = 9973/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.276 | DEBUG    | __main__:trials:29 - Trial = 9973/30000 | Total reward = 61.68
2022-01-26 14:17:13.280 | DEBUG    | __main__:trials:24 - Trial = 9974/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.282 | DEBUG    | __main__:trials:29 - Trial = 9974/30000 | Total reward = 42.00
2022-01-26 14:17:13.286 | DEBUG    | __main__:trials:24 - Trial = 9975/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.286 | DEBUG    | __main__:trials:29 - Trial = 9975/30000 | Total reward = 44.67
2022-01-26 14:17:13.290 | DEBUG    | __main__:trials:24 - Trial = 9976/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.291 | DEBUG    | __main__:trials:29 - Trial = 9976/30000 | Total reward = 26.88
2022-01-26 14:17:13.295 | DEBUG    | __main__:trials:24 - Trial = 9977/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.297 | DEBUG    | __main__:trials:29 - Trial = 9977/30000 | Total reward = 44.90
2022-01-26 14:17:13.300 | DEBUG    | __main__:trials:24 - Trial = 9978/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.302 | DEBUG    | __main__:trials:29 - Trial = 9978/30000 | Total reward = 44.99
2022-01-26 14:17:13.305 | DEBUG    | __main__:trials:24 - Trial = 9979/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.306 | DEBUG    | __main__:trials:29 - Trial = 9979/30000 | Total reward = 62.72
2022-01-26 14:17:13.310 | DEBUG    | __main__:trials:24 - Trial = 9980/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.312 | DEBUG    | __main__:trials:29 - Trial = 9980/30000 | Total reward = 44.89
2022-01-26 14:17:13.316 | DEBUG    | __main__:trials:24 - Trial = 9981/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.317 | DEBUG    | __main__:trials:29 - Trial = 9981/30000 | Total reward = 35.74
2022-01-26 14:17:13.321 | DEBUG    | __main__:trials:26 - Trial = 9982/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:13.322 | DEBUG    | __main__:trials:29 - Trial = 9982/30000 | Total reward = 34.69
2022-01-26 14:17:13.326 | DEBUG    | __main__:trials:24 - Trial = 9983/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.327 | DEBUG    | __main__:trials:29 - Trial = 9983/30000 | Total reward = 52.73
2022-01-26 14:17:13.331 | DEBUG    | __main__:trials:24 - Trial = 9984/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.332 | DEBUG    | __main__:trials:29 - Trial = 9984/30000 | Total reward = 47.86
2022-01-26 14:17:13.336 | DEBUG    | __main__:trials:24 - Trial = 9985/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.337 | DEBUG    | __main__:trials:29 - Trial = 9985/30000 | Total reward = 49.29
2022-01-26 14:17:13.342 | DEBUG    | __main__:trials:24 - Trial = 9986/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.343 | DEBUG    | __main__:trials:29 - Trial = 9986/30000 | Total reward = 57.04
2022-01-26 14:17:13.347 | DEBUG    | __main__:trials:24 - Trial = 9987/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.348 | DEBUG    | __main__:trials:29 - Trial = 9987/30000 | Total reward = 48.73
2022-01-26 14:17:13.353 | DEBUG    | __main__:trials:24 - Trial = 9988/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.354 | DEBUG    | __main__:trials:29 - Trial = 9988/30000 | Total reward = 65.28
2022-01-26 14:17:13.358 | DEBUG    | __main__:trials:24 - Trial = 9989/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.359 | DEBUG    | __main__:trials:29 - Trial = 9989/30000 | Total reward = 52.72
2022-01-26 14:17:13.363 | DEBUG    | __main__:trials:24 - Trial = 9990/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.363 | DEBUG    | __main__:trials:29 - Trial = 9990/30000 | Total reward = 47.25
2022-01-26 14:17:13.367 | DEBUG    | __main__:trials:24 - Trial = 9991/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.369 | DEBUG    | __main__:trials:29 - Trial = 9991/30000 | Total reward = 44.46
2022-01-26 14:17:13.373 | DEBUG    | __main__:trials:24 - Trial = 9992/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.374 | DEBUG    | __main__:trials:29 - Trial = 9992/30000 | Total reward = 33.79
2022-01-26 14:17:13.378 | DEBUG    | __main__:trials:24 - Trial = 9993/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.378 | DEBUG    | __main__:trials:29 - Trial = 9993/30000 | Total reward = 40.98
2022-01-26 14:17:13.383 | DEBUG    | __main__:trials:24 - Trial = 9994/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.384 | DEBUG    | __main__:trials:29 - Trial = 9994/30000 | Total reward = 39.36
2022-01-26 14:17:13.387 | DEBUG    | __main__:trials:24 - Trial = 9995/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.389 | DEBUG    | __main__:trials:29 - Trial = 9995/30000 | Total reward = 40.93
2022-01-26 14:17:13.392 | DEBUG    | __main__:trials:24 - Trial = 9996/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.393 | DEBUG    | __main__:trials:29 - Trial = 9996/30000 | Total reward = 47.84
2022-01-26 14:17:13.397 | DEBUG    | __main__:trials:24 - Trial = 9997/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.398 | DEBUG    | __main__:trials:29 - Trial = 9997/30000 | Total reward = 59.88
2022-01-26 14:17:13.402 | DEBUG    | __main__:trials:24 - Trial = 9998/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.403 | DEBUG    | __main__:trials:29 - Trial = 9998/30000 | Total reward = 44.53
2022-01-26 14:17:13.407 | DEBUG    | __main__:trials:24 - Trial = 9999/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.409 | DEBUG    | __main__:trials:29 - Trial = 9999/30000 | Total reward = 48.99
2022-01-26 14:17:13.412 | DEBUG    | __main__:trials:24 - Trial = 10000/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.414 | DEBUG    | __main__:trials:29 - Trial = 10000/30000 | Total reward = 58.42
2022-01-26 14:17:13.417 | DEBUG    | __main__:trials:24 - Trial = 10001/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.418 | DEBUG    | __main__:trials:29 - Trial = 10001/30000 | Total reward = 40.94
2022-01-26 14:17:13.422 | DEBUG    | __main__:trials:26 - Trial = 10002/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:13.423 | DEBUG    | __main__:trials:29 - Trial = 10002/30000 | Total reward = 12.44
2022-01-26 14:17:13.427 | DEBUG    | __main__:trials:24 - Trial = 10003/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.428 | DEBUG    | __main__:trials:29 - Trial = 10003/30000 | Total reward = 41.51
2022-01-26 14:17:13.432 | DEBUG    | __main__:trials:24 - Trial = 10004/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.433 | DEBUG    | __main__:trials:29 - Trial = 10004/30000 | Total reward = 45.58
2022-01-26 14:17:13.437 | DEBUG    | __main__:trials:24 - Trial = 10005/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.438 | DEBUG    | __main__:trials:29 - Trial = 10005/30000 | Total reward = 38.24
2022-01-26 14:17:13.441 | DEBUG    | __main__:trials:24 - Trial = 10006/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.443 | DEBUG    | __main__:trials:29 - Trial = 10006/30000 | Total reward = 42.33
2022-01-26 14:17:13.446 | DEBUG    | __main__:trials:24 - Trial = 10007/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.447 | DEBUG    | __main__:trials:29 - Trial = 10007/30000 | Total reward = 43.95
2022-01-26 14:17:13.450 | DEBUG    | __main__:trials:24 - Trial = 10008/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.451 | DEBUG    | __main__:trials:29 - Trial = 10008/30000 | Total reward = 40.29
2022-01-26 14:17:13.455 | DEBUG    | __main__:trials:24 - Trial = 10009/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.457 | DEBUG    | __main__:trials:29 - Trial = 10009/30000 | Total reward = 41.34
2022-01-26 14:17:13.460 | DEBUG    | __main__:trials:24 - Trial = 10010/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.462 | DEBUG    | __main__:trials:29 - Trial = 10010/30000 | Total reward = 39.51
2022-01-26 14:17:13.465 | DEBUG    | __main__:trials:24 - Trial = 10011/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.466 | DEBUG    | __main__:trials:29 - Trial = 10011/30000 | Total reward = 44.74
2022-01-26 14:17:13.469 | DEBUG    | __main__:trials:24 - Trial = 10012/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.470 | DEBUG    | __main__:trials:29 - Trial = 10012/30000 | Total reward = 44.74
2022-01-26 14:17:13.473 | DEBUG    | __main__:trials:24 - Trial = 10013/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.475 | DEBUG    | __main__:trials:29 - Trial = 10013/30000 | Total reward = 41.88
2022-01-26 14:17:13.479 | DEBUG    | __main__:trials:24 - Trial = 10014/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.480 | DEBUG    | __main__:trials:29 - Trial = 10014/30000 | Total reward = 51.90
2022-01-26 14:17:13.484 | DEBUG    | __main__:trials:24 - Trial = 10015/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.486 | DEBUG    | __main__:trials:29 - Trial = 10015/30000 | Total reward = 50.22
2022-01-26 14:17:13.490 | DEBUG    | __main__:trials:24 - Trial = 10016/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.491 | DEBUG    | __main__:trials:29 - Trial = 10016/30000 | Total reward = 35.47
2022-01-26 14:17:13.495 | DEBUG    | __main__:trials:24 - Trial = 10017/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.496 | DEBUG    | __main__:trials:29 - Trial = 10017/30000 | Total reward = 65.50
2022-01-26 14:17:13.500 | DEBUG    | __main__:trials:24 - Trial = 10018/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.501 | DEBUG    | __main__:trials:29 - Trial = 10018/30000 | Total reward = 43.61
2022-01-26 14:17:13.505 | DEBUG    | __main__:trials:24 - Trial = 10019/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.506 | DEBUG    | __main__:trials:29 - Trial = 10019/30000 | Total reward = 44.64
2022-01-26 14:17:13.510 | DEBUG    | __main__:trials:24 - Trial = 10020/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.511 | DEBUG    | __main__:trials:29 - Trial = 10020/30000 | Total reward = 43.44
2022-01-26 14:17:13.515 | DEBUG    | __main__:trials:24 - Trial = 10021/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.517 | DEBUG    | __main__:trials:29 - Trial = 10021/30000 | Total reward = 66.25
2022-01-26 14:17:13.520 | DEBUG    | __main__:trials:24 - Trial = 10022/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.521 | DEBUG    | __main__:trials:29 - Trial = 10022/30000 | Total reward = 45.83
2022-01-26 14:17:13.524 | DEBUG    | __main__:trials:24 - Trial = 10023/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.525 | DEBUG    | __main__:trials:29 - Trial = 10023/30000 | Total reward = 34.42
2022-01-26 14:17:13.529 | DEBUG    | __main__:trials:24 - Trial = 10024/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.530 | DEBUG    | __main__:trials:29 - Trial = 10024/30000 | Total reward = 35.03
2022-01-26 14:17:13.534 | DEBUG    | __main__:trials:24 - Trial = 10025/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.534 | DEBUG    | __main__:trials:29 - Trial = 10025/30000 | Total reward = 31.17
2022-01-26 14:17:13.538 | DEBUG    | __main__:trials:24 - Trial = 10026/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.539 | DEBUG    | __main__:trials:29 - Trial = 10026/30000 | Total reward = 50.02
2022-01-26 14:17:13.542 | DEBUG    | __main__:trials:24 - Trial = 10027/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.543 | DEBUG    | __main__:trials:29 - Trial = 10027/30000 | Total reward = 47.62
2022-01-26 14:17:13.546 | DEBUG    | __main__:trials:24 - Trial = 10028/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.547 | DEBUG    | __main__:trials:29 - Trial = 10028/30000 | Total reward = 48.03
2022-01-26 14:17:13.551 | DEBUG    | __main__:trials:24 - Trial = 10029/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.553 | DEBUG    | __main__:trials:29 - Trial = 10029/30000 | Total reward = 52.00
2022-01-26 14:17:13.556 | DEBUG    | __main__:trials:24 - Trial = 10030/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.558 | DEBUG    | __main__:trials:29 - Trial = 10030/30000 | Total reward = 61.26
2022-01-26 14:17:13.562 | DEBUG    | __main__:trials:24 - Trial = 10031/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.563 | DEBUG    | __main__:trials:29 - Trial = 10031/30000 | Total reward = 45.76
2022-01-26 14:17:13.567 | DEBUG    | __main__:trials:24 - Trial = 10032/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.568 | DEBUG    | __main__:trials:29 - Trial = 10032/30000 | Total reward = 38.67
2022-01-26 14:17:13.571 | DEBUG    | __main__:trials:26 - Trial = 10033/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:13.572 | DEBUG    | __main__:trials:29 - Trial = 10033/30000 | Total reward = 16.30
2022-01-26 14:17:13.576 | DEBUG    | __main__:trials:24 - Trial = 10034/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.577 | DEBUG    | __main__:trials:29 - Trial = 10034/30000 | Total reward = 46.84
2022-01-26 14:17:13.581 | DEBUG    | __main__:trials:24 - Trial = 10035/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.582 | DEBUG    | __main__:trials:29 - Trial = 10035/30000 | Total reward = 34.42
2022-01-26 14:17:13.586 | DEBUG    | __main__:trials:24 - Trial = 10036/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.588 | DEBUG    | __main__:trials:29 - Trial = 10036/30000 | Total reward = 47.31
2022-01-26 14:17:13.591 | DEBUG    | __main__:trials:24 - Trial = 10037/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.593 | DEBUG    | __main__:trials:29 - Trial = 10037/30000 | Total reward = 32.66
2022-01-26 14:17:13.596 | DEBUG    | __main__:trials:24 - Trial = 10038/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.598 | DEBUG    | __main__:trials:29 - Trial = 10038/30000 | Total reward = 14.56
2022-01-26 14:17:13.602 | DEBUG    | __main__:trials:24 - Trial = 10039/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.602 | DEBUG    | __main__:trials:29 - Trial = 10039/30000 | Total reward = 48.28
2022-01-26 14:17:13.606 | DEBUG    | __main__:trials:24 - Trial = 10040/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.607 | DEBUG    | __main__:trials:29 - Trial = 10040/30000 | Total reward = 41.05
2022-01-26 14:17:13.611 | DEBUG    | __main__:trials:24 - Trial = 10041/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.613 | DEBUG    | __main__:trials:29 - Trial = 10041/30000 | Total reward = 43.65
2022-01-26 14:17:13.616 | DEBUG    | __main__:trials:24 - Trial = 10042/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.618 | DEBUG    | __main__:trials:29 - Trial = 10042/30000 | Total reward = 43.93
2022-01-26 14:17:13.621 | DEBUG    | __main__:trials:24 - Trial = 10043/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.623 | DEBUG    | __main__:trials:29 - Trial = 10043/30000 | Total reward = 44.15
2022-01-26 14:17:13.626 | DEBUG    | __main__:trials:24 - Trial = 10044/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.628 | DEBUG    | __main__:trials:29 - Trial = 10044/30000 | Total reward = 44.27
2022-01-26 14:17:13.631 | DEBUG    | __main__:trials:24 - Trial = 10045/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.633 | DEBUG    | __main__:trials:29 - Trial = 10045/30000 | Total reward = 40.00
2022-01-26 14:17:13.636 | DEBUG    | __main__:trials:24 - Trial = 10046/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.638 | DEBUG    | __main__:trials:29 - Trial = 10046/30000 | Total reward = 41.26
2022-01-26 14:17:13.641 | DEBUG    | __main__:trials:24 - Trial = 10047/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.642 | DEBUG    | __main__:trials:29 - Trial = 10047/30000 | Total reward = 56.38
2022-01-26 14:17:13.646 | DEBUG    | __main__:trials:24 - Trial = 10048/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.647 | DEBUG    | __main__:trials:29 - Trial = 10048/30000 | Total reward = 48.97
2022-01-26 14:17:13.651 | DEBUG    | __main__:trials:24 - Trial = 10049/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.653 | DEBUG    | __main__:trials:29 - Trial = 10049/30000 | Total reward = 44.44
2022-01-26 14:17:13.656 | DEBUG    | __main__:trials:24 - Trial = 10050/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.658 | DEBUG    | __main__:trials:29 - Trial = 10050/30000 | Total reward = 63.50
2022-01-26 14:17:13.662 | DEBUG    | __main__:trials:24 - Trial = 10051/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.663 | DEBUG    | __main__:trials:29 - Trial = 10051/30000 | Total reward = 37.36
2022-01-26 14:17:13.666 | DEBUG    | __main__:trials:24 - Trial = 10052/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.668 | DEBUG    | __main__:trials:29 - Trial = 10052/30000 | Total reward = 41.83
2022-01-26 14:17:13.671 | DEBUG    | __main__:trials:24 - Trial = 10053/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.673 | DEBUG    | __main__:trials:29 - Trial = 10053/30000 | Total reward = 53.83
2022-01-26 14:17:13.676 | DEBUG    | __main__:trials:24 - Trial = 10054/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.678 | DEBUG    | __main__:trials:29 - Trial = 10054/30000 | Total reward = 37.32
2022-01-26 14:17:13.681 | DEBUG    | __main__:trials:24 - Trial = 10055/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.681 | DEBUG    | __main__:trials:29 - Trial = 10055/30000 | Total reward = 53.11
2022-01-26 14:17:13.686 | DEBUG    | __main__:trials:24 - Trial = 10056/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.687 | DEBUG    | __main__:trials:29 - Trial = 10056/30000 | Total reward = 30.57
2022-01-26 14:17:13.691 | DEBUG    | __main__:trials:24 - Trial = 10057/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.693 | DEBUG    | __main__:trials:29 - Trial = 10057/30000 | Total reward = 59.09
2022-01-26 14:17:13.695 | DEBUG    | __main__:trials:24 - Trial = 10058/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.697 | DEBUG    | __main__:trials:29 - Trial = 10058/30000 | Total reward = 43.65
2022-01-26 14:17:13.701 | DEBUG    | __main__:trials:24 - Trial = 10059/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.702 | DEBUG    | __main__:trials:29 - Trial = 10059/30000 | Total reward = 47.39
2022-01-26 14:17:13.706 | DEBUG    | __main__:trials:24 - Trial = 10060/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.707 | DEBUG    | __main__:trials:29 - Trial = 10060/30000 | Total reward = 40.49
2022-01-26 14:17:13.710 | DEBUG    | __main__:trials:24 - Trial = 10061/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.711 | DEBUG    | __main__:trials:29 - Trial = 10061/30000 | Total reward = 43.84
2022-01-26 14:17:13.715 | DEBUG    | __main__:trials:24 - Trial = 10062/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.716 | DEBUG    | __main__:trials:29 - Trial = 10062/30000 | Total reward = 43.15
2022-01-26 14:17:13.720 | DEBUG    | __main__:trials:24 - Trial = 10063/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.721 | DEBUG    | __main__:trials:29 - Trial = 10063/30000 | Total reward = 40.64
2022-01-26 14:17:13.725 | DEBUG    | __main__:trials:24 - Trial = 10064/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.726 | DEBUG    | __main__:trials:29 - Trial = 10064/30000 | Total reward = 39.95
2022-01-26 14:17:13.730 | DEBUG    | __main__:trials:24 - Trial = 10065/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.732 | DEBUG    | __main__:trials:29 - Trial = 10065/30000 | Total reward = 46.85
2022-01-26 14:17:13.735 | DEBUG    | __main__:trials:24 - Trial = 10066/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.737 | DEBUG    | __main__:trials:29 - Trial = 10066/30000 | Total reward = 39.77
2022-01-26 14:17:13.740 | DEBUG    | __main__:trials:24 - Trial = 10067/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.742 | DEBUG    | __main__:trials:29 - Trial = 10067/30000 | Total reward = 41.12
2022-01-26 14:17:13.746 | DEBUG    | __main__:trials:24 - Trial = 10068/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.747 | DEBUG    | __main__:trials:29 - Trial = 10068/30000 | Total reward = 44.36
2022-01-26 14:17:13.751 | DEBUG    | __main__:trials:24 - Trial = 10069/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.751 | DEBUG    | __main__:trials:29 - Trial = 10069/30000 | Total reward = 44.74
2022-01-26 14:17:13.755 | DEBUG    | __main__:trials:24 - Trial = 10070/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.756 | DEBUG    | __main__:trials:29 - Trial = 10070/30000 | Total reward = 40.18
2022-01-26 14:17:13.761 | DEBUG    | __main__:trials:24 - Trial = 10071/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.762 | DEBUG    | __main__:trials:29 - Trial = 10071/30000 | Total reward = 41.91
2022-01-26 14:17:13.766 | DEBUG    | __main__:trials:24 - Trial = 10072/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.767 | DEBUG    | __main__:trials:29 - Trial = 10072/30000 | Total reward = 42.15
2022-01-26 14:17:13.771 | DEBUG    | __main__:trials:24 - Trial = 10073/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.772 | DEBUG    | __main__:trials:29 - Trial = 10073/30000 | Total reward = 42.37
2022-01-26 14:17:13.776 | DEBUG    | __main__:trials:24 - Trial = 10074/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.777 | DEBUG    | __main__:trials:29 - Trial = 10074/30000 | Total reward = 38.25
2022-01-26 14:17:13.780 | DEBUG    | __main__:trials:24 - Trial = 10075/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.782 | DEBUG    | __main__:trials:29 - Trial = 10075/30000 | Total reward = 43.11
2022-01-26 14:17:13.785 | DEBUG    | __main__:trials:24 - Trial = 10076/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.786 | DEBUG    | __main__:trials:29 - Trial = 10076/30000 | Total reward = 44.30
2022-01-26 14:17:13.789 | DEBUG    | __main__:trials:24 - Trial = 10077/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.792 | DEBUG    | __main__:trials:29 - Trial = 10077/30000 | Total reward = 42.62
2022-01-26 14:17:13.795 | DEBUG    | __main__:trials:24 - Trial = 10078/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.797 | DEBUG    | __main__:trials:29 - Trial = 10078/30000 | Total reward = 44.39
2022-01-26 14:17:13.800 | DEBUG    | __main__:trials:24 - Trial = 10079/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.801 | DEBUG    | __main__:trials:29 - Trial = 10079/30000 | Total reward = 43.64
2022-01-26 14:17:13.805 | DEBUG    | __main__:trials:24 - Trial = 10080/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.807 | DEBUG    | __main__:trials:29 - Trial = 10080/30000 | Total reward = 34.00
2022-01-26 14:17:13.810 | DEBUG    | __main__:trials:24 - Trial = 10081/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.812 | DEBUG    | __main__:trials:29 - Trial = 10081/30000 | Total reward = 40.60
2022-01-26 14:17:13.816 | DEBUG    | __main__:trials:24 - Trial = 10082/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.817 | DEBUG    | __main__:trials:29 - Trial = 10082/30000 | Total reward = 40.91
2022-01-26 14:17:13.997 | DEBUG    | __main__:trials:24 - Trial = 10083/30000 | Max number of steps (20) reached
2022-01-26 14:17:13.999 | DEBUG    | __main__:trials:29 - Trial = 10083/30000 | Total reward = 43.25
2022-01-26 14:17:14.003 | DEBUG    | __main__:trials:24 - Trial = 10084/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.005 | DEBUG    | __main__:trials:29 - Trial = 10084/30000 | Total reward = 43.05
2022-01-26 14:17:14.008 | DEBUG    | __main__:trials:24 - Trial = 10085/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.010 | DEBUG    | __main__:trials:29 - Trial = 10085/30000 | Total reward = 47.71
2022-01-26 14:17:14.013 | DEBUG    | __main__:trials:24 - Trial = 10086/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.015 | DEBUG    | __main__:trials:29 - Trial = 10086/30000 | Total reward = 39.13
2022-01-26 14:17:14.019 | DEBUG    | __main__:trials:24 - Trial = 10087/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.019 | DEBUG    | __main__:trials:29 - Trial = 10087/30000 | Total reward = 36.07
2022-01-26 14:17:14.024 | DEBUG    | __main__:trials:24 - Trial = 10088/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.025 | DEBUG    | __main__:trials:29 - Trial = 10088/30000 | Total reward = 47.15
2022-01-26 14:17:14.029 | DEBUG    | __main__:trials:24 - Trial = 10089/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.030 | DEBUG    | __main__:trials:29 - Trial = 10089/30000 | Total reward = 43.65
2022-01-26 14:17:14.034 | DEBUG    | __main__:trials:24 - Trial = 10090/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.034 | DEBUG    | __main__:trials:29 - Trial = 10090/30000 | Total reward = 36.32
2022-01-26 14:17:14.039 | DEBUG    | __main__:trials:24 - Trial = 10091/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.040 | DEBUG    | __main__:trials:29 - Trial = 10091/30000 | Total reward = 35.64
2022-01-26 14:17:14.044 | DEBUG    | __main__:trials:24 - Trial = 10092/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.045 | DEBUG    | __main__:trials:29 - Trial = 10092/30000 | Total reward = 42.50
2022-01-26 14:17:14.049 | DEBUG    | __main__:trials:24 - Trial = 10093/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.050 | DEBUG    | __main__:trials:29 - Trial = 10093/30000 | Total reward = 44.50
2022-01-26 14:17:14.054 | DEBUG    | __main__:trials:24 - Trial = 10094/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.054 | DEBUG    | __main__:trials:29 - Trial = 10094/30000 | Total reward = 47.31
2022-01-26 14:17:14.058 | DEBUG    | __main__:trials:24 - Trial = 10095/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.059 | DEBUG    | __main__:trials:29 - Trial = 10095/30000 | Total reward = 46.67
2022-01-26 14:17:14.063 | DEBUG    | __main__:trials:24 - Trial = 10096/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.064 | DEBUG    | __main__:trials:29 - Trial = 10096/30000 | Total reward = 44.40
2022-01-26 14:17:14.067 | DEBUG    | __main__:trials:24 - Trial = 10097/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.068 | DEBUG    | __main__:trials:29 - Trial = 10097/30000 | Total reward = 54.87
2022-01-26 14:17:14.071 | DEBUG    | __main__:trials:24 - Trial = 10098/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.073 | DEBUG    | __main__:trials:29 - Trial = 10098/30000 | Total reward = 64.09
2022-01-26 14:17:14.076 | DEBUG    | __main__:trials:24 - Trial = 10099/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.078 | DEBUG    | __main__:trials:29 - Trial = 10099/30000 | Total reward = 39.45
2022-01-26 14:17:14.081 | DEBUG    | __main__:trials:24 - Trial = 10100/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.082 | DEBUG    | __main__:trials:29 - Trial = 10100/30000 | Total reward = 53.78
2022-01-26 14:17:14.086 | DEBUG    | __main__:trials:24 - Trial = 10101/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.087 | DEBUG    | __main__:trials:29 - Trial = 10101/30000 | Total reward = 38.20
2022-01-26 14:17:14.091 | DEBUG    | __main__:trials:24 - Trial = 10102/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.091 | DEBUG    | __main__:trials:29 - Trial = 10102/30000 | Total reward = 48.23
2022-01-26 14:17:14.095 | DEBUG    | __main__:trials:24 - Trial = 10103/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.096 | DEBUG    | __main__:trials:29 - Trial = 10103/30000 | Total reward = 38.44
2022-01-26 14:17:14.100 | DEBUG    | __main__:trials:24 - Trial = 10104/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.100 | DEBUG    | __main__:trials:29 - Trial = 10104/30000 | Total reward = 44.07
2022-01-26 14:17:14.104 | DEBUG    | __main__:trials:24 - Trial = 10105/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.106 | DEBUG    | __main__:trials:29 - Trial = 10105/30000 | Total reward = 36.64
2022-01-26 14:17:14.109 | DEBUG    | __main__:trials:24 - Trial = 10106/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.110 | DEBUG    | __main__:trials:29 - Trial = 10106/30000 | Total reward = 42.22
2022-01-26 14:17:14.114 | DEBUG    | __main__:trials:24 - Trial = 10107/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.115 | DEBUG    | __main__:trials:29 - Trial = 10107/30000 | Total reward = 37.80
2022-01-26 14:17:14.119 | DEBUG    | __main__:trials:24 - Trial = 10108/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.120 | DEBUG    | __main__:trials:29 - Trial = 10108/30000 | Total reward = 40.25
2022-01-26 14:17:14.123 | DEBUG    | __main__:trials:24 - Trial = 10109/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.125 | DEBUG    | __main__:trials:29 - Trial = 10109/30000 | Total reward = 42.22
2022-01-26 14:17:14.128 | DEBUG    | __main__:trials:26 - Trial = 10110/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.129 | DEBUG    | __main__:trials:29 - Trial = 10110/30000 | Total reward = 20.30
2022-01-26 14:17:14.133 | DEBUG    | __main__:trials:24 - Trial = 10111/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.134 | DEBUG    | __main__:trials:29 - Trial = 10111/30000 | Total reward = 25.99
2022-01-26 14:17:14.138 | DEBUG    | __main__:trials:24 - Trial = 10112/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.139 | DEBUG    | __main__:trials:29 - Trial = 10112/30000 | Total reward = 34.70
2022-01-26 14:17:14.143 | DEBUG    | __main__:trials:24 - Trial = 10113/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.144 | DEBUG    | __main__:trials:29 - Trial = 10113/30000 | Total reward = 40.13
2022-01-26 14:17:14.147 | DEBUG    | __main__:trials:24 - Trial = 10114/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.149 | DEBUG    | __main__:trials:29 - Trial = 10114/30000 | Total reward = 43.26
2022-01-26 14:17:14.152 | DEBUG    | __main__:trials:24 - Trial = 10115/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.153 | DEBUG    | __main__:trials:29 - Trial = 10115/30000 | Total reward = 47.63
2022-01-26 14:17:14.157 | DEBUG    | __main__:trials:24 - Trial = 10116/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.159 | DEBUG    | __main__:trials:29 - Trial = 10116/30000 | Total reward = 39.29
2022-01-26 14:17:14.162 | DEBUG    | __main__:trials:24 - Trial = 10117/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.164 | DEBUG    | __main__:trials:29 - Trial = 10117/30000 | Total reward = 42.64
2022-01-26 14:17:14.168 | DEBUG    | __main__:trials:24 - Trial = 10118/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.169 | DEBUG    | __main__:trials:29 - Trial = 10118/30000 | Total reward = 39.62
2022-01-26 14:17:14.173 | DEBUG    | __main__:trials:24 - Trial = 10119/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.174 | DEBUG    | __main__:trials:29 - Trial = 10119/30000 | Total reward = 38.83
2022-01-26 14:17:14.177 | DEBUG    | __main__:trials:24 - Trial = 10120/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.178 | DEBUG    | __main__:trials:29 - Trial = 10120/30000 | Total reward = 46.14
2022-01-26 14:17:14.181 | DEBUG    | __main__:trials:24 - Trial = 10121/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.183 | DEBUG    | __main__:trials:29 - Trial = 10121/30000 | Total reward = 42.25
2022-01-26 14:17:14.187 | DEBUG    | __main__:trials:24 - Trial = 10122/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.188 | DEBUG    | __main__:trials:29 - Trial = 10122/30000 | Total reward = 46.06
2022-01-26 14:17:14.192 | DEBUG    | __main__:trials:24 - Trial = 10123/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.193 | DEBUG    | __main__:trials:29 - Trial = 10123/30000 | Total reward = 39.95
2022-01-26 14:17:14.197 | DEBUG    | __main__:trials:24 - Trial = 10124/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.197 | DEBUG    | __main__:trials:29 - Trial = 10124/30000 | Total reward = 38.55
2022-01-26 14:17:14.202 | DEBUG    | __main__:trials:24 - Trial = 10125/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.202 | DEBUG    | __main__:trials:29 - Trial = 10125/30000 | Total reward = 43.65
2022-01-26 14:17:14.207 | DEBUG    | __main__:trials:24 - Trial = 10126/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.208 | DEBUG    | __main__:trials:29 - Trial = 10126/30000 | Total reward = 37.82
2022-01-26 14:17:14.212 | DEBUG    | __main__:trials:24 - Trial = 10127/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.213 | DEBUG    | __main__:trials:29 - Trial = 10127/30000 | Total reward = 42.08
2022-01-26 14:17:14.217 | DEBUG    | __main__:trials:24 - Trial = 10128/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.218 | DEBUG    | __main__:trials:29 - Trial = 10128/30000 | Total reward = 48.47
2022-01-26 14:17:14.223 | DEBUG    | __main__:trials:24 - Trial = 10129/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.224 | DEBUG    | __main__:trials:29 - Trial = 10129/30000 | Total reward = 47.32
2022-01-26 14:17:14.228 | DEBUG    | __main__:trials:24 - Trial = 10130/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.229 | DEBUG    | __main__:trials:29 - Trial = 10130/30000 | Total reward = 44.34
2022-01-26 14:17:14.233 | DEBUG    | __main__:trials:24 - Trial = 10131/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.234 | DEBUG    | __main__:trials:29 - Trial = 10131/30000 | Total reward = 55.27
2022-01-26 14:17:14.238 | DEBUG    | __main__:trials:24 - Trial = 10132/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.239 | DEBUG    | __main__:trials:29 - Trial = 10132/30000 | Total reward = 41.45
2022-01-26 14:17:14.243 | DEBUG    | __main__:trials:24 - Trial = 10133/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.244 | DEBUG    | __main__:trials:29 - Trial = 10133/30000 | Total reward = 29.18
2022-01-26 14:17:14.248 | DEBUG    | __main__:trials:24 - Trial = 10134/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.248 | DEBUG    | __main__:trials:29 - Trial = 10134/30000 | Total reward = 40.79
2022-01-26 14:17:14.252 | DEBUG    | __main__:trials:24 - Trial = 10135/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.253 | DEBUG    | __main__:trials:29 - Trial = 10135/30000 | Total reward = 31.67
2022-01-26 14:17:14.256 | DEBUG    | __main__:trials:24 - Trial = 10136/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.257 | DEBUG    | __main__:trials:29 - Trial = 10136/30000 | Total reward = 37.19
2022-01-26 14:17:14.260 | DEBUG    | __main__:trials:24 - Trial = 10137/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.262 | DEBUG    | __main__:trials:29 - Trial = 10137/30000 | Total reward = 43.65
2022-01-26 14:17:14.265 | DEBUG    | __main__:trials:24 - Trial = 10138/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.266 | DEBUG    | __main__:trials:29 - Trial = 10138/30000 | Total reward = 41.36
2022-01-26 14:17:14.270 | DEBUG    | __main__:trials:24 - Trial = 10139/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.270 | DEBUG    | __main__:trials:29 - Trial = 10139/30000 | Total reward = 44.21
2022-01-26 14:17:14.274 | DEBUG    | __main__:trials:24 - Trial = 10140/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.275 | DEBUG    | __main__:trials:29 - Trial = 10140/30000 | Total reward = 42.70
2022-01-26 14:17:14.279 | DEBUG    | __main__:trials:24 - Trial = 10141/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.280 | DEBUG    | __main__:trials:29 - Trial = 10141/30000 | Total reward = 36.31
2022-01-26 14:17:14.283 | DEBUG    | __main__:trials:24 - Trial = 10142/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.285 | DEBUG    | __main__:trials:29 - Trial = 10142/30000 | Total reward = 47.73
2022-01-26 14:17:14.288 | DEBUG    | __main__:trials:24 - Trial = 10143/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.289 | DEBUG    | __main__:trials:29 - Trial = 10143/30000 | Total reward = 54.16
2022-01-26 14:17:14.292 | DEBUG    | __main__:trials:24 - Trial = 10144/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.293 | DEBUG    | __main__:trials:29 - Trial = 10144/30000 | Total reward = 42.68
2022-01-26 14:17:14.296 | DEBUG    | __main__:trials:24 - Trial = 10145/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.298 | DEBUG    | __main__:trials:29 - Trial = 10145/30000 | Total reward = 40.55
2022-01-26 14:17:14.301 | DEBUG    | __main__:trials:24 - Trial = 10146/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.301 | DEBUG    | __main__:trials:29 - Trial = 10146/30000 | Total reward = 49.14
2022-01-26 14:17:14.305 | DEBUG    | __main__:trials:24 - Trial = 10147/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.305 | DEBUG    | __main__:trials:29 - Trial = 10147/30000 | Total reward = 43.80
2022-01-26 14:17:14.309 | DEBUG    | __main__:trials:24 - Trial = 10148/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.309 | DEBUG    | __main__:trials:29 - Trial = 10148/30000 | Total reward = 40.63
2022-01-26 14:17:14.313 | DEBUG    | __main__:trials:24 - Trial = 10149/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.314 | DEBUG    | __main__:trials:29 - Trial = 10149/30000 | Total reward = 36.95
2022-01-26 14:17:14.317 | DEBUG    | __main__:trials:24 - Trial = 10150/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.318 | DEBUG    | __main__:trials:29 - Trial = 10150/30000 | Total reward = 40.06
2022-01-26 14:17:14.321 | DEBUG    | __main__:trials:24 - Trial = 10151/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.322 | DEBUG    | __main__:trials:29 - Trial = 10151/30000 | Total reward = 41.28
2022-01-26 14:17:14.326 | DEBUG    | __main__:trials:24 - Trial = 10152/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.327 | DEBUG    | __main__:trials:29 - Trial = 10152/30000 | Total reward = 43.90
2022-01-26 14:17:14.330 | DEBUG    | __main__:trials:24 - Trial = 10153/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.332 | DEBUG    | __main__:trials:29 - Trial = 10153/30000 | Total reward = 41.43
2022-01-26 14:17:14.335 | DEBUG    | __main__:trials:24 - Trial = 10154/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.335 | DEBUG    | __main__:trials:29 - Trial = 10154/30000 | Total reward = 37.55
2022-01-26 14:17:14.339 | DEBUG    | __main__:trials:24 - Trial = 10155/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.341 | DEBUG    | __main__:trials:29 - Trial = 10155/30000 | Total reward = 41.61
2022-01-26 14:17:14.343 | DEBUG    | __main__:trials:24 - Trial = 10156/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.344 | DEBUG    | __main__:trials:29 - Trial = 10156/30000 | Total reward = 42.05
2022-01-26 14:17:14.348 | DEBUG    | __main__:trials:24 - Trial = 10157/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.348 | DEBUG    | __main__:trials:29 - Trial = 10157/30000 | Total reward = 43.06
2022-01-26 14:17:14.352 | DEBUG    | __main__:trials:24 - Trial = 10158/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.353 | DEBUG    | __main__:trials:29 - Trial = 10158/30000 | Total reward = 44.22
2022-01-26 14:17:14.356 | DEBUG    | __main__:trials:24 - Trial = 10159/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.358 | DEBUG    | __main__:trials:29 - Trial = 10159/30000 | Total reward = 41.49
2022-01-26 14:17:14.362 | DEBUG    | __main__:trials:24 - Trial = 10160/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.362 | DEBUG    | __main__:trials:29 - Trial = 10160/30000 | Total reward = 44.22
2022-01-26 14:17:14.366 | DEBUG    | __main__:trials:24 - Trial = 10161/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.367 | DEBUG    | __main__:trials:29 - Trial = 10161/30000 | Total reward = 40.07
2022-01-26 14:17:14.370 | DEBUG    | __main__:trials:24 - Trial = 10162/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.372 | DEBUG    | __main__:trials:29 - Trial = 10162/30000 | Total reward = 52.05
2022-01-26 14:17:14.375 | DEBUG    | __main__:trials:24 - Trial = 10163/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.376 | DEBUG    | __main__:trials:29 - Trial = 10163/30000 | Total reward = 68.95
2022-01-26 14:17:14.379 | DEBUG    | __main__:trials:24 - Trial = 10164/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.380 | DEBUG    | __main__:trials:29 - Trial = 10164/30000 | Total reward = 41.81
2022-01-26 14:17:14.383 | DEBUG    | __main__:trials:24 - Trial = 10165/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.385 | DEBUG    | __main__:trials:29 - Trial = 10165/30000 | Total reward = 38.48
2022-01-26 14:17:14.388 | DEBUG    | __main__:trials:24 - Trial = 10166/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.389 | DEBUG    | __main__:trials:29 - Trial = 10166/30000 | Total reward = 34.48
2022-01-26 14:17:14.392 | DEBUG    | __main__:trials:24 - Trial = 10167/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.394 | DEBUG    | __main__:trials:29 - Trial = 10167/30000 | Total reward = 42.40
2022-01-26 14:17:14.397 | DEBUG    | __main__:trials:24 - Trial = 10168/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.397 | DEBUG    | __main__:trials:29 - Trial = 10168/30000 | Total reward = 58.30
2022-01-26 14:17:14.401 | DEBUG    | __main__:trials:24 - Trial = 10169/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.401 | DEBUG    | __main__:trials:29 - Trial = 10169/30000 | Total reward = 51.53
2022-01-26 14:17:14.405 | DEBUG    | __main__:trials:24 - Trial = 10170/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.405 | DEBUG    | __main__:trials:29 - Trial = 10170/30000 | Total reward = 42.74
2022-01-26 14:17:14.409 | DEBUG    | __main__:trials:24 - Trial = 10171/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.409 | DEBUG    | __main__:trials:29 - Trial = 10171/30000 | Total reward = 32.90
2022-01-26 14:17:14.413 | DEBUG    | __main__:trials:24 - Trial = 10172/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.415 | DEBUG    | __main__:trials:29 - Trial = 10172/30000 | Total reward = 42.26
2022-01-26 14:17:14.418 | DEBUG    | __main__:trials:24 - Trial = 10173/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.419 | DEBUG    | __main__:trials:29 - Trial = 10173/30000 | Total reward = 42.60
2022-01-26 14:17:14.422 | DEBUG    | __main__:trials:24 - Trial = 10174/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.422 | DEBUG    | __main__:trials:29 - Trial = 10174/30000 | Total reward = 38.59
2022-01-26 14:17:14.426 | DEBUG    | __main__:trials:24 - Trial = 10175/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.427 | DEBUG    | __main__:trials:29 - Trial = 10175/30000 | Total reward = 35.07
2022-01-26 14:17:14.430 | DEBUG    | __main__:trials:24 - Trial = 10176/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.431 | DEBUG    | __main__:trials:29 - Trial = 10176/30000 | Total reward = 47.84
2022-01-26 14:17:14.435 | DEBUG    | __main__:trials:24 - Trial = 10177/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.436 | DEBUG    | __main__:trials:29 - Trial = 10177/30000 | Total reward = 36.66
2022-01-26 14:17:14.439 | DEBUG    | __main__:trials:26 - Trial = 10178/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.439 | DEBUG    | __main__:trials:29 - Trial = 10178/30000 | Total reward = 20.26
2022-01-26 14:17:14.443 | DEBUG    | __main__:trials:24 - Trial = 10179/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.443 | DEBUG    | __main__:trials:29 - Trial = 10179/30000 | Total reward = 42.05
2022-01-26 14:17:14.447 | DEBUG    | __main__:trials:24 - Trial = 10180/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.448 | DEBUG    | __main__:trials:29 - Trial = 10180/30000 | Total reward = 41.52
2022-01-26 14:17:14.451 | DEBUG    | __main__:trials:24 - Trial = 10181/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.452 | DEBUG    | __main__:trials:29 - Trial = 10181/30000 | Total reward = 34.10
2022-01-26 14:17:14.456 | DEBUG    | __main__:trials:24 - Trial = 10182/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.457 | DEBUG    | __main__:trials:29 - Trial = 10182/30000 | Total reward = 42.74
2022-01-26 14:17:14.461 | DEBUG    | __main__:trials:24 - Trial = 10183/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.462 | DEBUG    | __main__:trials:29 - Trial = 10183/30000 | Total reward = 38.49
2022-01-26 14:17:14.465 | DEBUG    | __main__:trials:24 - Trial = 10184/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.465 | DEBUG    | __main__:trials:29 - Trial = 10184/30000 | Total reward = 47.07
2022-01-26 14:17:14.469 | DEBUG    | __main__:trials:24 - Trial = 10185/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.470 | DEBUG    | __main__:trials:29 - Trial = 10185/30000 | Total reward = 38.75
2022-01-26 14:17:14.474 | DEBUG    | __main__:trials:24 - Trial = 10186/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.474 | DEBUG    | __main__:trials:29 - Trial = 10186/30000 | Total reward = 44.51
2022-01-26 14:17:14.478 | DEBUG    | __main__:trials:24 - Trial = 10187/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.480 | DEBUG    | __main__:trials:29 - Trial = 10187/30000 | Total reward = 32.71
2022-01-26 14:17:14.483 | DEBUG    | __main__:trials:24 - Trial = 10188/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.485 | DEBUG    | __main__:trials:29 - Trial = 10188/30000 | Total reward = 36.60
2022-01-26 14:17:14.488 | DEBUG    | __main__:trials:24 - Trial = 10189/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.489 | DEBUG    | __main__:trials:29 - Trial = 10189/30000 | Total reward = 41.43
2022-01-26 14:17:14.493 | DEBUG    | __main__:trials:24 - Trial = 10190/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.493 | DEBUG    | __main__:trials:29 - Trial = 10190/30000 | Total reward = 34.53
2022-01-26 14:17:14.495 | DEBUG    | __main__:trials:26 - Trial = 10191/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.496 | DEBUG    | __main__:trials:29 - Trial = 10191/30000 | Total reward = 8.75
2022-01-26 14:17:14.499 | DEBUG    | __main__:trials:24 - Trial = 10192/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.501 | DEBUG    | __main__:trials:29 - Trial = 10192/30000 | Total reward = 30.85
2022-01-26 14:17:14.504 | DEBUG    | __main__:trials:24 - Trial = 10193/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.506 | DEBUG    | __main__:trials:29 - Trial = 10193/30000 | Total reward = 29.73
2022-01-26 14:17:14.510 | DEBUG    | __main__:trials:24 - Trial = 10194/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.510 | DEBUG    | __main__:trials:29 - Trial = 10194/30000 | Total reward = 65.23
2022-01-26 14:17:14.514 | DEBUG    | __main__:trials:24 - Trial = 10195/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.515 | DEBUG    | __main__:trials:29 - Trial = 10195/30000 | Total reward = 39.95
2022-01-26 14:17:14.519 | DEBUG    | __main__:trials:24 - Trial = 10196/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.519 | DEBUG    | __main__:trials:29 - Trial = 10196/30000 | Total reward = 21.75
2022-01-26 14:17:14.524 | DEBUG    | __main__:trials:24 - Trial = 10197/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.525 | DEBUG    | __main__:trials:29 - Trial = 10197/30000 | Total reward = 42.32
2022-01-26 14:17:14.529 | DEBUG    | __main__:trials:24 - Trial = 10198/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.530 | DEBUG    | __main__:trials:29 - Trial = 10198/30000 | Total reward = 41.37
2022-01-26 14:17:14.533 | DEBUG    | __main__:trials:24 - Trial = 10199/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.534 | DEBUG    | __main__:trials:29 - Trial = 10199/30000 | Total reward = 44.14
2022-01-26 14:17:14.538 | DEBUG    | __main__:trials:24 - Trial = 10200/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.539 | DEBUG    | __main__:trials:29 - Trial = 10200/30000 | Total reward = 23.31
2022-01-26 14:17:14.542 | DEBUG    | __main__:trials:24 - Trial = 10201/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.544 | DEBUG    | __main__:trials:29 - Trial = 10201/30000 | Total reward = 30.03
2022-01-26 14:17:14.548 | DEBUG    | __main__:trials:24 - Trial = 10202/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.548 | DEBUG    | __main__:trials:29 - Trial = 10202/30000 | Total reward = 29.64
2022-01-26 14:17:14.552 | DEBUG    | __main__:trials:24 - Trial = 10203/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.554 | DEBUG    | __main__:trials:29 - Trial = 10203/30000 | Total reward = 26.82
2022-01-26 14:17:14.557 | DEBUG    | __main__:trials:24 - Trial = 10204/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.559 | DEBUG    | __main__:trials:29 - Trial = 10204/30000 | Total reward = 32.45
2022-01-26 14:17:14.562 | DEBUG    | __main__:trials:24 - Trial = 10205/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.564 | DEBUG    | __main__:trials:29 - Trial = 10205/30000 | Total reward = 29.23
2022-01-26 14:17:14.567 | DEBUG    | __main__:trials:24 - Trial = 10206/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.569 | DEBUG    | __main__:trials:29 - Trial = 10206/30000 | Total reward = 28.77
2022-01-26 14:17:14.572 | DEBUG    | __main__:trials:24 - Trial = 10207/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.573 | DEBUG    | __main__:trials:29 - Trial = 10207/30000 | Total reward = 46.61
2022-01-26 14:17:14.576 | DEBUG    | __main__:trials:26 - Trial = 10208/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.577 | DEBUG    | __main__:trials:29 - Trial = 10208/30000 | Total reward = 21.24
2022-01-26 14:17:14.580 | DEBUG    | __main__:trials:24 - Trial = 10209/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.582 | DEBUG    | __main__:trials:29 - Trial = 10209/30000 | Total reward = 24.49
2022-01-26 14:17:14.585 | DEBUG    | __main__:trials:24 - Trial = 10210/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.586 | DEBUG    | __main__:trials:29 - Trial = 10210/30000 | Total reward = 49.82
2022-01-26 14:17:14.589 | DEBUG    | __main__:trials:24 - Trial = 10211/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.591 | DEBUG    | __main__:trials:29 - Trial = 10211/30000 | Total reward = 27.10
2022-01-26 14:17:14.593 | DEBUG    | __main__:trials:26 - Trial = 10212/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.594 | DEBUG    | __main__:trials:29 - Trial = 10212/30000 | Total reward = 20.75
2022-01-26 14:17:14.597 | DEBUG    | __main__:trials:24 - Trial = 10213/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.598 | DEBUG    | __main__:trials:29 - Trial = 10213/30000 | Total reward = 38.59
2022-01-26 14:17:14.602 | DEBUG    | __main__:trials:24 - Trial = 10214/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.604 | DEBUG    | __main__:trials:29 - Trial = 10214/30000 | Total reward = 28.41
2022-01-26 14:17:14.607 | DEBUG    | __main__:trials:24 - Trial = 10215/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.607 | DEBUG    | __main__:trials:29 - Trial = 10215/30000 | Total reward = 33.17
2022-01-26 14:17:14.611 | DEBUG    | __main__:trials:24 - Trial = 10216/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.611 | DEBUG    | __main__:trials:29 - Trial = 10216/30000 | Total reward = 47.09
2022-01-26 14:17:14.615 | DEBUG    | __main__:trials:24 - Trial = 10217/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.616 | DEBUG    | __main__:trials:29 - Trial = 10217/30000 | Total reward = 28.93
2022-01-26 14:17:14.619 | DEBUG    | __main__:trials:24 - Trial = 10218/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.621 | DEBUG    | __main__:trials:29 - Trial = 10218/30000 | Total reward = 41.88
2022-01-26 14:17:14.622 | DEBUG    | __main__:trials:26 - Trial = 10219/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.624 | DEBUG    | __main__:trials:29 - Trial = 10219/30000 | Total reward = 6.97
2022-01-26 14:17:14.627 | DEBUG    | __main__:trials:24 - Trial = 10220/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.629 | DEBUG    | __main__:trials:29 - Trial = 10220/30000 | Total reward = 37.17
2022-01-26 14:17:14.632 | DEBUG    | __main__:trials:24 - Trial = 10221/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.634 | DEBUG    | __main__:trials:29 - Trial = 10221/30000 | Total reward = 32.80
2022-01-26 14:17:14.637 | DEBUG    | __main__:trials:24 - Trial = 10222/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.639 | DEBUG    | __main__:trials:29 - Trial = 10222/30000 | Total reward = 64.13
2022-01-26 14:17:14.642 | DEBUG    | __main__:trials:24 - Trial = 10223/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.643 | DEBUG    | __main__:trials:29 - Trial = 10223/30000 | Total reward = 41.27
2022-01-26 14:17:14.647 | DEBUG    | __main__:trials:24 - Trial = 10224/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.649 | DEBUG    | __main__:trials:29 - Trial = 10224/30000 | Total reward = 40.61
2022-01-26 14:17:14.652 | DEBUG    | __main__:trials:24 - Trial = 10225/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.654 | DEBUG    | __main__:trials:29 - Trial = 10225/30000 | Total reward = 39.66
2022-01-26 14:17:14.657 | DEBUG    | __main__:trials:24 - Trial = 10226/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.659 | DEBUG    | __main__:trials:29 - Trial = 10226/30000 | Total reward = 44.22
2022-01-26 14:17:14.663 | DEBUG    | __main__:trials:24 - Trial = 10227/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.664 | DEBUG    | __main__:trials:29 - Trial = 10227/30000 | Total reward = 41.07
2022-01-26 14:17:14.668 | DEBUG    | __main__:trials:24 - Trial = 10228/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.669 | DEBUG    | __main__:trials:29 - Trial = 10228/30000 | Total reward = 41.05
2022-01-26 14:17:14.672 | DEBUG    | __main__:trials:24 - Trial = 10229/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.674 | DEBUG    | __main__:trials:29 - Trial = 10229/30000 | Total reward = 41.27
2022-01-26 14:17:14.678 | DEBUG    | __main__:trials:24 - Trial = 10230/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.678 | DEBUG    | __main__:trials:29 - Trial = 10230/30000 | Total reward = 41.08
2022-01-26 14:17:14.682 | DEBUG    | __main__:trials:24 - Trial = 10231/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.684 | DEBUG    | __main__:trials:29 - Trial = 10231/30000 | Total reward = 41.72
2022-01-26 14:17:14.687 | DEBUG    | __main__:trials:24 - Trial = 10232/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.689 | DEBUG    | __main__:trials:29 - Trial = 10232/30000 | Total reward = 41.66
2022-01-26 14:17:14.692 | DEBUG    | __main__:trials:24 - Trial = 10233/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.694 | DEBUG    | __main__:trials:29 - Trial = 10233/30000 | Total reward = 45.22
2022-01-26 14:17:14.698 | DEBUG    | __main__:trials:26 - Trial = 10234/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.698 | DEBUG    | __main__:trials:29 - Trial = 10234/30000 | Total reward = 16.29
2022-01-26 14:17:14.703 | DEBUG    | __main__:trials:24 - Trial = 10235/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.704 | DEBUG    | __main__:trials:29 - Trial = 10235/30000 | Total reward = 44.20
2022-01-26 14:17:14.708 | DEBUG    | __main__:trials:24 - Trial = 10236/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.709 | DEBUG    | __main__:trials:29 - Trial = 10236/30000 | Total reward = 30.04
2022-01-26 14:17:14.712 | DEBUG    | __main__:trials:24 - Trial = 10237/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.714 | DEBUG    | __main__:trials:29 - Trial = 10237/30000 | Total reward = 58.87
2022-01-26 14:17:14.718 | DEBUG    | __main__:trials:24 - Trial = 10238/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.718 | DEBUG    | __main__:trials:29 - Trial = 10238/30000 | Total reward = 40.34
2022-01-26 14:17:14.723 | DEBUG    | __main__:trials:24 - Trial = 10239/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.723 | DEBUG    | __main__:trials:29 - Trial = 10239/30000 | Total reward = 20.89
2022-01-26 14:17:14.728 | DEBUG    | __main__:trials:24 - Trial = 10240/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.729 | DEBUG    | __main__:trials:29 - Trial = 10240/30000 | Total reward = 20.66
2022-01-26 14:17:14.731 | DEBUG    | __main__:trials:26 - Trial = 10241/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.733 | DEBUG    | __main__:trials:29 - Trial = 10241/30000 | Total reward = 8.95
2022-01-26 14:17:14.736 | DEBUG    | __main__:trials:24 - Trial = 10242/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.738 | DEBUG    | __main__:trials:29 - Trial = 10242/30000 | Total reward = 43.25
2022-01-26 14:17:14.740 | DEBUG    | __main__:trials:26 - Trial = 10243/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.742 | DEBUG    | __main__:trials:29 - Trial = 10243/30000 | Total reward = 7.84
2022-01-26 14:17:14.745 | DEBUG    | __main__:trials:24 - Trial = 10244/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.747 | DEBUG    | __main__:trials:29 - Trial = 10244/30000 | Total reward = 39.66
2022-01-26 14:17:14.750 | DEBUG    | __main__:trials:24 - Trial = 10245/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.752 | DEBUG    | __main__:trials:29 - Trial = 10245/30000 | Total reward = 21.96
2022-01-26 14:17:14.755 | DEBUG    | __main__:trials:24 - Trial = 10246/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.756 | DEBUG    | __main__:trials:29 - Trial = 10246/30000 | Total reward = 44.00
2022-01-26 14:17:14.759 | DEBUG    | __main__:trials:24 - Trial = 10247/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.761 | DEBUG    | __main__:trials:29 - Trial = 10247/30000 | Total reward = 30.03
2022-01-26 14:17:14.765 | DEBUG    | __main__:trials:24 - Trial = 10248/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.766 | DEBUG    | __main__:trials:29 - Trial = 10248/30000 | Total reward = 23.25
2022-01-26 14:17:14.770 | DEBUG    | __main__:trials:24 - Trial = 10249/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.771 | DEBUG    | __main__:trials:29 - Trial = 10249/30000 | Total reward = 38.10
2022-01-26 14:17:14.775 | DEBUG    | __main__:trials:24 - Trial = 10250/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.776 | DEBUG    | __main__:trials:29 - Trial = 10250/30000 | Total reward = 45.05
2022-01-26 14:17:14.779 | DEBUG    | __main__:trials:24 - Trial = 10251/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.781 | DEBUG    | __main__:trials:29 - Trial = 10251/30000 | Total reward = 43.23
2022-01-26 14:17:14.784 | DEBUG    | __main__:trials:24 - Trial = 10252/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.786 | DEBUG    | __main__:trials:29 - Trial = 10252/30000 | Total reward = 31.64
2022-01-26 14:17:14.789 | DEBUG    | __main__:trials:24 - Trial = 10253/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.790 | DEBUG    | __main__:trials:29 - Trial = 10253/30000 | Total reward = 34.66
2022-01-26 14:17:14.794 | DEBUG    | __main__:trials:24 - Trial = 10254/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.795 | DEBUG    | __main__:trials:29 - Trial = 10254/30000 | Total reward = 41.98
2022-01-26 14:17:14.799 | DEBUG    | __main__:trials:24 - Trial = 10255/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.800 | DEBUG    | __main__:trials:29 - Trial = 10255/30000 | Total reward = 46.32
2022-01-26 14:17:14.804 | DEBUG    | __main__:trials:24 - Trial = 10256/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.805 | DEBUG    | __main__:trials:29 - Trial = 10256/30000 | Total reward = 44.40
2022-01-26 14:17:14.808 | DEBUG    | __main__:trials:24 - Trial = 10257/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.810 | DEBUG    | __main__:trials:29 - Trial = 10257/30000 | Total reward = 39.89
2022-01-26 14:17:14.814 | DEBUG    | __main__:trials:24 - Trial = 10258/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.814 | DEBUG    | __main__:trials:29 - Trial = 10258/30000 | Total reward = 35.45
2022-01-26 14:17:14.819 | DEBUG    | __main__:trials:24 - Trial = 10259/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.820 | DEBUG    | __main__:trials:29 - Trial = 10259/30000 | Total reward = 41.08
2022-01-26 14:17:14.823 | DEBUG    | __main__:trials:24 - Trial = 10260/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.825 | DEBUG    | __main__:trials:29 - Trial = 10260/30000 | Total reward = 42.43
2022-01-26 14:17:14.828 | DEBUG    | __main__:trials:24 - Trial = 10261/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.829 | DEBUG    | __main__:trials:29 - Trial = 10261/30000 | Total reward = 39.93
2022-01-26 14:17:14.833 | DEBUG    | __main__:trials:24 - Trial = 10262/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.835 | DEBUG    | __main__:trials:29 - Trial = 10262/30000 | Total reward = 45.03
2022-01-26 14:17:14.839 | DEBUG    | __main__:trials:24 - Trial = 10263/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.839 | DEBUG    | __main__:trials:29 - Trial = 10263/30000 | Total reward = 42.58
2022-01-26 14:17:14.844 | DEBUG    | __main__:trials:24 - Trial = 10264/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.844 | DEBUG    | __main__:trials:29 - Trial = 10264/30000 | Total reward = 29.31
2022-01-26 14:17:14.849 | DEBUG    | __main__:trials:24 - Trial = 10265/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.851 | DEBUG    | __main__:trials:29 - Trial = 10265/30000 | Total reward = 10.16
2022-01-26 14:17:14.855 | DEBUG    | __main__:trials:24 - Trial = 10266/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.855 | DEBUG    | __main__:trials:29 - Trial = 10266/30000 | Total reward = 37.18
2022-01-26 14:17:14.860 | DEBUG    | __main__:trials:24 - Trial = 10267/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.860 | DEBUG    | __main__:trials:29 - Trial = 10267/30000 | Total reward = 50.48
2022-01-26 14:17:14.865 | DEBUG    | __main__:trials:24 - Trial = 10268/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.866 | DEBUG    | __main__:trials:29 - Trial = 10268/30000 | Total reward = 45.04
2022-01-26 14:17:14.869 | DEBUG    | __main__:trials:24 - Trial = 10269/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.870 | DEBUG    | __main__:trials:29 - Trial = 10269/30000 | Total reward = 53.83
2022-01-26 14:17:14.874 | DEBUG    | __main__:trials:24 - Trial = 10270/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.874 | DEBUG    | __main__:trials:29 - Trial = 10270/30000 | Total reward = 32.92
2022-01-26 14:17:14.878 | DEBUG    | __main__:trials:24 - Trial = 10271/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.879 | DEBUG    | __main__:trials:29 - Trial = 10271/30000 | Total reward = 46.82
2022-01-26 14:17:14.882 | DEBUG    | __main__:trials:24 - Trial = 10272/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.884 | DEBUG    | __main__:trials:29 - Trial = 10272/30000 | Total reward = 28.36
2022-01-26 14:17:14.888 | DEBUG    | __main__:trials:24 - Trial = 10273/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.888 | DEBUG    | __main__:trials:29 - Trial = 10273/30000 | Total reward = 29.25
2022-01-26 14:17:14.892 | DEBUG    | __main__:trials:24 - Trial = 10274/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.893 | DEBUG    | __main__:trials:29 - Trial = 10274/30000 | Total reward = 50.23
2022-01-26 14:17:14.896 | DEBUG    | __main__:trials:24 - Trial = 10275/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.898 | DEBUG    | __main__:trials:29 - Trial = 10275/30000 | Total reward = 29.61
2022-01-26 14:17:14.901 | DEBUG    | __main__:trials:24 - Trial = 10276/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.903 | DEBUG    | __main__:trials:29 - Trial = 10276/30000 | Total reward = 29.99
2022-01-26 14:17:14.905 | DEBUG    | __main__:trials:26 - Trial = 10277/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.907 | DEBUG    | __main__:trials:29 - Trial = 10277/30000 | Total reward = 12.27
2022-01-26 14:17:14.911 | DEBUG    | __main__:trials:24 - Trial = 10278/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.912 | DEBUG    | __main__:trials:29 - Trial = 10278/30000 | Total reward = 34.21
2022-01-26 14:17:14.916 | DEBUG    | __main__:trials:24 - Trial = 10279/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.918 | DEBUG    | __main__:trials:29 - Trial = 10279/30000 | Total reward = 29.27
2022-01-26 14:17:14.921 | DEBUG    | __main__:trials:24 - Trial = 10280/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.923 | DEBUG    | __main__:trials:29 - Trial = 10280/30000 | Total reward = 54.04
2022-01-26 14:17:14.927 | DEBUG    | __main__:trials:24 - Trial = 10281/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.928 | DEBUG    | __main__:trials:29 - Trial = 10281/30000 | Total reward = 51.00
2022-01-26 14:17:14.931 | DEBUG    | __main__:trials:26 - Trial = 10282/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.932 | DEBUG    | __main__:trials:29 - Trial = 10282/30000 | Total reward = 12.93
2022-01-26 14:17:14.936 | DEBUG    | __main__:trials:24 - Trial = 10283/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.937 | DEBUG    | __main__:trials:29 - Trial = 10283/30000 | Total reward = 47.18
2022-01-26 14:17:14.941 | DEBUG    | __main__:trials:24 - Trial = 10284/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.942 | DEBUG    | __main__:trials:29 - Trial = 10284/30000 | Total reward = 50.80
2022-01-26 14:17:14.946 | DEBUG    | __main__:trials:24 - Trial = 10285/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.947 | DEBUG    | __main__:trials:29 - Trial = 10285/30000 | Total reward = 26.00
2022-01-26 14:17:14.950 | DEBUG    | __main__:trials:26 - Trial = 10286/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.951 | DEBUG    | __main__:trials:29 - Trial = 10286/30000 | Total reward = 14.35
2022-01-26 14:17:14.955 | DEBUG    | __main__:trials:24 - Trial = 10287/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.956 | DEBUG    | __main__:trials:29 - Trial = 10287/30000 | Total reward = 27.86
2022-01-26 14:17:14.960 | DEBUG    | __main__:trials:24 - Trial = 10288/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.962 | DEBUG    | __main__:trials:29 - Trial = 10288/30000 | Total reward = 27.22
2022-01-26 14:17:14.965 | DEBUG    | __main__:trials:24 - Trial = 10289/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.966 | DEBUG    | __main__:trials:29 - Trial = 10289/30000 | Total reward = 30.10
2022-01-26 14:17:14.970 | DEBUG    | __main__:trials:24 - Trial = 10290/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.970 | DEBUG    | __main__:trials:29 - Trial = 10290/30000 | Total reward = 38.17
2022-01-26 14:17:14.975 | DEBUG    | __main__:trials:24 - Trial = 10291/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.975 | DEBUG    | __main__:trials:29 - Trial = 10291/30000 | Total reward = 24.35
2022-01-26 14:17:14.979 | DEBUG    | __main__:trials:24 - Trial = 10292/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.981 | DEBUG    | __main__:trials:29 - Trial = 10292/30000 | Total reward = 24.22
2022-01-26 14:17:14.984 | DEBUG    | __main__:trials:24 - Trial = 10293/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.985 | DEBUG    | __main__:trials:29 - Trial = 10293/30000 | Total reward = 40.41
2022-01-26 14:17:14.988 | DEBUG    | __main__:trials:24 - Trial = 10294/30000 | Max number of steps (20) reached
2022-01-26 14:17:14.990 | DEBUG    | __main__:trials:29 - Trial = 10294/30000 | Total reward = 32.28
2022-01-26 14:17:14.991 | DEBUG    | __main__:trials:26 - Trial = 10295/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.992 | DEBUG    | __main__:trials:29 - Trial = 10295/30000 | Total reward = 7.12
2022-01-26 14:17:14.994 | DEBUG    | __main__:trials:26 - Trial = 10296/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:14.996 | DEBUG    | __main__:trials:29 - Trial = 10296/30000 | Total reward = 8.64
2022-01-26 14:17:14.999 | DEBUG    | __main__:trials:24 - Trial = 10297/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.000 | DEBUG    | __main__:trials:29 - Trial = 10297/30000 | Total reward = 32.97
2022-01-26 14:17:15.004 | DEBUG    | __main__:trials:24 - Trial = 10298/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.006 | DEBUG    | __main__:trials:29 - Trial = 10298/30000 | Total reward = 27.81
2022-01-26 14:17:15.010 | DEBUG    | __main__:trials:24 - Trial = 10299/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.010 | DEBUG    | __main__:trials:29 - Trial = 10299/30000 | Total reward = 42.96
2022-01-26 14:17:15.015 | DEBUG    | __main__:trials:24 - Trial = 10300/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.016 | DEBUG    | __main__:trials:29 - Trial = 10300/30000 | Total reward = 46.93
2022-01-26 14:17:15.020 | DEBUG    | __main__:trials:24 - Trial = 10301/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.022 | DEBUG    | __main__:trials:29 - Trial = 10301/30000 | Total reward = 40.42
2022-01-26 14:17:15.025 | DEBUG    | __main__:trials:24 - Trial = 10302/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.026 | DEBUG    | __main__:trials:29 - Trial = 10302/30000 | Total reward = 28.82
2022-01-26 14:17:15.030 | DEBUG    | __main__:trials:24 - Trial = 10303/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.031 | DEBUG    | __main__:trials:29 - Trial = 10303/30000 | Total reward = 30.29
2022-01-26 14:17:15.035 | DEBUG    | __main__:trials:24 - Trial = 10304/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.036 | DEBUG    | __main__:trials:29 - Trial = 10304/30000 | Total reward = 29.33
2022-01-26 14:17:15.040 | DEBUG    | __main__:trials:24 - Trial = 10305/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.042 | DEBUG    | __main__:trials:29 - Trial = 10305/30000 | Total reward = 38.56
2022-01-26 14:17:15.045 | DEBUG    | __main__:trials:24 - Trial = 10306/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.047 | DEBUG    | __main__:trials:29 - Trial = 10306/30000 | Total reward = 57.13
2022-01-26 14:17:15.050 | DEBUG    | __main__:trials:24 - Trial = 10307/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.051 | DEBUG    | __main__:trials:29 - Trial = 10307/30000 | Total reward = 29.14
2022-01-26 14:17:15.054 | DEBUG    | __main__:trials:24 - Trial = 10308/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.056 | DEBUG    | __main__:trials:29 - Trial = 10308/30000 | Total reward = 37.60
2022-01-26 14:17:15.059 | DEBUG    | __main__:trials:24 - Trial = 10309/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.061 | DEBUG    | __main__:trials:29 - Trial = 10309/30000 | Total reward = 32.72
2022-01-26 14:17:15.064 | DEBUG    | __main__:trials:24 - Trial = 10310/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.066 | DEBUG    | __main__:trials:29 - Trial = 10310/30000 | Total reward = 36.49
2022-01-26 14:17:15.069 | DEBUG    | __main__:trials:24 - Trial = 10311/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.071 | DEBUG    | __main__:trials:29 - Trial = 10311/30000 | Total reward = 40.31
2022-01-26 14:17:15.074 | DEBUG    | __main__:trials:24 - Trial = 10312/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.075 | DEBUG    | __main__:trials:29 - Trial = 10312/30000 | Total reward = 29.33
2022-01-26 14:17:15.079 | DEBUG    | __main__:trials:24 - Trial = 10313/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.081 | DEBUG    | __main__:trials:29 - Trial = 10313/30000 | Total reward = 42.30
2022-01-26 14:17:15.084 | DEBUG    | __main__:trials:24 - Trial = 10314/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.085 | DEBUG    | __main__:trials:29 - Trial = 10314/30000 | Total reward = 47.05
2022-01-26 14:17:15.089 | DEBUG    | __main__:trials:24 - Trial = 10315/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.090 | DEBUG    | __main__:trials:29 - Trial = 10315/30000 | Total reward = 61.67
2022-01-26 14:17:15.094 | DEBUG    | __main__:trials:24 - Trial = 10316/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.095 | DEBUG    | __main__:trials:29 - Trial = 10316/30000 | Total reward = 50.20
2022-01-26 14:17:15.098 | DEBUG    | __main__:trials:26 - Trial = 10317/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:15.099 | DEBUG    | __main__:trials:29 - Trial = 10317/30000 | Total reward = 23.14
2022-01-26 14:17:15.103 | DEBUG    | __main__:trials:26 - Trial = 10318/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:15.105 | DEBUG    | __main__:trials:29 - Trial = 10318/30000 | Total reward = 15.56
2022-01-26 14:17:15.108 | DEBUG    | __main__:trials:24 - Trial = 10319/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.109 | DEBUG    | __main__:trials:29 - Trial = 10319/30000 | Total reward = 45.39
2022-01-26 14:17:15.113 | DEBUG    | __main__:trials:24 - Trial = 10320/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.115 | DEBUG    | __main__:trials:29 - Trial = 10320/30000 | Total reward = 46.44
2022-01-26 14:17:15.118 | DEBUG    | __main__:trials:24 - Trial = 10321/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.120 | DEBUG    | __main__:trials:29 - Trial = 10321/30000 | Total reward = 41.96
2022-01-26 14:17:15.123 | DEBUG    | __main__:trials:24 - Trial = 10322/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.125 | DEBUG    | __main__:trials:29 - Trial = 10322/30000 | Total reward = 32.25
2022-01-26 14:17:15.128 | DEBUG    | __main__:trials:24 - Trial = 10323/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.129 | DEBUG    | __main__:trials:29 - Trial = 10323/30000 | Total reward = 43.25
2022-01-26 14:17:15.133 | DEBUG    | __main__:trials:24 - Trial = 10324/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.135 | DEBUG    | __main__:trials:29 - Trial = 10324/30000 | Total reward = 40.29
2022-01-26 14:17:15.137 | DEBUG    | __main__:trials:24 - Trial = 10325/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.139 | DEBUG    | __main__:trials:29 - Trial = 10325/30000 | Total reward = 42.07
2022-01-26 14:17:15.143 | DEBUG    | __main__:trials:24 - Trial = 10326/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.144 | DEBUG    | __main__:trials:29 - Trial = 10326/30000 | Total reward = 30.72
2022-01-26 14:17:15.148 | DEBUG    | __main__:trials:24 - Trial = 10327/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.149 | DEBUG    | __main__:trials:29 - Trial = 10327/30000 | Total reward = 43.74
2022-01-26 14:17:15.152 | DEBUG    | __main__:trials:24 - Trial = 10328/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.154 | DEBUG    | __main__:trials:29 - Trial = 10328/30000 | Total reward = 55.15
2022-01-26 14:17:15.157 | DEBUG    | __main__:trials:24 - Trial = 10329/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.158 | DEBUG    | __main__:trials:29 - Trial = 10329/30000 | Total reward = 28.32
2022-01-26 14:17:15.162 | DEBUG    | __main__:trials:24 - Trial = 10330/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.163 | DEBUG    | __main__:trials:29 - Trial = 10330/30000 | Total reward = 56.49
2022-01-26 14:17:15.166 | DEBUG    | __main__:trials:24 - Trial = 10331/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.167 | DEBUG    | __main__:trials:29 - Trial = 10331/30000 | Total reward = 39.22
2022-01-26 14:17:15.170 | DEBUG    | __main__:trials:24 - Trial = 10332/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.171 | DEBUG    | __main__:trials:29 - Trial = 10332/30000 | Total reward = 41.16
2022-01-26 14:17:15.175 | DEBUG    | __main__:trials:24 - Trial = 10333/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.175 | DEBUG    | __main__:trials:29 - Trial = 10333/30000 | Total reward = 41.01
2022-01-26 14:17:15.180 | DEBUG    | __main__:trials:24 - Trial = 10334/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.181 | DEBUG    | __main__:trials:29 - Trial = 10334/30000 | Total reward = 39.20
2022-01-26 14:17:15.184 | DEBUG    | __main__:trials:24 - Trial = 10335/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.186 | DEBUG    | __main__:trials:29 - Trial = 10335/30000 | Total reward = 46.61
2022-01-26 14:17:15.190 | DEBUG    | __main__:trials:24 - Trial = 10336/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.190 | DEBUG    | __main__:trials:29 - Trial = 10336/30000 | Total reward = 36.53
2022-01-26 14:17:15.194 | DEBUG    | __main__:trials:24 - Trial = 10337/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.196 | DEBUG    | __main__:trials:29 - Trial = 10337/30000 | Total reward = 49.32
2022-01-26 14:17:15.199 | DEBUG    | __main__:trials:24 - Trial = 10338/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.200 | DEBUG    | __main__:trials:29 - Trial = 10338/30000 | Total reward = 48.10
2022-01-26 14:17:15.204 | DEBUG    | __main__:trials:24 - Trial = 10339/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.206 | DEBUG    | __main__:trials:29 - Trial = 10339/30000 | Total reward = 41.42
2022-01-26 14:17:15.209 | DEBUG    | __main__:trials:24 - Trial = 10340/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.210 | DEBUG    | __main__:trials:29 - Trial = 10340/30000 | Total reward = 41.51
2022-01-26 14:17:15.214 | DEBUG    | __main__:trials:24 - Trial = 10341/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.216 | DEBUG    | __main__:trials:29 - Trial = 10341/30000 | Total reward = 28.68
2022-01-26 14:17:15.218 | DEBUG    | __main__:trials:24 - Trial = 10342/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.220 | DEBUG    | __main__:trials:29 - Trial = 10342/30000 | Total reward = 36.67
2022-01-26 14:17:15.223 | DEBUG    | __main__:trials:24 - Trial = 10343/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.225 | DEBUG    | __main__:trials:29 - Trial = 10343/30000 | Total reward = 32.42
2022-01-26 14:17:15.228 | DEBUG    | __main__:trials:24 - Trial = 10344/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.230 | DEBUG    | __main__:trials:29 - Trial = 10344/30000 | Total reward = 38.97
2022-01-26 14:17:15.234 | DEBUG    | __main__:trials:24 - Trial = 10345/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.234 | DEBUG    | __main__:trials:29 - Trial = 10345/30000 | Total reward = 36.98
2022-01-26 14:17:15.239 | DEBUG    | __main__:trials:24 - Trial = 10346/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.240 | DEBUG    | __main__:trials:29 - Trial = 10346/30000 | Total reward = 39.51
2022-01-26 14:17:15.244 | DEBUG    | __main__:trials:24 - Trial = 10347/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.245 | DEBUG    | __main__:trials:29 - Trial = 10347/30000 | Total reward = 33.50
2022-01-26 14:17:15.249 | DEBUG    | __main__:trials:24 - Trial = 10348/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.250 | DEBUG    | __main__:trials:29 - Trial = 10348/30000 | Total reward = 41.70
2022-01-26 14:17:15.254 | DEBUG    | __main__:trials:24 - Trial = 10349/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.255 | DEBUG    | __main__:trials:29 - Trial = 10349/30000 | Total reward = 41.20
2022-01-26 14:17:15.259 | DEBUG    | __main__:trials:24 - Trial = 10350/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.260 | DEBUG    | __main__:trials:29 - Trial = 10350/30000 | Total reward = 26.75
2022-01-26 14:17:15.263 | DEBUG    | __main__:trials:24 - Trial = 10351/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.265 | DEBUG    | __main__:trials:29 - Trial = 10351/30000 | Total reward = 44.13
2022-01-26 14:17:15.268 | DEBUG    | __main__:trials:24 - Trial = 10352/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.270 | DEBUG    | __main__:trials:29 - Trial = 10352/30000 | Total reward = 46.60
2022-01-26 14:17:15.273 | DEBUG    | __main__:trials:24 - Trial = 10353/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.275 | DEBUG    | __main__:trials:29 - Trial = 10353/30000 | Total reward = 32.15
2022-01-26 14:17:15.278 | DEBUG    | __main__:trials:24 - Trial = 10354/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.280 | DEBUG    | __main__:trials:29 - Trial = 10354/30000 | Total reward = 40.04
2022-01-26 14:17:15.284 | DEBUG    | __main__:trials:24 - Trial = 10355/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.285 | DEBUG    | __main__:trials:29 - Trial = 10355/30000 | Total reward = 32.20
2022-01-26 14:17:15.288 | DEBUG    | __main__:trials:24 - Trial = 10356/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.290 | DEBUG    | __main__:trials:29 - Trial = 10356/30000 | Total reward = 42.58
2022-01-26 14:17:15.294 | DEBUG    | __main__:trials:24 - Trial = 10357/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.294 | DEBUG    | __main__:trials:29 - Trial = 10357/30000 | Total reward = 45.77
2022-01-26 14:17:15.299 | DEBUG    | __main__:trials:24 - Trial = 10358/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.299 | DEBUG    | __main__:trials:29 - Trial = 10358/30000 | Total reward = 41.32
2022-01-26 14:17:15.302 | DEBUG    | __main__:trials:24 - Trial = 10359/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.303 | DEBUG    | __main__:trials:29 - Trial = 10359/30000 | Total reward = 45.34
2022-01-26 14:17:15.306 | DEBUG    | __main__:trials:24 - Trial = 10360/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.308 | DEBUG    | __main__:trials:29 - Trial = 10360/30000 | Total reward = 33.85
2022-01-26 14:17:15.311 | DEBUG    | __main__:trials:24 - Trial = 10361/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.313 | DEBUG    | __main__:trials:29 - Trial = 10361/30000 | Total reward = 41.31
2022-01-26 14:17:15.316 | DEBUG    | __main__:trials:26 - Trial = 10362/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:15.317 | DEBUG    | __main__:trials:29 - Trial = 10362/30000 | Total reward = 19.79
2022-01-26 14:17:15.320 | DEBUG    | __main__:trials:24 - Trial = 10363/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.321 | DEBUG    | __main__:trials:29 - Trial = 10363/30000 | Total reward = 28.51
2022-01-26 14:17:15.325 | DEBUG    | __main__:trials:24 - Trial = 10364/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.325 | DEBUG    | __main__:trials:29 - Trial = 10364/30000 | Total reward = 37.35
2022-01-26 14:17:15.329 | DEBUG    | __main__:trials:24 - Trial = 10365/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.329 | DEBUG    | __main__:trials:29 - Trial = 10365/30000 | Total reward = 45.83
2022-01-26 14:17:15.333 | DEBUG    | __main__:trials:24 - Trial = 10366/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.335 | DEBUG    | __main__:trials:29 - Trial = 10366/30000 | Total reward = 40.92
2022-01-26 14:17:15.338 | DEBUG    | __main__:trials:24 - Trial = 10367/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.340 | DEBUG    | __main__:trials:29 - Trial = 10367/30000 | Total reward = 35.58
2022-01-26 14:17:15.343 | DEBUG    | __main__:trials:24 - Trial = 10368/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.344 | DEBUG    | __main__:trials:29 - Trial = 10368/30000 | Total reward = 52.66
2022-01-26 14:17:15.348 | DEBUG    | __main__:trials:24 - Trial = 10369/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.349 | DEBUG    | __main__:trials:29 - Trial = 10369/30000 | Total reward = 41.81
2022-01-26 14:17:15.352 | DEBUG    | __main__:trials:24 - Trial = 10370/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.353 | DEBUG    | __main__:trials:29 - Trial = 10370/30000 | Total reward = 39.69
2022-01-26 14:17:15.357 | DEBUG    | __main__:trials:24 - Trial = 10371/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.357 | DEBUG    | __main__:trials:29 - Trial = 10371/30000 | Total reward = 47.81
2022-01-26 14:17:15.361 | DEBUG    | __main__:trials:24 - Trial = 10372/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.362 | DEBUG    | __main__:trials:29 - Trial = 10372/30000 | Total reward = 35.69
2022-01-26 14:17:15.365 | DEBUG    | __main__:trials:24 - Trial = 10373/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.367 | DEBUG    | __main__:trials:29 - Trial = 10373/30000 | Total reward = 25.44
2022-01-26 14:17:15.370 | DEBUG    | __main__:trials:24 - Trial = 10374/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.370 | DEBUG    | __main__:trials:29 - Trial = 10374/30000 | Total reward = 39.32
2022-01-26 14:17:15.374 | DEBUG    | __main__:trials:24 - Trial = 10375/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.375 | DEBUG    | __main__:trials:29 - Trial = 10375/30000 | Total reward = 45.59
2022-01-26 14:17:15.379 | DEBUG    | __main__:trials:24 - Trial = 10376/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.380 | DEBUG    | __main__:trials:29 - Trial = 10376/30000 | Total reward = 34.38
2022-01-26 14:17:15.384 | DEBUG    | __main__:trials:24 - Trial = 10377/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.385 | DEBUG    | __main__:trials:29 - Trial = 10377/30000 | Total reward = 35.54
2022-01-26 14:17:15.389 | DEBUG    | __main__:trials:24 - Trial = 10378/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.390 | DEBUG    | __main__:trials:29 - Trial = 10378/30000 | Total reward = 50.66
2022-01-26 14:17:15.393 | DEBUG    | __main__:trials:24 - Trial = 10379/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.394 | DEBUG    | __main__:trials:29 - Trial = 10379/30000 | Total reward = 39.82
2022-01-26 14:17:15.397 | DEBUG    | __main__:trials:24 - Trial = 10380/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.399 | DEBUG    | __main__:trials:29 - Trial = 10380/30000 | Total reward = 40.33
2022-01-26 14:17:15.402 | DEBUG    | __main__:trials:24 - Trial = 10381/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.403 | DEBUG    | __main__:trials:29 - Trial = 10381/30000 | Total reward = 44.82
2022-01-26 14:17:15.407 | DEBUG    | __main__:trials:24 - Trial = 10382/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.408 | DEBUG    | __main__:trials:29 - Trial = 10382/30000 | Total reward = 32.48
2022-01-26 14:17:15.412 | DEBUG    | __main__:trials:24 - Trial = 10383/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.414 | DEBUG    | __main__:trials:29 - Trial = 10383/30000 | Total reward = 40.25
2022-01-26 14:17:15.417 | DEBUG    | __main__:trials:24 - Trial = 10384/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.418 | DEBUG    | __main__:trials:29 - Trial = 10384/30000 | Total reward = 32.29
2022-01-26 14:17:15.422 | DEBUG    | __main__:trials:24 - Trial = 10385/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.423 | DEBUG    | __main__:trials:29 - Trial = 10385/30000 | Total reward = 36.76
2022-01-26 14:17:15.427 | DEBUG    | __main__:trials:24 - Trial = 10386/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.428 | DEBUG    | __main__:trials:29 - Trial = 10386/30000 | Total reward = 24.27
2022-01-26 14:17:15.432 | DEBUG    | __main__:trials:24 - Trial = 10387/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.433 | DEBUG    | __main__:trials:29 - Trial = 10387/30000 | Total reward = 44.69
2022-01-26 14:17:15.437 | DEBUG    | __main__:trials:24 - Trial = 10388/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.438 | DEBUG    | __main__:trials:29 - Trial = 10388/30000 | Total reward = 34.67
2022-01-26 14:17:15.442 | DEBUG    | __main__:trials:24 - Trial = 10389/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.444 | DEBUG    | __main__:trials:29 - Trial = 10389/30000 | Total reward = 42.57
2022-01-26 14:17:15.447 | DEBUG    | __main__:trials:24 - Trial = 10390/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.448 | DEBUG    | __main__:trials:29 - Trial = 10390/30000 | Total reward = 31.89
2022-01-26 14:17:15.452 | DEBUG    | __main__:trials:24 - Trial = 10391/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.453 | DEBUG    | __main__:trials:29 - Trial = 10391/30000 | Total reward = 43.65
2022-01-26 14:17:15.455 | DEBUG    | __main__:trials:26 - Trial = 10392/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:15.457 | DEBUG    | __main__:trials:29 - Trial = 10392/30000 | Total reward = 14.11
2022-01-26 14:17:15.461 | DEBUG    | __main__:trials:24 - Trial = 10393/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.462 | DEBUG    | __main__:trials:29 - Trial = 10393/30000 | Total reward = 30.24
2022-01-26 14:17:15.466 | DEBUG    | __main__:trials:24 - Trial = 10394/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.467 | DEBUG    | __main__:trials:29 - Trial = 10394/30000 | Total reward = 43.21
2022-01-26 14:17:15.471 | DEBUG    | __main__:trials:24 - Trial = 10395/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.472 | DEBUG    | __main__:trials:29 - Trial = 10395/30000 | Total reward = 32.27
2022-01-26 14:17:15.476 | DEBUG    | __main__:trials:24 - Trial = 10396/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.477 | DEBUG    | __main__:trials:29 - Trial = 10396/30000 | Total reward = 41.33
2022-01-26 14:17:15.480 | DEBUG    | __main__:trials:24 - Trial = 10397/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.482 | DEBUG    | __main__:trials:29 - Trial = 10397/30000 | Total reward = 28.80
2022-01-26 14:17:15.486 | DEBUG    | __main__:trials:24 - Trial = 10398/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.486 | DEBUG    | __main__:trials:29 - Trial = 10398/30000 | Total reward = 42.00
2022-01-26 14:17:15.489 | DEBUG    | __main__:trials:26 - Trial = 10399/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:15.491 | DEBUG    | __main__:trials:29 - Trial = 10399/30000 | Total reward = 17.41
2022-01-26 14:17:15.494 | DEBUG    | __main__:trials:24 - Trial = 10400/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.496 | DEBUG    | __main__:trials:29 - Trial = 10400/30000 | Total reward = 31.32
2022-01-26 14:17:15.500 | DEBUG    | __main__:trials:24 - Trial = 10401/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.501 | DEBUG    | __main__:trials:29 - Trial = 10401/30000 | Total reward = 33.40
2022-01-26 14:17:15.505 | DEBUG    | __main__:trials:24 - Trial = 10402/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.506 | DEBUG    | __main__:trials:29 - Trial = 10402/30000 | Total reward = 33.82
2022-01-26 14:17:15.510 | DEBUG    | __main__:trials:24 - Trial = 10403/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.511 | DEBUG    | __main__:trials:29 - Trial = 10403/30000 | Total reward = 28.68
2022-01-26 14:17:15.515 | DEBUG    | __main__:trials:24 - Trial = 10404/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.516 | DEBUG    | __main__:trials:29 - Trial = 10404/30000 | Total reward = 22.64
2022-01-26 14:17:15.519 | DEBUG    | __main__:trials:24 - Trial = 10405/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.521 | DEBUG    | __main__:trials:29 - Trial = 10405/30000 | Total reward = 15.94
2022-01-26 14:17:15.525 | DEBUG    | __main__:trials:24 - Trial = 10406/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.525 | DEBUG    | __main__:trials:29 - Trial = 10406/30000 | Total reward = 34.15
2022-01-26 14:17:15.528 | DEBUG    | __main__:trials:24 - Trial = 10407/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.529 | DEBUG    | __main__:trials:29 - Trial = 10407/30000 | Total reward = 31.96
2022-01-26 14:17:15.533 | DEBUG    | __main__:trials:24 - Trial = 10408/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.534 | DEBUG    | __main__:trials:29 - Trial = 10408/30000 | Total reward = 28.99
2022-01-26 14:17:15.537 | DEBUG    | __main__:trials:24 - Trial = 10409/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.539 | DEBUG    | __main__:trials:29 - Trial = 10409/30000 | Total reward = 27.42
2022-01-26 14:17:15.542 | DEBUG    | __main__:trials:24 - Trial = 10410/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.543 | DEBUG    | __main__:trials:29 - Trial = 10410/30000 | Total reward = 27.61
2022-01-26 14:17:15.546 | DEBUG    | __main__:trials:24 - Trial = 10411/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.548 | DEBUG    | __main__:trials:29 - Trial = 10411/30000 | Total reward = 31.03
2022-01-26 14:17:15.552 | DEBUG    | __main__:trials:24 - Trial = 10412/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.553 | DEBUG    | __main__:trials:29 - Trial = 10412/30000 | Total reward = 50.78
2022-01-26 14:17:15.557 | DEBUG    | __main__:trials:24 - Trial = 10413/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.559 | DEBUG    | __main__:trials:29 - Trial = 10413/30000 | Total reward = 42.06
2022-01-26 14:17:15.562 | DEBUG    | __main__:trials:24 - Trial = 10414/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.564 | DEBUG    | __main__:trials:29 - Trial = 10414/30000 | Total reward = 56.93
2022-01-26 14:17:15.568 | DEBUG    | __main__:trials:24 - Trial = 10415/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.569 | DEBUG    | __main__:trials:29 - Trial = 10415/30000 | Total reward = 34.61
2022-01-26 14:17:15.573 | DEBUG    | __main__:trials:24 - Trial = 10416/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.574 | DEBUG    | __main__:trials:29 - Trial = 10416/30000 | Total reward = 38.71
2022-01-26 14:17:15.578 | DEBUG    | __main__:trials:24 - Trial = 10417/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.579 | DEBUG    | __main__:trials:29 - Trial = 10417/30000 | Total reward = 49.12
2022-01-26 14:17:15.583 | DEBUG    | __main__:trials:24 - Trial = 10418/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.585 | DEBUG    | __main__:trials:29 - Trial = 10418/30000 | Total reward = 41.31
2022-01-26 14:17:15.589 | DEBUG    | __main__:trials:24 - Trial = 10419/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.590 | DEBUG    | __main__:trials:29 - Trial = 10419/30000 | Total reward = 47.85
2022-01-26 14:17:15.593 | DEBUG    | __main__:trials:24 - Trial = 10420/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.595 | DEBUG    | __main__:trials:29 - Trial = 10420/30000 | Total reward = 39.03
2022-01-26 14:17:15.598 | DEBUG    | __main__:trials:24 - Trial = 10421/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.598 | DEBUG    | __main__:trials:29 - Trial = 10421/30000 | Total reward = 49.32
2022-01-26 14:17:15.602 | DEBUG    | __main__:trials:24 - Trial = 10422/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.604 | DEBUG    | __main__:trials:29 - Trial = 10422/30000 | Total reward = 43.20
2022-01-26 14:17:15.608 | DEBUG    | __main__:trials:24 - Trial = 10423/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.610 | DEBUG    | __main__:trials:29 - Trial = 10423/30000 | Total reward = 46.06
2022-01-26 14:17:15.614 | DEBUG    | __main__:trials:24 - Trial = 10424/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.615 | DEBUG    | __main__:trials:29 - Trial = 10424/30000 | Total reward = 41.96
2022-01-26 14:17:15.618 | DEBUG    | __main__:trials:24 - Trial = 10425/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.620 | DEBUG    | __main__:trials:29 - Trial = 10425/30000 | Total reward = 47.64
2022-01-26 14:17:15.624 | DEBUG    | __main__:trials:24 - Trial = 10426/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.624 | DEBUG    | __main__:trials:29 - Trial = 10426/30000 | Total reward = 40.56
2022-01-26 14:17:15.629 | DEBUG    | __main__:trials:24 - Trial = 10427/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.630 | DEBUG    | __main__:trials:29 - Trial = 10427/30000 | Total reward = 32.95
2022-01-26 14:17:15.634 | DEBUG    | __main__:trials:24 - Trial = 10428/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.634 | DEBUG    | __main__:trials:29 - Trial = 10428/30000 | Total reward = 40.59
2022-01-26 14:17:15.639 | DEBUG    | __main__:trials:24 - Trial = 10429/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.641 | DEBUG    | __main__:trials:29 - Trial = 10429/30000 | Total reward = 42.54
2022-01-26 14:17:15.644 | DEBUG    | __main__:trials:24 - Trial = 10430/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.645 | DEBUG    | __main__:trials:29 - Trial = 10430/30000 | Total reward = 37.08
2022-01-26 14:17:15.650 | DEBUG    | __main__:trials:24 - Trial = 10431/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.651 | DEBUG    | __main__:trials:29 - Trial = 10431/30000 | Total reward = 59.83
2022-01-26 14:17:15.655 | DEBUG    | __main__:trials:24 - Trial = 10432/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.656 | DEBUG    | __main__:trials:29 - Trial = 10432/30000 | Total reward = 49.49
2022-01-26 14:17:15.660 | DEBUG    | __main__:trials:24 - Trial = 10433/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.661 | DEBUG    | __main__:trials:29 - Trial = 10433/30000 | Total reward = 53.08
2022-01-26 14:17:15.665 | DEBUG    | __main__:trials:24 - Trial = 10434/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.666 | DEBUG    | __main__:trials:29 - Trial = 10434/30000 | Total reward = 38.53
2022-01-26 14:17:15.670 | DEBUG    | __main__:trials:24 - Trial = 10435/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.671 | DEBUG    | __main__:trials:29 - Trial = 10435/30000 | Total reward = 45.50
2022-01-26 14:17:15.675 | DEBUG    | __main__:trials:24 - Trial = 10436/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.676 | DEBUG    | __main__:trials:29 - Trial = 10436/30000 | Total reward = 39.16
2022-01-26 14:17:15.680 | DEBUG    | __main__:trials:24 - Trial = 10437/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.682 | DEBUG    | __main__:trials:29 - Trial = 10437/30000 | Total reward = 39.78
2022-01-26 14:17:15.686 | DEBUG    | __main__:trials:24 - Trial = 10438/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.687 | DEBUG    | __main__:trials:29 - Trial = 10438/30000 | Total reward = 45.92
2022-01-26 14:17:15.691 | DEBUG    | __main__:trials:24 - Trial = 10439/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.693 | DEBUG    | __main__:trials:29 - Trial = 10439/30000 | Total reward = 41.01
2022-01-26 14:17:15.696 | DEBUG    | __main__:trials:24 - Trial = 10440/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.697 | DEBUG    | __main__:trials:29 - Trial = 10440/30000 | Total reward = 43.32
2022-01-26 14:17:15.701 | DEBUG    | __main__:trials:24 - Trial = 10441/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.703 | DEBUG    | __main__:trials:29 - Trial = 10441/30000 | Total reward = 37.02
2022-01-26 14:17:15.706 | DEBUG    | __main__:trials:24 - Trial = 10442/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.707 | DEBUG    | __main__:trials:29 - Trial = 10442/30000 | Total reward = 36.91
2022-01-26 14:17:15.711 | DEBUG    | __main__:trials:24 - Trial = 10443/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.712 | DEBUG    | __main__:trials:29 - Trial = 10443/30000 | Total reward = 54.62
2022-01-26 14:17:15.715 | DEBUG    | __main__:trials:24 - Trial = 10444/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.716 | DEBUG    | __main__:trials:29 - Trial = 10444/30000 | Total reward = 36.41
2022-01-26 14:17:15.720 | DEBUG    | __main__:trials:24 - Trial = 10445/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.722 | DEBUG    | __main__:trials:29 - Trial = 10445/30000 | Total reward = 50.32
2022-01-26 14:17:15.726 | DEBUG    | __main__:trials:24 - Trial = 10446/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.727 | DEBUG    | __main__:trials:29 - Trial = 10446/30000 | Total reward = 50.35
2022-01-26 14:17:15.731 | DEBUG    | __main__:trials:24 - Trial = 10447/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.732 | DEBUG    | __main__:trials:29 - Trial = 10447/30000 | Total reward = 42.84
2022-01-26 14:17:15.736 | DEBUG    | __main__:trials:24 - Trial = 10448/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.738 | DEBUG    | __main__:trials:29 - Trial = 10448/30000 | Total reward = 49.32
2022-01-26 14:17:15.741 | DEBUG    | __main__:trials:24 - Trial = 10449/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.742 | DEBUG    | __main__:trials:29 - Trial = 10449/30000 | Total reward = 39.54
2022-01-26 14:17:15.747 | DEBUG    | __main__:trials:24 - Trial = 10450/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.747 | DEBUG    | __main__:trials:29 - Trial = 10450/30000 | Total reward = 39.76
2022-01-26 14:17:15.752 | DEBUG    | __main__:trials:24 - Trial = 10451/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.752 | DEBUG    | __main__:trials:29 - Trial = 10451/30000 | Total reward = 59.16
2022-01-26 14:17:15.757 | DEBUG    | __main__:trials:24 - Trial = 10452/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.758 | DEBUG    | __main__:trials:29 - Trial = 10452/30000 | Total reward = 41.49
2022-01-26 14:17:15.762 | DEBUG    | __main__:trials:24 - Trial = 10453/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.762 | DEBUG    | __main__:trials:29 - Trial = 10453/30000 | Total reward = 33.70
2022-01-26 14:17:15.767 | DEBUG    | __main__:trials:24 - Trial = 10454/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.769 | DEBUG    | __main__:trials:29 - Trial = 10454/30000 | Total reward = 42.07
2022-01-26 14:17:15.772 | DEBUG    | __main__:trials:24 - Trial = 10455/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.773 | DEBUG    | __main__:trials:29 - Trial = 10455/30000 | Total reward = 61.01
2022-01-26 14:17:15.777 | DEBUG    | __main__:trials:24 - Trial = 10456/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.779 | DEBUG    | __main__:trials:29 - Trial = 10456/30000 | Total reward = 47.19
2022-01-26 14:17:15.782 | DEBUG    | __main__:trials:24 - Trial = 10457/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.783 | DEBUG    | __main__:trials:29 - Trial = 10457/30000 | Total reward = 36.44
2022-01-26 14:17:15.787 | DEBUG    | __main__:trials:24 - Trial = 10458/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.789 | DEBUG    | __main__:trials:29 - Trial = 10458/30000 | Total reward = 31.06
2022-01-26 14:17:15.795 | DEBUG    | __main__:trials:24 - Trial = 10459/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.795 | DEBUG    | __main__:trials:29 - Trial = 10459/30000 | Total reward = 49.76
2022-01-26 14:17:15.799 | DEBUG    | __main__:trials:24 - Trial = 10460/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.801 | DEBUG    | __main__:trials:29 - Trial = 10460/30000 | Total reward = 58.70
2022-01-26 14:17:15.804 | DEBUG    | __main__:trials:24 - Trial = 10461/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.805 | DEBUG    | __main__:trials:29 - Trial = 10461/30000 | Total reward = 50.07
2022-01-26 14:17:15.809 | DEBUG    | __main__:trials:24 - Trial = 10462/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.810 | DEBUG    | __main__:trials:29 - Trial = 10462/30000 | Total reward = 44.70
2022-01-26 14:17:15.814 | DEBUG    | __main__:trials:24 - Trial = 10463/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.816 | DEBUG    | __main__:trials:29 - Trial = 10463/30000 | Total reward = 39.72
2022-01-26 14:17:15.819 | DEBUG    | __main__:trials:24 - Trial = 10464/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.820 | DEBUG    | __main__:trials:29 - Trial = 10464/30000 | Total reward = 18.08
2022-01-26 14:17:15.824 | DEBUG    | __main__:trials:24 - Trial = 10465/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.826 | DEBUG    | __main__:trials:29 - Trial = 10465/30000 | Total reward = 29.18
2022-01-26 14:17:15.830 | DEBUG    | __main__:trials:24 - Trial = 10466/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.831 | DEBUG    | __main__:trials:29 - Trial = 10466/30000 | Total reward = 27.28
2022-01-26 14:17:15.835 | DEBUG    | __main__:trials:24 - Trial = 10467/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.836 | DEBUG    | __main__:trials:29 - Trial = 10467/30000 | Total reward = 33.04
2022-01-26 14:17:15.839 | DEBUG    | __main__:trials:24 - Trial = 10468/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.841 | DEBUG    | __main__:trials:29 - Trial = 10468/30000 | Total reward = 25.49
2022-01-26 14:17:15.844 | DEBUG    | __main__:trials:24 - Trial = 10469/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.846 | DEBUG    | __main__:trials:29 - Trial = 10469/30000 | Total reward = 47.15
2022-01-26 14:17:15.849 | DEBUG    | __main__:trials:24 - Trial = 10470/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.850 | DEBUG    | __main__:trials:29 - Trial = 10470/30000 | Total reward = 30.17
2022-01-26 14:17:15.854 | DEBUG    | __main__:trials:24 - Trial = 10471/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.855 | DEBUG    | __main__:trials:29 - Trial = 10471/30000 | Total reward = 32.91
2022-01-26 14:17:15.859 | DEBUG    | __main__:trials:24 - Trial = 10472/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.861 | DEBUG    | __main__:trials:29 - Trial = 10472/30000 | Total reward = 43.49
2022-01-26 14:17:15.864 | DEBUG    | __main__:trials:24 - Trial = 10473/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.866 | DEBUG    | __main__:trials:29 - Trial = 10473/30000 | Total reward = 53.18
2022-01-26 14:17:15.870 | DEBUG    | __main__:trials:24 - Trial = 10474/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.870 | DEBUG    | __main__:trials:29 - Trial = 10474/30000 | Total reward = 27.08
2022-01-26 14:17:15.875 | DEBUG    | __main__:trials:24 - Trial = 10475/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.876 | DEBUG    | __main__:trials:29 - Trial = 10475/30000 | Total reward = 28.82
2022-01-26 14:17:15.880 | DEBUG    | __main__:trials:24 - Trial = 10476/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.882 | DEBUG    | __main__:trials:29 - Trial = 10476/30000 | Total reward = 29.18
2022-01-26 14:17:15.885 | DEBUG    | __main__:trials:24 - Trial = 10477/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.886 | DEBUG    | __main__:trials:29 - Trial = 10477/30000 | Total reward = 28.78
2022-01-26 14:17:15.890 | DEBUG    | __main__:trials:24 - Trial = 10478/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.891 | DEBUG    | __main__:trials:29 - Trial = 10478/30000 | Total reward = 28.50
2022-01-26 14:17:15.895 | DEBUG    | __main__:trials:24 - Trial = 10479/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.896 | DEBUG    | __main__:trials:29 - Trial = 10479/30000 | Total reward = 29.87
2022-01-26 14:17:15.900 | DEBUG    | __main__:trials:24 - Trial = 10480/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.901 | DEBUG    | __main__:trials:29 - Trial = 10480/30000 | Total reward = 41.91
2022-01-26 14:17:15.905 | DEBUG    | __main__:trials:24 - Trial = 10481/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.907 | DEBUG    | __main__:trials:29 - Trial = 10481/30000 | Total reward = 25.36
2022-01-26 14:17:15.910 | DEBUG    | __main__:trials:24 - Trial = 10482/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.911 | DEBUG    | __main__:trials:29 - Trial = 10482/30000 | Total reward = 29.33
2022-01-26 14:17:15.915 | DEBUG    | __main__:trials:24 - Trial = 10483/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.917 | DEBUG    | __main__:trials:29 - Trial = 10483/30000 | Total reward = 29.87
2022-01-26 14:17:15.919 | DEBUG    | __main__:trials:24 - Trial = 10484/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.921 | DEBUG    | __main__:trials:29 - Trial = 10484/30000 | Total reward = 37.53
2022-01-26 14:17:15.925 | DEBUG    | __main__:trials:24 - Trial = 10485/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.926 | DEBUG    | __main__:trials:29 - Trial = 10485/30000 | Total reward = 47.15
2022-01-26 14:17:15.930 | DEBUG    | __main__:trials:24 - Trial = 10486/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.932 | DEBUG    | __main__:trials:29 - Trial = 10486/30000 | Total reward = 29.32
2022-01-26 14:17:15.935 | DEBUG    | __main__:trials:24 - Trial = 10487/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.937 | DEBUG    | __main__:trials:29 - Trial = 10487/30000 | Total reward = 35.65
2022-01-26 14:17:15.940 | DEBUG    | __main__:trials:24 - Trial = 10488/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.941 | DEBUG    | __main__:trials:29 - Trial = 10488/30000 | Total reward = 43.39
2022-01-26 14:17:15.944 | DEBUG    | __main__:trials:24 - Trial = 10489/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.946 | DEBUG    | __main__:trials:29 - Trial = 10489/30000 | Total reward = 37.76
2022-01-26 14:17:15.950 | DEBUG    | __main__:trials:24 - Trial = 10490/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.951 | DEBUG    | __main__:trials:29 - Trial = 10490/30000 | Total reward = 27.54
2022-01-26 14:17:15.955 | DEBUG    | __main__:trials:24 - Trial = 10491/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.957 | DEBUG    | __main__:trials:29 - Trial = 10491/30000 | Total reward = 31.75
2022-01-26 14:17:15.959 | DEBUG    | __main__:trials:24 - Trial = 10492/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.961 | DEBUG    | __main__:trials:29 - Trial = 10492/30000 | Total reward = 28.85
2022-01-26 14:17:15.964 | DEBUG    | __main__:trials:24 - Trial = 10493/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.966 | DEBUG    | __main__:trials:29 - Trial = 10493/30000 | Total reward = 25.49
2022-01-26 14:17:15.970 | DEBUG    | __main__:trials:24 - Trial = 10494/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.970 | DEBUG    | __main__:trials:29 - Trial = 10494/30000 | Total reward = 41.41
2022-01-26 14:17:15.975 | DEBUG    | __main__:trials:24 - Trial = 10495/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.976 | DEBUG    | __main__:trials:29 - Trial = 10495/30000 | Total reward = 55.82
2022-01-26 14:17:15.980 | DEBUG    | __main__:trials:24 - Trial = 10496/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.981 | DEBUG    | __main__:trials:29 - Trial = 10496/30000 | Total reward = 42.55
2022-01-26 14:17:15.985 | DEBUG    | __main__:trials:24 - Trial = 10497/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.986 | DEBUG    | __main__:trials:29 - Trial = 10497/30000 | Total reward = 27.87
2022-01-26 14:17:15.990 | DEBUG    | __main__:trials:24 - Trial = 10498/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.992 | DEBUG    | __main__:trials:29 - Trial = 10498/30000 | Total reward = 28.22
2022-01-26 14:17:15.995 | DEBUG    | __main__:trials:24 - Trial = 10499/30000 | Max number of steps (20) reached
2022-01-26 14:17:15.996 | DEBUG    | __main__:trials:29 - Trial = 10499/30000 | Total reward = 28.83
2022-01-26 14:17:16.000 | DEBUG    | __main__:trials:24 - Trial = 10500/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.001 | DEBUG    | __main__:trials:29 - Trial = 10500/30000 | Total reward = 26.86
2022-01-26 14:17:16.005 | DEBUG    | __main__:trials:24 - Trial = 10501/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.007 | DEBUG    | __main__:trials:29 - Trial = 10501/30000 | Total reward = 37.11
2022-01-26 14:17:16.010 | DEBUG    | __main__:trials:26 - Trial = 10502/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.011 | DEBUG    | __main__:trials:29 - Trial = 10502/30000 | Total reward = 32.15
2022-01-26 14:17:16.015 | DEBUG    | __main__:trials:24 - Trial = 10503/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.017 | DEBUG    | __main__:trials:29 - Trial = 10503/30000 | Total reward = 42.89
2022-01-26 14:17:16.020 | DEBUG    | __main__:trials:24 - Trial = 10504/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.021 | DEBUG    | __main__:trials:29 - Trial = 10504/30000 | Total reward = 34.36
2022-01-26 14:17:16.024 | DEBUG    | __main__:trials:24 - Trial = 10505/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.026 | DEBUG    | __main__:trials:29 - Trial = 10505/30000 | Total reward = 41.21
2022-01-26 14:17:16.030 | DEBUG    | __main__:trials:24 - Trial = 10506/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.030 | DEBUG    | __main__:trials:29 - Trial = 10506/30000 | Total reward = 38.83
2022-01-26 14:17:16.034 | DEBUG    | __main__:trials:24 - Trial = 10507/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.035 | DEBUG    | __main__:trials:29 - Trial = 10507/30000 | Total reward = 33.93
2022-01-26 14:17:16.038 | DEBUG    | __main__:trials:24 - Trial = 10508/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.040 | DEBUG    | __main__:trials:29 - Trial = 10508/30000 | Total reward = 53.93
2022-01-26 14:17:16.044 | DEBUG    | __main__:trials:24 - Trial = 10509/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.045 | DEBUG    | __main__:trials:29 - Trial = 10509/30000 | Total reward = 35.36
2022-01-26 14:17:16.049 | DEBUG    | __main__:trials:24 - Trial = 10510/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.050 | DEBUG    | __main__:trials:29 - Trial = 10510/30000 | Total reward = 53.39
2022-01-26 14:17:16.053 | DEBUG    | __main__:trials:24 - Trial = 10511/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.054 | DEBUG    | __main__:trials:29 - Trial = 10511/30000 | Total reward = 31.03
2022-01-26 14:17:16.057 | DEBUG    | __main__:trials:24 - Trial = 10512/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.059 | DEBUG    | __main__:trials:29 - Trial = 10512/30000 | Total reward = 29.33
2022-01-26 14:17:16.062 | DEBUG    | __main__:trials:24 - Trial = 10513/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.063 | DEBUG    | __main__:trials:29 - Trial = 10513/30000 | Total reward = 35.16
2022-01-26 14:17:16.067 | DEBUG    | __main__:trials:24 - Trial = 10514/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.067 | DEBUG    | __main__:trials:29 - Trial = 10514/30000 | Total reward = 56.93
2022-01-26 14:17:16.071 | DEBUG    | __main__:trials:24 - Trial = 10515/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.071 | DEBUG    | __main__:trials:29 - Trial = 10515/30000 | Total reward = 35.82
2022-01-26 14:17:16.075 | DEBUG    | __main__:trials:24 - Trial = 10516/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.076 | DEBUG    | __main__:trials:29 - Trial = 10516/30000 | Total reward = 34.17
2022-01-26 14:17:16.080 | DEBUG    | __main__:trials:24 - Trial = 10517/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.082 | DEBUG    | __main__:trials:29 - Trial = 10517/30000 | Total reward = 29.33
2022-01-26 14:17:16.085 | DEBUG    | __main__:trials:24 - Trial = 10518/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.087 | DEBUG    | __main__:trials:29 - Trial = 10518/30000 | Total reward = 28.64
2022-01-26 14:17:16.090 | DEBUG    | __main__:trials:24 - Trial = 10519/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.092 | DEBUG    | __main__:trials:29 - Trial = 10519/30000 | Total reward = 26.20
2022-01-26 14:17:16.096 | DEBUG    | __main__:trials:24 - Trial = 10520/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.096 | DEBUG    | __main__:trials:29 - Trial = 10520/30000 | Total reward = 29.07
2022-01-26 14:17:16.101 | DEBUG    | __main__:trials:24 - Trial = 10521/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.101 | DEBUG    | __main__:trials:29 - Trial = 10521/30000 | Total reward = 39.44
2022-01-26 14:17:16.105 | DEBUG    | __main__:trials:24 - Trial = 10522/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.106 | DEBUG    | __main__:trials:29 - Trial = 10522/30000 | Total reward = 12.99
2022-01-26 14:17:16.110 | DEBUG    | __main__:trials:24 - Trial = 10523/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.111 | DEBUG    | __main__:trials:29 - Trial = 10523/30000 | Total reward = 29.62
2022-01-26 14:17:16.115 | DEBUG    | __main__:trials:24 - Trial = 10524/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.116 | DEBUG    | __main__:trials:29 - Trial = 10524/30000 | Total reward = 44.59
2022-01-26 14:17:16.120 | DEBUG    | __main__:trials:24 - Trial = 10525/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.121 | DEBUG    | __main__:trials:29 - Trial = 10525/30000 | Total reward = 29.60
2022-01-26 14:17:16.127 | DEBUG    | __main__:trials:24 - Trial = 10526/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.128 | DEBUG    | __main__:trials:29 - Trial = 10526/30000 | Total reward = 38.84
2022-01-26 14:17:16.132 | DEBUG    | __main__:trials:24 - Trial = 10527/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.134 | DEBUG    | __main__:trials:29 - Trial = 10527/30000 | Total reward = 28.48
2022-01-26 14:17:16.138 | DEBUG    | __main__:trials:24 - Trial = 10528/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.139 | DEBUG    | __main__:trials:29 - Trial = 10528/30000 | Total reward = 59.53
2022-01-26 14:17:16.142 | DEBUG    | __main__:trials:24 - Trial = 10529/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.144 | DEBUG    | __main__:trials:29 - Trial = 10529/30000 | Total reward = 27.21
2022-01-26 14:17:16.147 | DEBUG    | __main__:trials:24 - Trial = 10530/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.148 | DEBUG    | __main__:trials:29 - Trial = 10530/30000 | Total reward = 54.07
2022-01-26 14:17:16.152 | DEBUG    | __main__:trials:24 - Trial = 10531/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.154 | DEBUG    | __main__:trials:29 - Trial = 10531/30000 | Total reward = 39.32
2022-01-26 14:17:16.157 | DEBUG    | __main__:trials:24 - Trial = 10532/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.159 | DEBUG    | __main__:trials:29 - Trial = 10532/30000 | Total reward = 35.68
2022-01-26 14:17:16.163 | DEBUG    | __main__:trials:24 - Trial = 10533/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.164 | DEBUG    | __main__:trials:29 - Trial = 10533/30000 | Total reward = 28.46
2022-01-26 14:17:16.168 | DEBUG    | __main__:trials:24 - Trial = 10534/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.169 | DEBUG    | __main__:trials:29 - Trial = 10534/30000 | Total reward = 31.69
2022-01-26 14:17:16.173 | DEBUG    | __main__:trials:24 - Trial = 10535/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.175 | DEBUG    | __main__:trials:29 - Trial = 10535/30000 | Total reward = 33.61
2022-01-26 14:17:16.177 | DEBUG    | __main__:trials:26 - Trial = 10536/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.179 | DEBUG    | __main__:trials:29 - Trial = 10536/30000 | Total reward = 7.43
2022-01-26 14:17:16.182 | DEBUG    | __main__:trials:24 - Trial = 10537/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.183 | DEBUG    | __main__:trials:29 - Trial = 10537/30000 | Total reward = 42.03
2022-01-26 14:17:16.187 | DEBUG    | __main__:trials:24 - Trial = 10538/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.189 | DEBUG    | __main__:trials:29 - Trial = 10538/30000 | Total reward = 41.40
2022-01-26 14:17:16.192 | DEBUG    | __main__:trials:24 - Trial = 10539/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.194 | DEBUG    | __main__:trials:29 - Trial = 10539/30000 | Total reward = 57.91
2022-01-26 14:17:16.197 | DEBUG    | __main__:trials:24 - Trial = 10540/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.197 | DEBUG    | __main__:trials:29 - Trial = 10540/30000 | Total reward = 29.77
2022-01-26 14:17:16.202 | DEBUG    | __main__:trials:24 - Trial = 10541/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.203 | DEBUG    | __main__:trials:29 - Trial = 10541/30000 | Total reward = 58.05
2022-01-26 14:17:16.207 | DEBUG    | __main__:trials:24 - Trial = 10542/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.208 | DEBUG    | __main__:trials:29 - Trial = 10542/30000 | Total reward = 29.18
2022-01-26 14:17:16.212 | DEBUG    | __main__:trials:24 - Trial = 10543/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.213 | DEBUG    | __main__:trials:29 - Trial = 10543/30000 | Total reward = 32.37
2022-01-26 14:17:16.216 | DEBUG    | __main__:trials:24 - Trial = 10544/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.217 | DEBUG    | __main__:trials:29 - Trial = 10544/30000 | Total reward = 53.62
2022-01-26 14:17:16.221 | DEBUG    | __main__:trials:24 - Trial = 10545/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.222 | DEBUG    | __main__:trials:29 - Trial = 10545/30000 | Total reward = 28.97
2022-01-26 14:17:16.225 | DEBUG    | __main__:trials:24 - Trial = 10546/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.226 | DEBUG    | __main__:trials:29 - Trial = 10546/30000 | Total reward = 29.02
2022-01-26 14:17:16.230 | DEBUG    | __main__:trials:24 - Trial = 10547/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.231 | DEBUG    | __main__:trials:29 - Trial = 10547/30000 | Total reward = 28.97
2022-01-26 14:17:16.235 | DEBUG    | __main__:trials:24 - Trial = 10548/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.235 | DEBUG    | __main__:trials:29 - Trial = 10548/30000 | Total reward = 29.33
2022-01-26 14:17:16.240 | DEBUG    | __main__:trials:24 - Trial = 10549/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.240 | DEBUG    | __main__:trials:29 - Trial = 10549/30000 | Total reward = 27.69
2022-01-26 14:17:16.243 | DEBUG    | __main__:trials:26 - Trial = 10550/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.244 | DEBUG    | __main__:trials:29 - Trial = 10550/30000 | Total reward = 8.43
2022-01-26 14:17:16.248 | DEBUG    | __main__:trials:24 - Trial = 10551/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.249 | DEBUG    | __main__:trials:29 - Trial = 10551/30000 | Total reward = 30.43
2022-01-26 14:17:16.253 | DEBUG    | __main__:trials:24 - Trial = 10552/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.254 | DEBUG    | __main__:trials:29 - Trial = 10552/30000 | Total reward = 42.96
2022-01-26 14:17:16.258 | DEBUG    | __main__:trials:24 - Trial = 10553/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.259 | DEBUG    | __main__:trials:29 - Trial = 10553/30000 | Total reward = 19.85
2022-01-26 14:17:16.263 | DEBUG    | __main__:trials:24 - Trial = 10554/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.265 | DEBUG    | __main__:trials:29 - Trial = 10554/30000 | Total reward = 36.49
2022-01-26 14:17:16.268 | DEBUG    | __main__:trials:26 - Trial = 10555/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.269 | DEBUG    | __main__:trials:29 - Trial = 10555/30000 | Total reward = 20.23
2022-01-26 14:17:16.273 | DEBUG    | __main__:trials:24 - Trial = 10556/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.275 | DEBUG    | __main__:trials:29 - Trial = 10556/30000 | Total reward = 29.18
2022-01-26 14:17:16.278 | DEBUG    | __main__:trials:24 - Trial = 10557/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.279 | DEBUG    | __main__:trials:29 - Trial = 10557/30000 | Total reward = 41.62
2022-01-26 14:17:16.283 | DEBUG    | __main__:trials:24 - Trial = 10558/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.284 | DEBUG    | __main__:trials:29 - Trial = 10558/30000 | Total reward = 29.29
2022-01-26 14:17:16.288 | DEBUG    | __main__:trials:24 - Trial = 10559/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.289 | DEBUG    | __main__:trials:29 - Trial = 10559/30000 | Total reward = 29.16
2022-01-26 14:17:16.293 | DEBUG    | __main__:trials:24 - Trial = 10560/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.295 | DEBUG    | __main__:trials:29 - Trial = 10560/30000 | Total reward = 15.61
2022-01-26 14:17:16.298 | DEBUG    | __main__:trials:26 - Trial = 10561/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.299 | DEBUG    | __main__:trials:29 - Trial = 10561/30000 | Total reward = 18.84
2022-01-26 14:17:16.303 | DEBUG    | __main__:trials:24 - Trial = 10562/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.304 | DEBUG    | __main__:trials:29 - Trial = 10562/30000 | Total reward = 19.03
2022-01-26 14:17:16.306 | DEBUG    | __main__:trials:26 - Trial = 10563/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.309 | DEBUG    | __main__:trials:29 - Trial = 10563/30000 | Total reward = 7.44
2022-01-26 14:17:16.312 | DEBUG    | __main__:trials:24 - Trial = 10564/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.314 | DEBUG    | __main__:trials:29 - Trial = 10564/30000 | Total reward = 49.22
2022-01-26 14:17:16.318 | DEBUG    | __main__:trials:24 - Trial = 10565/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.319 | DEBUG    | __main__:trials:29 - Trial = 10565/30000 | Total reward = 28.84
2022-01-26 14:17:16.323 | DEBUG    | __main__:trials:24 - Trial = 10566/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.324 | DEBUG    | __main__:trials:29 - Trial = 10566/30000 | Total reward = 45.37
2022-01-26 14:17:16.328 | DEBUG    | __main__:trials:24 - Trial = 10567/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.329 | DEBUG    | __main__:trials:29 - Trial = 10567/30000 | Total reward = 38.60
2022-01-26 14:17:16.333 | DEBUG    | __main__:trials:24 - Trial = 10568/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.335 | DEBUG    | __main__:trials:29 - Trial = 10568/30000 | Total reward = 28.84
2022-01-26 14:17:16.338 | DEBUG    | __main__:trials:24 - Trial = 10569/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.340 | DEBUG    | __main__:trials:29 - Trial = 10569/30000 | Total reward = 29.01
2022-01-26 14:17:16.343 | DEBUG    | __main__:trials:26 - Trial = 10570/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.344 | DEBUG    | __main__:trials:29 - Trial = 10570/30000 | Total reward = 11.51
2022-01-26 14:17:16.348 | DEBUG    | __main__:trials:24 - Trial = 10571/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.349 | DEBUG    | __main__:trials:29 - Trial = 10571/30000 | Total reward = 40.39
2022-01-26 14:17:16.353 | DEBUG    | __main__:trials:24 - Trial = 10572/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.354 | DEBUG    | __main__:trials:29 - Trial = 10572/30000 | Total reward = 26.20
2022-01-26 14:17:16.358 | DEBUG    | __main__:trials:24 - Trial = 10573/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.359 | DEBUG    | __main__:trials:29 - Trial = 10573/30000 | Total reward = 52.15
2022-01-26 14:17:16.363 | DEBUG    | __main__:trials:24 - Trial = 10574/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.364 | DEBUG    | __main__:trials:29 - Trial = 10574/30000 | Total reward = 29.18
2022-01-26 14:17:16.368 | DEBUG    | __main__:trials:24 - Trial = 10575/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.370 | DEBUG    | __main__:trials:29 - Trial = 10575/30000 | Total reward = 37.56
2022-01-26 14:17:16.373 | DEBUG    | __main__:trials:24 - Trial = 10576/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.375 | DEBUG    | __main__:trials:29 - Trial = 10576/30000 | Total reward = 37.06
2022-01-26 14:17:16.378 | DEBUG    | __main__:trials:26 - Trial = 10577/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.379 | DEBUG    | __main__:trials:29 - Trial = 10577/30000 | Total reward = 12.51
2022-01-26 14:17:16.383 | DEBUG    | __main__:trials:24 - Trial = 10578/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.384 | DEBUG    | __main__:trials:29 - Trial = 10578/30000 | Total reward = 32.88
2022-01-26 14:17:16.388 | DEBUG    | __main__:trials:24 - Trial = 10579/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.389 | DEBUG    | __main__:trials:29 - Trial = 10579/30000 | Total reward = 26.98
2022-01-26 14:17:16.393 | DEBUG    | __main__:trials:24 - Trial = 10580/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.395 | DEBUG    | __main__:trials:29 - Trial = 10580/30000 | Total reward = 28.12
2022-01-26 14:17:16.398 | DEBUG    | __main__:trials:24 - Trial = 10581/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.400 | DEBUG    | __main__:trials:29 - Trial = 10581/30000 | Total reward = 35.04
2022-01-26 14:17:16.403 | DEBUG    | __main__:trials:24 - Trial = 10582/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.405 | DEBUG    | __main__:trials:29 - Trial = 10582/30000 | Total reward = 42.57
2022-01-26 14:17:16.408 | DEBUG    | __main__:trials:24 - Trial = 10583/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.410 | DEBUG    | __main__:trials:29 - Trial = 10583/30000 | Total reward = 33.64
2022-01-26 14:17:16.414 | DEBUG    | __main__:trials:24 - Trial = 10584/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.414 | DEBUG    | __main__:trials:29 - Trial = 10584/30000 | Total reward = 29.90
2022-01-26 14:17:16.419 | DEBUG    | __main__:trials:24 - Trial = 10585/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.420 | DEBUG    | __main__:trials:29 - Trial = 10585/30000 | Total reward = 29.19
2022-01-26 14:17:16.423 | DEBUG    | __main__:trials:24 - Trial = 10586/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.425 | DEBUG    | __main__:trials:29 - Trial = 10586/30000 | Total reward = 37.26
2022-01-26 14:17:16.428 | DEBUG    | __main__:trials:24 - Trial = 10587/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.430 | DEBUG    | __main__:trials:29 - Trial = 10587/30000 | Total reward = 59.45
2022-01-26 14:17:16.433 | DEBUG    | __main__:trials:24 - Trial = 10588/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.434 | DEBUG    | __main__:trials:29 - Trial = 10588/30000 | Total reward = 30.84
2022-01-26 14:17:16.437 | DEBUG    | __main__:trials:24 - Trial = 10589/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.438 | DEBUG    | __main__:trials:29 - Trial = 10589/30000 | Total reward = 24.83
2022-01-26 14:17:16.442 | DEBUG    | __main__:trials:24 - Trial = 10590/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.442 | DEBUG    | __main__:trials:29 - Trial = 10590/30000 | Total reward = 25.21
2022-01-26 14:17:16.446 | DEBUG    | __main__:trials:24 - Trial = 10591/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.448 | DEBUG    | __main__:trials:29 - Trial = 10591/30000 | Total reward = 47.32
2022-01-26 14:17:16.452 | DEBUG    | __main__:trials:24 - Trial = 10592/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.452 | DEBUG    | __main__:trials:29 - Trial = 10592/30000 | Total reward = 29.75
2022-01-26 14:17:16.456 | DEBUG    | __main__:trials:26 - Trial = 10593/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.457 | DEBUG    | __main__:trials:29 - Trial = 10593/30000 | Total reward = 15.94
2022-01-26 14:17:16.460 | DEBUG    | __main__:trials:24 - Trial = 10594/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.462 | DEBUG    | __main__:trials:29 - Trial = 10594/30000 | Total reward = 27.91
2022-01-26 14:17:16.466 | DEBUG    | __main__:trials:24 - Trial = 10595/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.467 | DEBUG    | __main__:trials:29 - Trial = 10595/30000 | Total reward = 28.82
2022-01-26 14:17:16.471 | DEBUG    | __main__:trials:24 - Trial = 10596/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.472 | DEBUG    | __main__:trials:29 - Trial = 10596/30000 | Total reward = 35.17
2022-01-26 14:17:16.476 | DEBUG    | __main__:trials:24 - Trial = 10597/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.477 | DEBUG    | __main__:trials:29 - Trial = 10597/30000 | Total reward = 38.37
2022-01-26 14:17:16.481 | DEBUG    | __main__:trials:24 - Trial = 10598/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.482 | DEBUG    | __main__:trials:29 - Trial = 10598/30000 | Total reward = 56.50
2022-01-26 14:17:16.486 | DEBUG    | __main__:trials:24 - Trial = 10599/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.488 | DEBUG    | __main__:trials:29 - Trial = 10599/30000 | Total reward = 32.24
2022-01-26 14:17:16.491 | DEBUG    | __main__:trials:24 - Trial = 10600/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.492 | DEBUG    | __main__:trials:29 - Trial = 10600/30000 | Total reward = 44.08
2022-01-26 14:17:16.496 | DEBUG    | __main__:trials:24 - Trial = 10601/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.498 | DEBUG    | __main__:trials:29 - Trial = 10601/30000 | Total reward = 29.18
2022-01-26 14:17:16.501 | DEBUG    | __main__:trials:24 - Trial = 10602/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.502 | DEBUG    | __main__:trials:29 - Trial = 10602/30000 | Total reward = 28.92
2022-01-26 14:17:16.506 | DEBUG    | __main__:trials:24 - Trial = 10603/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.508 | DEBUG    | __main__:trials:29 - Trial = 10603/30000 | Total reward = 32.80
2022-01-26 14:17:16.511 | DEBUG    | __main__:trials:24 - Trial = 10604/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.513 | DEBUG    | __main__:trials:29 - Trial = 10604/30000 | Total reward = 29.35
2022-01-26 14:17:16.516 | DEBUG    | __main__:trials:24 - Trial = 10605/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.518 | DEBUG    | __main__:trials:29 - Trial = 10605/30000 | Total reward = 33.54
2022-01-26 14:17:16.522 | DEBUG    | __main__:trials:24 - Trial = 10606/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.523 | DEBUG    | __main__:trials:29 - Trial = 10606/30000 | Total reward = 28.43
2022-01-26 14:17:16.527 | DEBUG    | __main__:trials:24 - Trial = 10607/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.528 | DEBUG    | __main__:trials:29 - Trial = 10607/30000 | Total reward = 29.14
2022-01-26 14:17:16.532 | DEBUG    | __main__:trials:24 - Trial = 10608/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.534 | DEBUG    | __main__:trials:29 - Trial = 10608/30000 | Total reward = 11.89
2022-01-26 14:17:16.537 | DEBUG    | __main__:trials:24 - Trial = 10609/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.539 | DEBUG    | __main__:trials:29 - Trial = 10609/30000 | Total reward = 34.79
2022-01-26 14:17:16.543 | DEBUG    | __main__:trials:24 - Trial = 10610/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.543 | DEBUG    | __main__:trials:29 - Trial = 10610/30000 | Total reward = 33.14
2022-01-26 14:17:16.547 | DEBUG    | __main__:trials:24 - Trial = 10611/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.549 | DEBUG    | __main__:trials:29 - Trial = 10611/30000 | Total reward = 29.28
2022-01-26 14:17:16.553 | DEBUG    | __main__:trials:24 - Trial = 10612/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.553 | DEBUG    | __main__:trials:29 - Trial = 10612/30000 | Total reward = 31.64
2022-01-26 14:17:16.557 | DEBUG    | __main__:trials:24 - Trial = 10613/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.559 | DEBUG    | __main__:trials:29 - Trial = 10613/30000 | Total reward = 33.53
2022-01-26 14:17:16.562 | DEBUG    | __main__:trials:26 - Trial = 10614/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.564 | DEBUG    | __main__:trials:29 - Trial = 10614/30000 | Total reward = 18.76
2022-01-26 14:17:16.567 | DEBUG    | __main__:trials:24 - Trial = 10615/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.569 | DEBUG    | __main__:trials:29 - Trial = 10615/30000 | Total reward = 27.97
2022-01-26 14:17:16.571 | DEBUG    | __main__:trials:26 - Trial = 10616/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.573 | DEBUG    | __main__:trials:29 - Trial = 10616/30000 | Total reward = 7.27
2022-01-26 14:17:16.577 | DEBUG    | __main__:trials:24 - Trial = 10617/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.577 | DEBUG    | __main__:trials:29 - Trial = 10617/30000 | Total reward = 36.84
2022-01-26 14:17:16.581 | DEBUG    | __main__:trials:24 - Trial = 10618/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.582 | DEBUG    | __main__:trials:29 - Trial = 10618/30000 | Total reward = 36.75
2022-01-26 14:17:16.585 | DEBUG    | __main__:trials:24 - Trial = 10619/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.586 | DEBUG    | __main__:trials:29 - Trial = 10619/30000 | Total reward = 35.89
2022-01-26 14:17:16.589 | DEBUG    | __main__:trials:24 - Trial = 10620/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.591 | DEBUG    | __main__:trials:29 - Trial = 10620/30000 | Total reward = 42.65
2022-01-26 14:17:16.594 | DEBUG    | __main__:trials:24 - Trial = 10621/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.595 | DEBUG    | __main__:trials:29 - Trial = 10621/30000 | Total reward = 30.87
2022-01-26 14:17:16.598 | DEBUG    | __main__:trials:24 - Trial = 10622/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.599 | DEBUG    | __main__:trials:29 - Trial = 10622/30000 | Total reward = 29.49
2022-01-26 14:17:16.603 | DEBUG    | __main__:trials:24 - Trial = 10623/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.604 | DEBUG    | __main__:trials:29 - Trial = 10623/30000 | Total reward = 42.50
2022-01-26 14:17:16.608 | DEBUG    | __main__:trials:24 - Trial = 10624/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.610 | DEBUG    | __main__:trials:29 - Trial = 10624/30000 | Total reward = 24.37
2022-01-26 14:17:16.612 | DEBUG    | __main__:trials:26 - Trial = 10625/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.614 | DEBUG    | __main__:trials:29 - Trial = 10625/30000 | Total reward = 8.86
2022-01-26 14:17:16.616 | DEBUG    | __main__:trials:26 - Trial = 10626/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.618 | DEBUG    | __main__:trials:29 - Trial = 10626/30000 | Total reward = 7.44
2022-01-26 14:17:16.622 | DEBUG    | __main__:trials:24 - Trial = 10627/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.623 | DEBUG    | __main__:trials:29 - Trial = 10627/30000 | Total reward = 34.90
2022-01-26 14:17:16.627 | DEBUG    | __main__:trials:24 - Trial = 10628/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.628 | DEBUG    | __main__:trials:29 - Trial = 10628/30000 | Total reward = 35.18
2022-01-26 14:17:16.631 | DEBUG    | __main__:trials:24 - Trial = 10629/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.633 | DEBUG    | __main__:trials:29 - Trial = 10629/30000 | Total reward = 35.99
2022-01-26 14:17:16.637 | DEBUG    | __main__:trials:24 - Trial = 10630/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.638 | DEBUG    | __main__:trials:29 - Trial = 10630/30000 | Total reward = 30.39
2022-01-26 14:17:16.641 | DEBUG    | __main__:trials:26 - Trial = 10631/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.643 | DEBUG    | __main__:trials:29 - Trial = 10631/30000 | Total reward = 11.51
2022-01-26 14:17:16.646 | DEBUG    | __main__:trials:24 - Trial = 10632/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.649 | DEBUG    | __main__:trials:29 - Trial = 10632/30000 | Total reward = 29.91
2022-01-26 14:17:16.652 | DEBUG    | __main__:trials:24 - Trial = 10633/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.654 | DEBUG    | __main__:trials:29 - Trial = 10633/30000 | Total reward = 29.35
2022-01-26 14:17:16.657 | DEBUG    | __main__:trials:24 - Trial = 10634/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.659 | DEBUG    | __main__:trials:29 - Trial = 10634/30000 | Total reward = 36.11
2022-01-26 14:17:16.662 | DEBUG    | __main__:trials:24 - Trial = 10635/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.663 | DEBUG    | __main__:trials:29 - Trial = 10635/30000 | Total reward = 33.36
2022-01-26 14:17:16.666 | DEBUG    | __main__:trials:24 - Trial = 10636/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.668 | DEBUG    | __main__:trials:29 - Trial = 10636/30000 | Total reward = 29.35
2022-01-26 14:17:16.672 | DEBUG    | __main__:trials:24 - Trial = 10637/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.673 | DEBUG    | __main__:trials:29 - Trial = 10637/30000 | Total reward = 29.53
2022-01-26 14:17:16.676 | DEBUG    | __main__:trials:24 - Trial = 10638/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.678 | DEBUG    | __main__:trials:29 - Trial = 10638/30000 | Total reward = 50.84
2022-01-26 14:17:16.681 | DEBUG    | __main__:trials:24 - Trial = 10639/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.682 | DEBUG    | __main__:trials:29 - Trial = 10639/30000 | Total reward = 33.47
2022-01-26 14:17:16.686 | DEBUG    | __main__:trials:24 - Trial = 10640/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.687 | DEBUG    | __main__:trials:29 - Trial = 10640/30000 | Total reward = 29.36
2022-01-26 14:17:16.691 | DEBUG    | __main__:trials:24 - Trial = 10641/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.693 | DEBUG    | __main__:trials:29 - Trial = 10641/30000 | Total reward = 36.47
2022-01-26 14:17:16.696 | DEBUG    | __main__:trials:24 - Trial = 10642/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.697 | DEBUG    | __main__:trials:29 - Trial = 10642/30000 | Total reward = 44.11
2022-01-26 14:17:16.701 | DEBUG    | __main__:trials:24 - Trial = 10643/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.702 | DEBUG    | __main__:trials:29 - Trial = 10643/30000 | Total reward = 27.27
2022-01-26 14:17:16.706 | DEBUG    | __main__:trials:24 - Trial = 10644/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.707 | DEBUG    | __main__:trials:29 - Trial = 10644/30000 | Total reward = 30.21
2022-01-26 14:17:16.710 | DEBUG    | __main__:trials:24 - Trial = 10645/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.712 | DEBUG    | __main__:trials:29 - Trial = 10645/30000 | Total reward = 33.47
2022-01-26 14:17:16.716 | DEBUG    | __main__:trials:24 - Trial = 10646/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.717 | DEBUG    | __main__:trials:29 - Trial = 10646/30000 | Total reward = 43.29
2022-01-26 14:17:16.720 | DEBUG    | __main__:trials:24 - Trial = 10647/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.722 | DEBUG    | __main__:trials:29 - Trial = 10647/30000 | Total reward = 44.84
2022-01-26 14:17:16.725 | DEBUG    | __main__:trials:24 - Trial = 10648/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.727 | DEBUG    | __main__:trials:29 - Trial = 10648/30000 | Total reward = 40.78
2022-01-26 14:17:16.730 | DEBUG    | __main__:trials:24 - Trial = 10649/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.731 | DEBUG    | __main__:trials:29 - Trial = 10649/30000 | Total reward = 35.01
2022-01-26 14:17:16.735 | DEBUG    | __main__:trials:24 - Trial = 10650/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.737 | DEBUG    | __main__:trials:29 - Trial = 10650/30000 | Total reward = 30.01
2022-01-26 14:17:16.739 | DEBUG    | __main__:trials:24 - Trial = 10651/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.741 | DEBUG    | __main__:trials:29 - Trial = 10651/30000 | Total reward = 30.24
2022-01-26 14:17:16.745 | DEBUG    | __main__:trials:24 - Trial = 10652/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.746 | DEBUG    | __main__:trials:29 - Trial = 10652/30000 | Total reward = 17.20
2022-01-26 14:17:16.750 | DEBUG    | __main__:trials:24 - Trial = 10653/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.752 | DEBUG    | __main__:trials:29 - Trial = 10653/30000 | Total reward = 28.36
2022-01-26 14:17:16.755 | DEBUG    | __main__:trials:24 - Trial = 10654/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.757 | DEBUG    | __main__:trials:29 - Trial = 10654/30000 | Total reward = 31.95
2022-01-26 14:17:16.761 | DEBUG    | __main__:trials:24 - Trial = 10655/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.761 | DEBUG    | __main__:trials:29 - Trial = 10655/30000 | Total reward = 42.92
2022-01-26 14:17:16.764 | DEBUG    | __main__:trials:24 - Trial = 10656/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.766 | DEBUG    | __main__:trials:29 - Trial = 10656/30000 | Total reward = 47.70
2022-01-26 14:17:16.768 | DEBUG    | __main__:trials:26 - Trial = 10657/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.769 | DEBUG    | __main__:trials:29 - Trial = 10657/30000 | Total reward = 12.47
2022-01-26 14:17:16.772 | DEBUG    | __main__:trials:24 - Trial = 10658/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.774 | DEBUG    | __main__:trials:29 - Trial = 10658/30000 | Total reward = 30.12
2022-01-26 14:17:16.777 | DEBUG    | __main__:trials:24 - Trial = 10659/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.778 | DEBUG    | __main__:trials:29 - Trial = 10659/30000 | Total reward = 27.36
2022-01-26 14:17:16.781 | DEBUG    | __main__:trials:24 - Trial = 10660/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.783 | DEBUG    | __main__:trials:29 - Trial = 10660/30000 | Total reward = 31.66
2022-01-26 14:17:16.786 | DEBUG    | __main__:trials:24 - Trial = 10661/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.788 | DEBUG    | __main__:trials:29 - Trial = 10661/30000 | Total reward = 31.95
2022-01-26 14:17:16.792 | DEBUG    | __main__:trials:24 - Trial = 10662/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.793 | DEBUG    | __main__:trials:29 - Trial = 10662/30000 | Total reward = 52.46
2022-01-26 14:17:16.797 | DEBUG    | __main__:trials:24 - Trial = 10663/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.798 | DEBUG    | __main__:trials:29 - Trial = 10663/30000 | Total reward = 50.30
2022-01-26 14:17:16.802 | DEBUG    | __main__:trials:24 - Trial = 10664/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.803 | DEBUG    | __main__:trials:29 - Trial = 10664/30000 | Total reward = 36.06
2022-01-26 14:17:16.806 | DEBUG    | __main__:trials:26 - Trial = 10665/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.807 | DEBUG    | __main__:trials:29 - Trial = 10665/30000 | Total reward = 6.25
2022-01-26 14:17:16.811 | DEBUG    | __main__:trials:24 - Trial = 10666/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.812 | DEBUG    | __main__:trials:29 - Trial = 10666/30000 | Total reward = 29.35
2022-01-26 14:17:16.816 | DEBUG    | __main__:trials:24 - Trial = 10667/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.817 | DEBUG    | __main__:trials:29 - Trial = 10667/30000 | Total reward = 51.54
2022-01-26 14:17:16.821 | DEBUG    | __main__:trials:24 - Trial = 10668/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.822 | DEBUG    | __main__:trials:29 - Trial = 10668/30000 | Total reward = 46.73
2022-01-26 14:17:16.826 | DEBUG    | __main__:trials:24 - Trial = 10669/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.827 | DEBUG    | __main__:trials:29 - Trial = 10669/30000 | Total reward = 25.81
2022-01-26 14:17:16.831 | DEBUG    | __main__:trials:24 - Trial = 10670/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.832 | DEBUG    | __main__:trials:29 - Trial = 10670/30000 | Total reward = 26.70
2022-01-26 14:17:16.837 | DEBUG    | __main__:trials:24 - Trial = 10671/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.838 | DEBUG    | __main__:trials:29 - Trial = 10671/30000 | Total reward = 46.01
2022-01-26 14:17:16.841 | DEBUG    | __main__:trials:24 - Trial = 10672/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.842 | DEBUG    | __main__:trials:29 - Trial = 10672/30000 | Total reward = 28.58
2022-01-26 14:17:16.844 | DEBUG    | __main__:trials:26 - Trial = 10673/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.845 | DEBUG    | __main__:trials:29 - Trial = 10673/30000 | Total reward = 7.43
2022-01-26 14:17:16.849 | DEBUG    | __main__:trials:24 - Trial = 10674/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.849 | DEBUG    | __main__:trials:29 - Trial = 10674/30000 | Total reward = 28.89
2022-01-26 14:17:16.854 | DEBUG    | __main__:trials:24 - Trial = 10675/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.855 | DEBUG    | __main__:trials:29 - Trial = 10675/30000 | Total reward = 29.20
2022-01-26 14:17:16.859 | DEBUG    | __main__:trials:24 - Trial = 10676/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.860 | DEBUG    | __main__:trials:29 - Trial = 10676/30000 | Total reward = 33.20
2022-01-26 14:17:16.864 | DEBUG    | __main__:trials:24 - Trial = 10677/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.865 | DEBUG    | __main__:trials:29 - Trial = 10677/30000 | Total reward = 27.42
2022-01-26 14:17:16.868 | DEBUG    | __main__:trials:24 - Trial = 10678/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.870 | DEBUG    | __main__:trials:29 - Trial = 10678/30000 | Total reward = 28.12
2022-01-26 14:17:16.873 | DEBUG    | __main__:trials:24 - Trial = 10679/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.875 | DEBUG    | __main__:trials:29 - Trial = 10679/30000 | Total reward = 45.94
2022-01-26 14:17:16.879 | DEBUG    | __main__:trials:24 - Trial = 10680/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.880 | DEBUG    | __main__:trials:29 - Trial = 10680/30000 | Total reward = 43.47
2022-01-26 14:17:16.883 | DEBUG    | __main__:trials:24 - Trial = 10681/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.885 | DEBUG    | __main__:trials:29 - Trial = 10681/30000 | Total reward = 29.33
2022-01-26 14:17:16.888 | DEBUG    | __main__:trials:24 - Trial = 10682/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.890 | DEBUG    | __main__:trials:29 - Trial = 10682/30000 | Total reward = 46.68
2022-01-26 14:17:16.892 | DEBUG    | __main__:trials:26 - Trial = 10683/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.893 | DEBUG    | __main__:trials:29 - Trial = 10683/30000 | Total reward = 14.32
2022-01-26 14:17:16.896 | DEBUG    | __main__:trials:24 - Trial = 10684/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.897 | DEBUG    | __main__:trials:29 - Trial = 10684/30000 | Total reward = 45.19
2022-01-26 14:17:16.901 | DEBUG    | __main__:trials:24 - Trial = 10685/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.902 | DEBUG    | __main__:trials:29 - Trial = 10685/30000 | Total reward = 39.78
2022-01-26 14:17:16.906 | DEBUG    | __main__:trials:24 - Trial = 10686/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.906 | DEBUG    | __main__:trials:29 - Trial = 10686/30000 | Total reward = 23.53
2022-01-26 14:17:16.911 | DEBUG    | __main__:trials:24 - Trial = 10687/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.912 | DEBUG    | __main__:trials:29 - Trial = 10687/30000 | Total reward = 53.40
2022-01-26 14:17:16.915 | DEBUG    | __main__:trials:24 - Trial = 10688/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.917 | DEBUG    | __main__:trials:29 - Trial = 10688/30000 | Total reward = 29.59
2022-01-26 14:17:16.920 | DEBUG    | __main__:trials:24 - Trial = 10689/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.921 | DEBUG    | __main__:trials:29 - Trial = 10689/30000 | Total reward = 29.35
2022-01-26 14:17:16.924 | DEBUG    | __main__:trials:24 - Trial = 10690/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.926 | DEBUG    | __main__:trials:29 - Trial = 10690/30000 | Total reward = 46.77
2022-01-26 14:17:16.929 | DEBUG    | __main__:trials:24 - Trial = 10691/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.930 | DEBUG    | __main__:trials:29 - Trial = 10691/30000 | Total reward = 28.39
2022-01-26 14:17:16.933 | DEBUG    | __main__:trials:24 - Trial = 10692/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.934 | DEBUG    | __main__:trials:29 - Trial = 10692/30000 | Total reward = 39.96
2022-01-26 14:17:16.936 | DEBUG    | __main__:trials:26 - Trial = 10693/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:16.938 | DEBUG    | __main__:trials:29 - Trial = 10693/30000 | Total reward = 7.00
2022-01-26 14:17:16.942 | DEBUG    | __main__:trials:24 - Trial = 10694/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.943 | DEBUG    | __main__:trials:29 - Trial = 10694/30000 | Total reward = 28.79
2022-01-26 14:17:16.947 | DEBUG    | __main__:trials:24 - Trial = 10695/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.948 | DEBUG    | __main__:trials:29 - Trial = 10695/30000 | Total reward = 29.18
2022-01-26 14:17:16.952 | DEBUG    | __main__:trials:24 - Trial = 10696/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.954 | DEBUG    | __main__:trials:29 - Trial = 10696/30000 | Total reward = 27.91
2022-01-26 14:17:16.957 | DEBUG    | __main__:trials:24 - Trial = 10697/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.959 | DEBUG    | __main__:trials:29 - Trial = 10697/30000 | Total reward = 46.01
2022-01-26 14:17:16.963 | DEBUG    | __main__:trials:24 - Trial = 10698/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.963 | DEBUG    | __main__:trials:29 - Trial = 10698/30000 | Total reward = 55.22
2022-01-26 14:17:16.968 | DEBUG    | __main__:trials:24 - Trial = 10699/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.969 | DEBUG    | __main__:trials:29 - Trial = 10699/30000 | Total reward = 28.99
2022-01-26 14:17:16.973 | DEBUG    | __main__:trials:24 - Trial = 10700/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.974 | DEBUG    | __main__:trials:29 - Trial = 10700/30000 | Total reward = 31.91
2022-01-26 14:17:16.978 | DEBUG    | __main__:trials:24 - Trial = 10701/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.979 | DEBUG    | __main__:trials:29 - Trial = 10701/30000 | Total reward = 22.58
2022-01-26 14:17:16.983 | DEBUG    | __main__:trials:24 - Trial = 10702/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.983 | DEBUG    | __main__:trials:29 - Trial = 10702/30000 | Total reward = 25.37
2022-01-26 14:17:16.988 | DEBUG    | __main__:trials:24 - Trial = 10703/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.989 | DEBUG    | __main__:trials:29 - Trial = 10703/30000 | Total reward = 42.65
2022-01-26 14:17:16.992 | DEBUG    | __main__:trials:24 - Trial = 10704/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.993 | DEBUG    | __main__:trials:29 - Trial = 10704/30000 | Total reward = 31.33
2022-01-26 14:17:16.997 | DEBUG    | __main__:trials:24 - Trial = 10705/30000 | Max number of steps (20) reached
2022-01-26 14:17:16.998 | DEBUG    | __main__:trials:29 - Trial = 10705/30000 | Total reward = 30.94
2022-01-26 14:17:17.003 | DEBUG    | __main__:trials:24 - Trial = 10706/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.004 | DEBUG    | __main__:trials:29 - Trial = 10706/30000 | Total reward = 49.46
2022-01-26 14:17:17.007 | DEBUG    | __main__:trials:24 - Trial = 10707/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.009 | DEBUG    | __main__:trials:29 - Trial = 10707/30000 | Total reward = 32.65
2022-01-26 14:17:17.012 | DEBUG    | __main__:trials:24 - Trial = 10708/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.014 | DEBUG    | __main__:trials:29 - Trial = 10708/30000 | Total reward = 42.25
2022-01-26 14:17:17.016 | DEBUG    | __main__:trials:26 - Trial = 10709/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:17.018 | DEBUG    | __main__:trials:29 - Trial = 10709/30000 | Total reward = 6.41
2022-01-26 14:17:17.021 | DEBUG    | __main__:trials:24 - Trial = 10710/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.023 | DEBUG    | __main__:trials:29 - Trial = 10710/30000 | Total reward = 44.50
2022-01-26 14:17:17.026 | DEBUG    | __main__:trials:24 - Trial = 10711/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.027 | DEBUG    | __main__:trials:29 - Trial = 10711/30000 | Total reward = 34.12
2022-01-26 14:17:17.031 | DEBUG    | __main__:trials:24 - Trial = 10712/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.032 | DEBUG    | __main__:trials:29 - Trial = 10712/30000 | Total reward = 48.04
2022-01-26 14:17:17.036 | DEBUG    | __main__:trials:24 - Trial = 10713/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.038 | DEBUG    | __main__:trials:29 - Trial = 10713/30000 | Total reward = 48.92
2022-01-26 14:17:17.041 | DEBUG    | __main__:trials:24 - Trial = 10714/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.043 | DEBUG    | __main__:trials:29 - Trial = 10714/30000 | Total reward = 47.67
2022-01-26 14:17:17.046 | DEBUG    | __main__:trials:24 - Trial = 10715/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.048 | DEBUG    | __main__:trials:29 - Trial = 10715/30000 | Total reward = 42.33
2022-01-26 14:17:17.051 | DEBUG    | __main__:trials:24 - Trial = 10716/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.052 | DEBUG    | __main__:trials:29 - Trial = 10716/30000 | Total reward = 41.04
2022-01-26 14:17:17.056 | DEBUG    | __main__:trials:24 - Trial = 10717/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.058 | DEBUG    | __main__:trials:29 - Trial = 10717/30000 | Total reward = 40.20
2022-01-26 14:17:17.061 | DEBUG    | __main__:trials:24 - Trial = 10718/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.063 | DEBUG    | __main__:trials:29 - Trial = 10718/30000 | Total reward = 48.92
2022-01-26 14:17:17.066 | DEBUG    | __main__:trials:24 - Trial = 10719/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.067 | DEBUG    | __main__:trials:29 - Trial = 10719/30000 | Total reward = 30.82
2022-01-26 14:17:17.072 | DEBUG    | __main__:trials:24 - Trial = 10720/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.072 | DEBUG    | __main__:trials:29 - Trial = 10720/30000 | Total reward = 61.50
2022-01-26 14:17:17.076 | DEBUG    | __main__:trials:24 - Trial = 10721/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.078 | DEBUG    | __main__:trials:29 - Trial = 10721/30000 | Total reward = 40.31
2022-01-26 14:17:17.081 | DEBUG    | __main__:trials:24 - Trial = 10722/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.082 | DEBUG    | __main__:trials:29 - Trial = 10722/30000 | Total reward = 53.23
2022-01-26 14:17:17.086 | DEBUG    | __main__:trials:24 - Trial = 10723/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.087 | DEBUG    | __main__:trials:29 - Trial = 10723/30000 | Total reward = 38.28
2022-01-26 14:17:17.091 | DEBUG    | __main__:trials:24 - Trial = 10724/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.093 | DEBUG    | __main__:trials:29 - Trial = 10724/30000 | Total reward = 40.54
2022-01-26 14:17:17.096 | DEBUG    | __main__:trials:24 - Trial = 10725/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.097 | DEBUG    | __main__:trials:29 - Trial = 10725/30000 | Total reward = 41.61
2022-01-26 14:17:17.101 | DEBUG    | __main__:trials:24 - Trial = 10726/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.102 | DEBUG    | __main__:trials:29 - Trial = 10726/30000 | Total reward = 40.51
2022-01-26 14:17:17.106 | DEBUG    | __main__:trials:24 - Trial = 10727/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.107 | DEBUG    | __main__:trials:29 - Trial = 10727/30000 | Total reward = 43.48
2022-01-26 14:17:17.111 | DEBUG    | __main__:trials:24 - Trial = 10728/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.113 | DEBUG    | __main__:trials:29 - Trial = 10728/30000 | Total reward = 33.63
2022-01-26 14:17:17.116 | DEBUG    | __main__:trials:24 - Trial = 10729/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.118 | DEBUG    | __main__:trials:29 - Trial = 10729/30000 | Total reward = 38.83
2022-01-26 14:17:17.121 | DEBUG    | __main__:trials:24 - Trial = 10730/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.123 | DEBUG    | __main__:trials:29 - Trial = 10730/30000 | Total reward = 37.35
2022-01-26 14:17:17.126 | DEBUG    | __main__:trials:24 - Trial = 10731/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.127 | DEBUG    | __main__:trials:29 - Trial = 10731/30000 | Total reward = 39.93
2022-01-26 14:17:17.131 | DEBUG    | __main__:trials:24 - Trial = 10732/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.133 | DEBUG    | __main__:trials:29 - Trial = 10732/30000 | Total reward = 49.87
2022-01-26 14:17:17.136 | DEBUG    | __main__:trials:24 - Trial = 10733/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.138 | DEBUG    | __main__:trials:29 - Trial = 10733/30000 | Total reward = 32.96
2022-01-26 14:17:17.141 | DEBUG    | __main__:trials:24 - Trial = 10734/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.142 | DEBUG    | __main__:trials:29 - Trial = 10734/30000 | Total reward = 41.55
2022-01-26 14:17:17.146 | DEBUG    | __main__:trials:24 - Trial = 10735/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.147 | DEBUG    | __main__:trials:29 - Trial = 10735/30000 | Total reward = 43.35
2022-01-26 14:17:17.151 | DEBUG    | __main__:trials:24 - Trial = 10736/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.153 | DEBUG    | __main__:trials:29 - Trial = 10736/30000 | Total reward = 39.67
2022-01-26 14:17:17.157 | DEBUG    | __main__:trials:24 - Trial = 10737/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.158 | DEBUG    | __main__:trials:29 - Trial = 10737/30000 | Total reward = 32.42
2022-01-26 14:17:17.162 | DEBUG    | __main__:trials:24 - Trial = 10738/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.163 | DEBUG    | __main__:trials:29 - Trial = 10738/30000 | Total reward = 36.24
2022-01-26 14:17:17.167 | DEBUG    | __main__:trials:24 - Trial = 10739/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.167 | DEBUG    | __main__:trials:29 - Trial = 10739/30000 | Total reward = 43.49
2022-01-26 14:17:17.171 | DEBUG    | __main__:trials:24 - Trial = 10740/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.172 | DEBUG    | __main__:trials:29 - Trial = 10740/30000 | Total reward = 40.61
2022-01-26 14:17:17.175 | DEBUG    | __main__:trials:24 - Trial = 10741/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.177 | DEBUG    | __main__:trials:29 - Trial = 10741/30000 | Total reward = 37.52
2022-01-26 14:17:17.180 | DEBUG    | __main__:trials:24 - Trial = 10742/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.181 | DEBUG    | __main__:trials:29 - Trial = 10742/30000 | Total reward = 41.27
2022-01-26 14:17:17.184 | DEBUG    | __main__:trials:24 - Trial = 10743/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.185 | DEBUG    | __main__:trials:29 - Trial = 10743/30000 | Total reward = 58.79
2022-01-26 14:17:17.189 | DEBUG    | __main__:trials:24 - Trial = 10744/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.189 | DEBUG    | __main__:trials:29 - Trial = 10744/30000 | Total reward = 33.85
2022-01-26 14:17:17.193 | DEBUG    | __main__:trials:24 - Trial = 10745/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.193 | DEBUG    | __main__:trials:29 - Trial = 10745/30000 | Total reward = 33.31
2022-01-26 14:17:17.197 | DEBUG    | __main__:trials:24 - Trial = 10746/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.197 | DEBUG    | __main__:trials:29 - Trial = 10746/30000 | Total reward = 32.21
2022-01-26 14:17:17.201 | DEBUG    | __main__:trials:24 - Trial = 10747/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.201 | DEBUG    | __main__:trials:29 - Trial = 10747/30000 | Total reward = 38.39
2022-01-26 14:17:17.205 | DEBUG    | __main__:trials:24 - Trial = 10748/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.207 | DEBUG    | __main__:trials:29 - Trial = 10748/30000 | Total reward = 33.84
2022-01-26 14:17:17.210 | DEBUG    | __main__:trials:24 - Trial = 10749/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.211 | DEBUG    | __main__:trials:29 - Trial = 10749/30000 | Total reward = 55.72
2022-01-26 14:17:17.215 | DEBUG    | __main__:trials:24 - Trial = 10750/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.217 | DEBUG    | __main__:trials:29 - Trial = 10750/30000 | Total reward = 40.48
2022-01-26 14:17:17.219 | DEBUG    | __main__:trials:24 - Trial = 10751/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.221 | DEBUG    | __main__:trials:29 - Trial = 10751/30000 | Total reward = 31.84
2022-01-26 14:17:17.224 | DEBUG    | __main__:trials:24 - Trial = 10752/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.226 | DEBUG    | __main__:trials:29 - Trial = 10752/30000 | Total reward = 34.19
2022-01-26 14:17:17.228 | DEBUG    | __main__:trials:24 - Trial = 10753/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.230 | DEBUG    | __main__:trials:29 - Trial = 10753/30000 | Total reward = 34.37
2022-01-26 14:17:17.233 | DEBUG    | __main__:trials:24 - Trial = 10754/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.234 | DEBUG    | __main__:trials:29 - Trial = 10754/30000 | Total reward = 34.02
2022-01-26 14:17:17.237 | DEBUG    | __main__:trials:24 - Trial = 10755/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.237 | DEBUG    | __main__:trials:29 - Trial = 10755/30000 | Total reward = 45.00
2022-01-26 14:17:17.241 | DEBUG    | __main__:trials:24 - Trial = 10756/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.243 | DEBUG    | __main__:trials:29 - Trial = 10756/30000 | Total reward = 42.59
2022-01-26 14:17:17.246 | DEBUG    | __main__:trials:24 - Trial = 10757/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.246 | DEBUG    | __main__:trials:29 - Trial = 10757/30000 | Total reward = 34.57
2022-01-26 14:17:17.250 | DEBUG    | __main__:trials:24 - Trial = 10758/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.252 | DEBUG    | __main__:trials:29 - Trial = 10758/30000 | Total reward = 44.24
2022-01-26 14:17:17.255 | DEBUG    | __main__:trials:24 - Trial = 10759/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.256 | DEBUG    | __main__:trials:29 - Trial = 10759/30000 | Total reward = 40.80
2022-01-26 14:17:17.259 | DEBUG    | __main__:trials:24 - Trial = 10760/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.260 | DEBUG    | __main__:trials:29 - Trial = 10760/30000 | Total reward = 15.99
2022-01-26 14:17:17.263 | DEBUG    | __main__:trials:24 - Trial = 10761/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.264 | DEBUG    | __main__:trials:29 - Trial = 10761/30000 | Total reward = 36.35
2022-01-26 14:17:17.268 | DEBUG    | __main__:trials:24 - Trial = 10762/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.269 | DEBUG    | __main__:trials:29 - Trial = 10762/30000 | Total reward = 42.72
2022-01-26 14:17:17.272 | DEBUG    | __main__:trials:24 - Trial = 10763/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.273 | DEBUG    | __main__:trials:29 - Trial = 10763/30000 | Total reward = 33.84
2022-01-26 14:17:17.277 | DEBUG    | __main__:trials:24 - Trial = 10764/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.278 | DEBUG    | __main__:trials:29 - Trial = 10764/30000 | Total reward = 35.62
2022-01-26 14:17:17.281 | DEBUG    | __main__:trials:24 - Trial = 10765/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.282 | DEBUG    | __main__:trials:29 - Trial = 10765/30000 | Total reward = 35.87
2022-01-26 14:17:17.285 | DEBUG    | __main__:trials:24 - Trial = 10766/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.286 | DEBUG    | __main__:trials:29 - Trial = 10766/30000 | Total reward = 34.58
2022-01-26 14:17:17.289 | DEBUG    | __main__:trials:24 - Trial = 10767/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.291 | DEBUG    | __main__:trials:29 - Trial = 10767/30000 | Total reward = 38.04
2022-01-26 14:17:17.294 | DEBUG    | __main__:trials:24 - Trial = 10768/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.294 | DEBUG    | __main__:trials:29 - Trial = 10768/30000 | Total reward = 39.10
2022-01-26 14:17:17.298 | DEBUG    | __main__:trials:24 - Trial = 10769/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.298 | DEBUG    | __main__:trials:29 - Trial = 10769/30000 | Total reward = 42.99
2022-01-26 14:17:17.302 | DEBUG    | __main__:trials:24 - Trial = 10770/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.303 | DEBUG    | __main__:trials:29 - Trial = 10770/30000 | Total reward = 34.67
2022-01-26 14:17:17.307 | DEBUG    | __main__:trials:24 - Trial = 10771/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.309 | DEBUG    | __main__:trials:29 - Trial = 10771/30000 | Total reward = 34.20
2022-01-26 14:17:17.312 | DEBUG    | __main__:trials:24 - Trial = 10772/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.314 | DEBUG    | __main__:trials:29 - Trial = 10772/30000 | Total reward = 44.69
2022-01-26 14:17:17.316 | DEBUG    | __main__:trials:24 - Trial = 10773/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.318 | DEBUG    | __main__:trials:29 - Trial = 10773/30000 | Total reward = 31.01
2022-01-26 14:17:17.321 | DEBUG    | __main__:trials:24 - Trial = 10774/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.322 | DEBUG    | __main__:trials:29 - Trial = 10774/30000 | Total reward = 34.57
2022-01-26 14:17:17.325 | DEBUG    | __main__:trials:24 - Trial = 10775/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.327 | DEBUG    | __main__:trials:29 - Trial = 10775/30000 | Total reward = 39.52
2022-01-26 14:17:17.330 | DEBUG    | __main__:trials:24 - Trial = 10776/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.332 | DEBUG    | __main__:trials:29 - Trial = 10776/30000 | Total reward = 39.20
2022-01-26 14:17:17.336 | DEBUG    | __main__:trials:24 - Trial = 10777/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.336 | DEBUG    | __main__:trials:29 - Trial = 10777/30000 | Total reward = 41.70
2022-01-26 14:17:17.340 | DEBUG    | __main__:trials:24 - Trial = 10778/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.342 | DEBUG    | __main__:trials:29 - Trial = 10778/30000 | Total reward = 39.41
2022-01-26 14:17:17.344 | DEBUG    | __main__:trials:24 - Trial = 10779/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.346 | DEBUG    | __main__:trials:29 - Trial = 10779/30000 | Total reward = 45.87
2022-01-26 14:17:17.349 | DEBUG    | __main__:trials:24 - Trial = 10780/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.351 | DEBUG    | __main__:trials:29 - Trial = 10780/30000 | Total reward = 39.65
2022-01-26 14:17:17.354 | DEBUG    | __main__:trials:24 - Trial = 10781/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.355 | DEBUG    | __main__:trials:29 - Trial = 10781/30000 | Total reward = 43.77
2022-01-26 14:17:17.359 | DEBUG    | __main__:trials:24 - Trial = 10782/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.361 | DEBUG    | __main__:trials:29 - Trial = 10782/30000 | Total reward = 38.51
2022-01-26 14:17:17.363 | DEBUG    | __main__:trials:24 - Trial = 10783/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.364 | DEBUG    | __main__:trials:29 - Trial = 10783/30000 | Total reward = 34.16
2022-01-26 14:17:17.367 | DEBUG    | __main__:trials:24 - Trial = 10784/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.369 | DEBUG    | __main__:trials:29 - Trial = 10784/30000 | Total reward = 41.41
2022-01-26 14:17:17.373 | DEBUG    | __main__:trials:24 - Trial = 10785/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.374 | DEBUG    | __main__:trials:29 - Trial = 10785/30000 | Total reward = 32.75
2022-01-26 14:17:17.377 | DEBUG    | __main__:trials:24 - Trial = 10786/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.378 | DEBUG    | __main__:trials:29 - Trial = 10786/30000 | Total reward = 35.65
2022-01-26 14:17:17.383 | DEBUG    | __main__:trials:24 - Trial = 10787/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.385 | DEBUG    | __main__:trials:29 - Trial = 10787/30000 | Total reward = 39.45
2022-01-26 14:17:17.388 | DEBUG    | __main__:trials:24 - Trial = 10788/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.390 | DEBUG    | __main__:trials:29 - Trial = 10788/30000 | Total reward = 42.24
2022-01-26 14:17:17.393 | DEBUG    | __main__:trials:24 - Trial = 10789/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.394 | DEBUG    | __main__:trials:29 - Trial = 10789/30000 | Total reward = 31.07
2022-01-26 14:17:17.398 | DEBUG    | __main__:trials:24 - Trial = 10790/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.399 | DEBUG    | __main__:trials:29 - Trial = 10790/30000 | Total reward = 49.89
2022-01-26 14:17:17.403 | DEBUG    | __main__:trials:24 - Trial = 10791/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.403 | DEBUG    | __main__:trials:29 - Trial = 10791/30000 | Total reward = 48.98
2022-01-26 14:17:17.407 | DEBUG    | __main__:trials:24 - Trial = 10792/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.409 | DEBUG    | __main__:trials:29 - Trial = 10792/30000 | Total reward = 46.03
2022-01-26 14:17:17.412 | DEBUG    | __main__:trials:24 - Trial = 10793/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.414 | DEBUG    | __main__:trials:29 - Trial = 10793/30000 | Total reward = 46.32
2022-01-26 14:17:17.418 | DEBUG    | __main__:trials:24 - Trial = 10794/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.419 | DEBUG    | __main__:trials:29 - Trial = 10794/30000 | Total reward = 34.35
2022-01-26 14:17:17.423 | DEBUG    | __main__:trials:24 - Trial = 10795/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.424 | DEBUG    | __main__:trials:29 - Trial = 10795/30000 | Total reward = 47.69
2022-01-26 14:17:17.428 | DEBUG    | __main__:trials:24 - Trial = 10796/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.429 | DEBUG    | __main__:trials:29 - Trial = 10796/30000 | Total reward = 42.58
2022-01-26 14:17:17.432 | DEBUG    | __main__:trials:24 - Trial = 10797/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.433 | DEBUG    | __main__:trials:29 - Trial = 10797/30000 | Total reward = 59.43
2022-01-26 14:17:17.437 | DEBUG    | __main__:trials:24 - Trial = 10798/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.438 | DEBUG    | __main__:trials:29 - Trial = 10798/30000 | Total reward = 41.66
2022-01-26 14:17:17.441 | DEBUG    | __main__:trials:24 - Trial = 10799/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.442 | DEBUG    | __main__:trials:29 - Trial = 10799/30000 | Total reward = 37.79
2022-01-26 14:17:17.445 | DEBUG    | __main__:trials:24 - Trial = 10800/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.447 | DEBUG    | __main__:trials:29 - Trial = 10800/30000 | Total reward = 47.25
2022-01-26 14:17:17.450 | DEBUG    | __main__:trials:24 - Trial = 10801/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.451 | DEBUG    | __main__:trials:29 - Trial = 10801/30000 | Total reward = 38.49
2022-01-26 14:17:17.454 | DEBUG    | __main__:trials:24 - Trial = 10802/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.456 | DEBUG    | __main__:trials:29 - Trial = 10802/30000 | Total reward = 39.64
2022-01-26 14:17:17.459 | DEBUG    | __main__:trials:24 - Trial = 10803/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.460 | DEBUG    | __main__:trials:29 - Trial = 10803/30000 | Total reward = 28.97
2022-01-26 14:17:17.464 | DEBUG    | __main__:trials:24 - Trial = 10804/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.465 | DEBUG    | __main__:trials:29 - Trial = 10804/30000 | Total reward = 38.68
2022-01-26 14:17:17.469 | DEBUG    | __main__:trials:24 - Trial = 10805/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.471 | DEBUG    | __main__:trials:29 - Trial = 10805/30000 | Total reward = 33.05
2022-01-26 14:17:17.474 | DEBUG    | __main__:trials:24 - Trial = 10806/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.475 | DEBUG    | __main__:trials:29 - Trial = 10806/30000 | Total reward = 46.01
2022-01-26 14:17:17.479 | DEBUG    | __main__:trials:24 - Trial = 10807/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.481 | DEBUG    | __main__:trials:29 - Trial = 10807/30000 | Total reward = 42.88
2022-01-26 14:17:17.484 | DEBUG    | __main__:trials:24 - Trial = 10808/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.485 | DEBUG    | __main__:trials:29 - Trial = 10808/30000 | Total reward = 44.39
2022-01-26 14:17:17.489 | DEBUG    | __main__:trials:24 - Trial = 10809/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.491 | DEBUG    | __main__:trials:29 - Trial = 10809/30000 | Total reward = 39.57
2022-01-26 14:17:17.494 | DEBUG    | __main__:trials:24 - Trial = 10810/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.495 | DEBUG    | __main__:trials:29 - Trial = 10810/30000 | Total reward = 36.16
2022-01-26 14:17:17.499 | DEBUG    | __main__:trials:24 - Trial = 10811/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.500 | DEBUG    | __main__:trials:29 - Trial = 10811/30000 | Total reward = 44.82
2022-01-26 14:17:17.504 | DEBUG    | __main__:trials:24 - Trial = 10812/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.506 | DEBUG    | __main__:trials:29 - Trial = 10812/30000 | Total reward = 40.90
2022-01-26 14:17:17.509 | DEBUG    | __main__:trials:26 - Trial = 10813/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:17.510 | DEBUG    | __main__:trials:29 - Trial = 10813/30000 | Total reward = 19.25
2022-01-26 14:17:17.514 | DEBUG    | __main__:trials:24 - Trial = 10814/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.515 | DEBUG    | __main__:trials:29 - Trial = 10814/30000 | Total reward = 34.65
2022-01-26 14:17:17.519 | DEBUG    | __main__:trials:24 - Trial = 10815/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.520 | DEBUG    | __main__:trials:29 - Trial = 10815/30000 | Total reward = 36.59
2022-01-26 14:17:17.524 | DEBUG    | __main__:trials:24 - Trial = 10816/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.525 | DEBUG    | __main__:trials:29 - Trial = 10816/30000 | Total reward = 39.68
2022-01-26 14:17:17.528 | DEBUG    | __main__:trials:24 - Trial = 10817/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.530 | DEBUG    | __main__:trials:29 - Trial = 10817/30000 | Total reward = 38.98
2022-01-26 14:17:17.533 | DEBUG    | __main__:trials:24 - Trial = 10818/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.535 | DEBUG    | __main__:trials:29 - Trial = 10818/30000 | Total reward = 44.76
2022-01-26 14:17:17.538 | DEBUG    | __main__:trials:24 - Trial = 10819/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.540 | DEBUG    | __main__:trials:29 - Trial = 10819/30000 | Total reward = 48.92
2022-01-26 14:17:17.543 | DEBUG    | __main__:trials:24 - Trial = 10820/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.545 | DEBUG    | __main__:trials:29 - Trial = 10820/30000 | Total reward = 48.92
2022-01-26 14:17:17.548 | DEBUG    | __main__:trials:24 - Trial = 10821/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.549 | DEBUG    | __main__:trials:29 - Trial = 10821/30000 | Total reward = 62.73
2022-01-26 14:17:17.552 | DEBUG    | __main__:trials:24 - Trial = 10822/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.554 | DEBUG    | __main__:trials:29 - Trial = 10822/30000 | Total reward = 37.39
2022-01-26 14:17:17.557 | DEBUG    | __main__:trials:24 - Trial = 10823/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.559 | DEBUG    | __main__:trials:29 - Trial = 10823/30000 | Total reward = 48.92
2022-01-26 14:17:17.563 | DEBUG    | __main__:trials:24 - Trial = 10824/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.564 | DEBUG    | __main__:trials:29 - Trial = 10824/30000 | Total reward = 47.20
2022-01-26 14:17:17.568 | DEBUG    | __main__:trials:24 - Trial = 10825/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.569 | DEBUG    | __main__:trials:29 - Trial = 10825/30000 | Total reward = 33.76
2022-01-26 14:17:17.573 | DEBUG    | __main__:trials:24 - Trial = 10826/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.574 | DEBUG    | __main__:trials:29 - Trial = 10826/30000 | Total reward = 34.38
2022-01-26 14:17:17.577 | DEBUG    | __main__:trials:24 - Trial = 10827/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.577 | DEBUG    | __main__:trials:29 - Trial = 10827/30000 | Total reward = 35.47
2022-01-26 14:17:17.581 | DEBUG    | __main__:trials:24 - Trial = 10828/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.582 | DEBUG    | __main__:trials:29 - Trial = 10828/30000 | Total reward = 15.94
2022-01-26 14:17:17.585 | DEBUG    | __main__:trials:26 - Trial = 10829/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:17.586 | DEBUG    | __main__:trials:29 - Trial = 10829/30000 | Total reward = 39.85
2022-01-26 14:17:17.591 | DEBUG    | __main__:trials:24 - Trial = 10830/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.592 | DEBUG    | __main__:trials:29 - Trial = 10830/30000 | Total reward = 56.75
2022-01-26 14:17:17.595 | DEBUG    | __main__:trials:24 - Trial = 10831/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.597 | DEBUG    | __main__:trials:29 - Trial = 10831/30000 | Total reward = 49.20
2022-01-26 14:17:17.600 | DEBUG    | __main__:trials:24 - Trial = 10832/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.601 | DEBUG    | __main__:trials:29 - Trial = 10832/30000 | Total reward = 31.99
2022-01-26 14:17:17.605 | DEBUG    | __main__:trials:24 - Trial = 10833/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.606 | DEBUG    | __main__:trials:29 - Trial = 10833/30000 | Total reward = 28.12
2022-01-26 14:17:17.611 | DEBUG    | __main__:trials:24 - Trial = 10834/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.612 | DEBUG    | __main__:trials:29 - Trial = 10834/30000 | Total reward = 29.33
2022-01-26 14:17:17.615 | DEBUG    | __main__:trials:24 - Trial = 10835/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.617 | DEBUG    | __main__:trials:29 - Trial = 10835/30000 | Total reward = 41.04
2022-01-26 14:17:17.620 | DEBUG    | __main__:trials:24 - Trial = 10836/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.621 | DEBUG    | __main__:trials:29 - Trial = 10836/30000 | Total reward = 31.99
2022-01-26 14:17:17.625 | DEBUG    | __main__:trials:24 - Trial = 10837/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.627 | DEBUG    | __main__:trials:29 - Trial = 10837/30000 | Total reward = 32.04
2022-01-26 14:17:17.630 | DEBUG    | __main__:trials:24 - Trial = 10838/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.631 | DEBUG    | __main__:trials:29 - Trial = 10838/30000 | Total reward = 41.58
2022-01-26 14:17:17.636 | DEBUG    | __main__:trials:24 - Trial = 10839/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.636 | DEBUG    | __main__:trials:29 - Trial = 10839/30000 | Total reward = 31.25
2022-01-26 14:17:17.639 | DEBUG    | __main__:trials:26 - Trial = 10840/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:17.640 | DEBUG    | __main__:trials:29 - Trial = 10840/30000 | Total reward = 11.21
2022-01-26 14:17:17.644 | DEBUG    | __main__:trials:24 - Trial = 10841/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.645 | DEBUG    | __main__:trials:29 - Trial = 10841/30000 | Total reward = 44.33
2022-01-26 14:17:17.649 | DEBUG    | __main__:trials:24 - Trial = 10842/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.650 | DEBUG    | __main__:trials:29 - Trial = 10842/30000 | Total reward = 38.70
2022-01-26 14:17:17.653 | DEBUG    | __main__:trials:24 - Trial = 10843/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.655 | DEBUG    | __main__:trials:29 - Trial = 10843/30000 | Total reward = 42.61
2022-01-26 14:17:17.659 | DEBUG    | __main__:trials:24 - Trial = 10844/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.660 | DEBUG    | __main__:trials:29 - Trial = 10844/30000 | Total reward = 43.71
2022-01-26 14:17:17.663 | DEBUG    | __main__:trials:24 - Trial = 10845/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.665 | DEBUG    | __main__:trials:29 - Trial = 10845/30000 | Total reward = 28.15
2022-01-26 14:17:17.669 | DEBUG    | __main__:trials:24 - Trial = 10846/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.670 | DEBUG    | __main__:trials:29 - Trial = 10846/30000 | Total reward = 43.53
2022-01-26 14:17:17.673 | DEBUG    | __main__:trials:24 - Trial = 10847/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.674 | DEBUG    | __main__:trials:29 - Trial = 10847/30000 | Total reward = 34.70
2022-01-26 14:17:17.677 | DEBUG    | __main__:trials:24 - Trial = 10848/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.679 | DEBUG    | __main__:trials:29 - Trial = 10848/30000 | Total reward = 34.35
2022-01-26 14:17:17.681 | DEBUG    | __main__:trials:24 - Trial = 10849/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.683 | DEBUG    | __main__:trials:29 - Trial = 10849/30000 | Total reward = 43.22
2022-01-26 14:17:17.686 | DEBUG    | __main__:trials:24 - Trial = 10850/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.688 | DEBUG    | __main__:trials:29 - Trial = 10850/30000 | Total reward = 36.05
2022-01-26 14:17:17.691 | DEBUG    | __main__:trials:24 - Trial = 10851/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.693 | DEBUG    | __main__:trials:29 - Trial = 10851/30000 | Total reward = 48.84
2022-01-26 14:17:17.696 | DEBUG    | __main__:trials:24 - Trial = 10852/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.698 | DEBUG    | __main__:trials:29 - Trial = 10852/30000 | Total reward = 48.92
2022-01-26 14:17:17.701 | DEBUG    | __main__:trials:24 - Trial = 10853/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.702 | DEBUG    | __main__:trials:29 - Trial = 10853/30000 | Total reward = 47.78
2022-01-26 14:17:17.706 | DEBUG    | __main__:trials:24 - Trial = 10854/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.707 | DEBUG    | __main__:trials:29 - Trial = 10854/30000 | Total reward = 43.20
2022-01-26 14:17:17.711 | DEBUG    | __main__:trials:24 - Trial = 10855/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.712 | DEBUG    | __main__:trials:29 - Trial = 10855/30000 | Total reward = 42.83
2022-01-26 14:17:17.715 | DEBUG    | __main__:trials:24 - Trial = 10856/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.717 | DEBUG    | __main__:trials:29 - Trial = 10856/30000 | Total reward = 45.49
2022-01-26 14:17:17.719 | DEBUG    | __main__:trials:24 - Trial = 10857/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.721 | DEBUG    | __main__:trials:29 - Trial = 10857/30000 | Total reward = 46.70
2022-01-26 14:17:17.724 | DEBUG    | __main__:trials:24 - Trial = 10858/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.725 | DEBUG    | __main__:trials:29 - Trial = 10858/30000 | Total reward = 47.26
2022-01-26 14:17:17.728 | DEBUG    | __main__:trials:24 - Trial = 10859/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.730 | DEBUG    | __main__:trials:29 - Trial = 10859/30000 | Total reward = 39.09
2022-01-26 14:17:17.733 | DEBUG    | __main__:trials:24 - Trial = 10860/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.734 | DEBUG    | __main__:trials:29 - Trial = 10860/30000 | Total reward = 43.29
2022-01-26 14:17:17.737 | DEBUG    | __main__:trials:24 - Trial = 10861/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.739 | DEBUG    | __main__:trials:29 - Trial = 10861/30000 | Total reward = 43.41
2022-01-26 14:17:17.742 | DEBUG    | __main__:trials:24 - Trial = 10862/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.744 | DEBUG    | __main__:trials:29 - Trial = 10862/30000 | Total reward = 43.91
2022-01-26 14:17:17.747 | DEBUG    | __main__:trials:24 - Trial = 10863/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.748 | DEBUG    | __main__:trials:29 - Trial = 10863/30000 | Total reward = 43.72
2022-01-26 14:17:17.752 | DEBUG    | __main__:trials:24 - Trial = 10864/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.753 | DEBUG    | __main__:trials:29 - Trial = 10864/30000 | Total reward = 40.67
2022-01-26 14:17:17.757 | DEBUG    | __main__:trials:24 - Trial = 10865/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.758 | DEBUG    | __main__:trials:29 - Trial = 10865/30000 | Total reward = 42.55
2022-01-26 14:17:17.762 | DEBUG    | __main__:trials:26 - Trial = 10866/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:17.763 | DEBUG    | __main__:trials:29 - Trial = 10866/30000 | Total reward = 29.68
2022-01-26 14:17:17.767 | DEBUG    | __main__:trials:24 - Trial = 10867/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.767 | DEBUG    | __main__:trials:29 - Trial = 10867/30000 | Total reward = 42.58
2022-01-26 14:17:17.771 | DEBUG    | __main__:trials:24 - Trial = 10868/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.772 | DEBUG    | __main__:trials:29 - Trial = 10868/30000 | Total reward = 43.42
2022-01-26 14:17:17.775 | DEBUG    | __main__:trials:24 - Trial = 10869/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.777 | DEBUG    | __main__:trials:29 - Trial = 10869/30000 | Total reward = 32.60
2022-01-26 14:17:17.780 | DEBUG    | __main__:trials:24 - Trial = 10870/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.782 | DEBUG    | __main__:trials:29 - Trial = 10870/30000 | Total reward = 52.40
2022-01-26 14:17:17.785 | DEBUG    | __main__:trials:24 - Trial = 10871/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.785 | DEBUG    | __main__:trials:29 - Trial = 10871/30000 | Total reward = 43.45
2022-01-26 14:17:17.789 | DEBUG    | __main__:trials:24 - Trial = 10872/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.790 | DEBUG    | __main__:trials:29 - Trial = 10872/30000 | Total reward = 33.72
2022-01-26 14:17:17.793 | DEBUG    | __main__:trials:24 - Trial = 10873/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.794 | DEBUG    | __main__:trials:29 - Trial = 10873/30000 | Total reward = 55.53
2022-01-26 14:17:17.798 | DEBUG    | __main__:trials:24 - Trial = 10874/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.800 | DEBUG    | __main__:trials:29 - Trial = 10874/30000 | Total reward = 26.09
2022-01-26 14:17:17.802 | DEBUG    | __main__:trials:24 - Trial = 10875/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.803 | DEBUG    | __main__:trials:29 - Trial = 10875/30000 | Total reward = 37.55
2022-01-26 14:17:17.807 | DEBUG    | __main__:trials:24 - Trial = 10876/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.807 | DEBUG    | __main__:trials:29 - Trial = 10876/30000 | Total reward = 54.50
2022-01-26 14:17:17.811 | DEBUG    | __main__:trials:24 - Trial = 10877/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.812 | DEBUG    | __main__:trials:29 - Trial = 10877/30000 | Total reward = 29.18
2022-01-26 14:17:17.815 | DEBUG    | __main__:trials:24 - Trial = 10878/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.817 | DEBUG    | __main__:trials:29 - Trial = 10878/30000 | Total reward = 29.01
2022-01-26 14:17:17.821 | DEBUG    | __main__:trials:24 - Trial = 10879/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.822 | DEBUG    | __main__:trials:29 - Trial = 10879/30000 | Total reward = 48.92
2022-01-26 14:17:17.826 | DEBUG    | __main__:trials:24 - Trial = 10880/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.827 | DEBUG    | __main__:trials:29 - Trial = 10880/30000 | Total reward = 39.12
2022-01-26 14:17:17.830 | DEBUG    | __main__:trials:24 - Trial = 10881/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.831 | DEBUG    | __main__:trials:29 - Trial = 10881/30000 | Total reward = 41.63
2022-01-26 14:17:17.834 | DEBUG    | __main__:trials:24 - Trial = 10882/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.835 | DEBUG    | __main__:trials:29 - Trial = 10882/30000 | Total reward = 46.87
2022-01-26 14:17:17.839 | DEBUG    | __main__:trials:24 - Trial = 10883/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.839 | DEBUG    | __main__:trials:29 - Trial = 10883/30000 | Total reward = 48.23
2022-01-26 14:17:17.843 | DEBUG    | __main__:trials:24 - Trial = 10884/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.845 | DEBUG    | __main__:trials:29 - Trial = 10884/30000 | Total reward = 44.19
2022-01-26 14:17:17.849 | DEBUG    | __main__:trials:24 - Trial = 10885/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.850 | DEBUG    | __main__:trials:29 - Trial = 10885/30000 | Total reward = 46.03
2022-01-26 14:17:17.853 | DEBUG    | __main__:trials:24 - Trial = 10886/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.854 | DEBUG    | __main__:trials:29 - Trial = 10886/30000 | Total reward = 43.03
2022-01-26 14:17:17.857 | DEBUG    | __main__:trials:24 - Trial = 10887/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.858 | DEBUG    | __main__:trials:29 - Trial = 10887/30000 | Total reward = 39.88
2022-01-26 14:17:17.861 | DEBUG    | __main__:trials:24 - Trial = 10888/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.862 | DEBUG    | __main__:trials:29 - Trial = 10888/30000 | Total reward = 48.92
2022-01-26 14:17:17.866 | DEBUG    | __main__:trials:24 - Trial = 10889/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.866 | DEBUG    | __main__:trials:29 - Trial = 10889/30000 | Total reward = 46.95
2022-01-26 14:17:17.870 | DEBUG    | __main__:trials:24 - Trial = 10890/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.871 | DEBUG    | __main__:trials:29 - Trial = 10890/30000 | Total reward = 37.39
2022-01-26 14:17:17.874 | DEBUG    | __main__:trials:24 - Trial = 10891/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.875 | DEBUG    | __main__:trials:29 - Trial = 10891/30000 | Total reward = 41.68
2022-01-26 14:17:17.878 | DEBUG    | __main__:trials:24 - Trial = 10892/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.879 | DEBUG    | __main__:trials:29 - Trial = 10892/30000 | Total reward = 46.01
2022-01-26 14:17:17.883 | DEBUG    | __main__:trials:24 - Trial = 10893/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.884 | DEBUG    | __main__:trials:29 - Trial = 10893/30000 | Total reward = 42.88
2022-01-26 14:17:17.887 | DEBUG    | __main__:trials:24 - Trial = 10894/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.888 | DEBUG    | __main__:trials:29 - Trial = 10894/30000 | Total reward = 42.01
2022-01-26 14:17:17.892 | DEBUG    | __main__:trials:24 - Trial = 10895/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.893 | DEBUG    | __main__:trials:29 - Trial = 10895/30000 | Total reward = 47.43
2022-01-26 14:17:17.896 | DEBUG    | __main__:trials:24 - Trial = 10896/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.897 | DEBUG    | __main__:trials:29 - Trial = 10896/30000 | Total reward = 45.50
2022-01-26 14:17:17.899 | DEBUG    | __main__:trials:24 - Trial = 10897/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.900 | DEBUG    | __main__:trials:29 - Trial = 10897/30000 | Total reward = 41.01
2022-01-26 14:17:17.904 | DEBUG    | __main__:trials:24 - Trial = 10898/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.905 | DEBUG    | __main__:trials:29 - Trial = 10898/30000 | Total reward = 34.15
2022-01-26 14:17:17.909 | DEBUG    | __main__:trials:24 - Trial = 10899/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.909 | DEBUG    | __main__:trials:29 - Trial = 10899/30000 | Total reward = 44.67
2022-01-26 14:17:17.912 | DEBUG    | __main__:trials:24 - Trial = 10900/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.914 | DEBUG    | __main__:trials:29 - Trial = 10900/30000 | Total reward = 44.48
2022-01-26 14:17:17.917 | DEBUG    | __main__:trials:24 - Trial = 10901/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.918 | DEBUG    | __main__:trials:29 - Trial = 10901/30000 | Total reward = 43.26
2022-01-26 14:17:17.921 | DEBUG    | __main__:trials:24 - Trial = 10902/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.922 | DEBUG    | __main__:trials:29 - Trial = 10902/30000 | Total reward = 32.24
2022-01-26 14:17:17.925 | DEBUG    | __main__:trials:24 - Trial = 10903/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.926 | DEBUG    | __main__:trials:29 - Trial = 10903/30000 | Total reward = 41.87
2022-01-26 14:17:17.929 | DEBUG    | __main__:trials:24 - Trial = 10904/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.930 | DEBUG    | __main__:trials:29 - Trial = 10904/30000 | Total reward = 35.97
2022-01-26 14:17:17.933 | DEBUG    | __main__:trials:24 - Trial = 10905/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.934 | DEBUG    | __main__:trials:29 - Trial = 10905/30000 | Total reward = 45.64
2022-01-26 14:17:17.937 | DEBUG    | __main__:trials:24 - Trial = 10906/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.938 | DEBUG    | __main__:trials:29 - Trial = 10906/30000 | Total reward = 35.30
2022-01-26 14:17:17.942 | DEBUG    | __main__:trials:24 - Trial = 10907/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.943 | DEBUG    | __main__:trials:29 - Trial = 10907/30000 | Total reward = 33.72
2022-01-26 14:17:17.946 | DEBUG    | __main__:trials:24 - Trial = 10908/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.948 | DEBUG    | __main__:trials:29 - Trial = 10908/30000 | Total reward = 27.40
2022-01-26 14:17:17.951 | DEBUG    | __main__:trials:24 - Trial = 10909/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.952 | DEBUG    | __main__:trials:29 - Trial = 10909/30000 | Total reward = 44.38
2022-01-26 14:17:17.956 | DEBUG    | __main__:trials:24 - Trial = 10910/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.957 | DEBUG    | __main__:trials:29 - Trial = 10910/30000 | Total reward = 45.90
2022-01-26 14:17:17.960 | DEBUG    | __main__:trials:24 - Trial = 10911/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.962 | DEBUG    | __main__:trials:29 - Trial = 10911/30000 | Total reward = 46.63
2022-01-26 14:17:17.965 | DEBUG    | __main__:trials:24 - Trial = 10912/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.966 | DEBUG    | __main__:trials:29 - Trial = 10912/30000 | Total reward = 41.17
2022-01-26 14:17:17.969 | DEBUG    | __main__:trials:24 - Trial = 10913/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.970 | DEBUG    | __main__:trials:29 - Trial = 10913/30000 | Total reward = 27.78
2022-01-26 14:17:17.973 | DEBUG    | __main__:trials:24 - Trial = 10914/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.974 | DEBUG    | __main__:trials:29 - Trial = 10914/30000 | Total reward = 30.57
2022-01-26 14:17:17.977 | DEBUG    | __main__:trials:24 - Trial = 10915/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.978 | DEBUG    | __main__:trials:29 - Trial = 10915/30000 | Total reward = 28.06
2022-01-26 14:17:17.981 | DEBUG    | __main__:trials:24 - Trial = 10916/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.983 | DEBUG    | __main__:trials:29 - Trial = 10916/30000 | Total reward = 51.04
2022-01-26 14:17:17.985 | DEBUG    | __main__:trials:24 - Trial = 10917/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.987 | DEBUG    | __main__:trials:29 - Trial = 10917/30000 | Total reward = 47.30
2022-01-26 14:17:17.991 | DEBUG    | __main__:trials:24 - Trial = 10918/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.992 | DEBUG    | __main__:trials:29 - Trial = 10918/30000 | Total reward = 29.86
2022-01-26 14:17:17.995 | DEBUG    | __main__:trials:24 - Trial = 10919/30000 | Max number of steps (20) reached
2022-01-26 14:17:17.997 | DEBUG    | __main__:trials:29 - Trial = 10919/30000 | Total reward = 29.21
2022-01-26 14:17:18.000 | DEBUG    | __main__:trials:24 - Trial = 10920/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.002 | DEBUG    | __main__:trials:29 - Trial = 10920/30000 | Total reward = 35.02
2022-01-26 14:17:18.005 | DEBUG    | __main__:trials:24 - Trial = 10921/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.007 | DEBUG    | __main__:trials:29 - Trial = 10921/30000 | Total reward = 29.86
2022-01-26 14:17:18.011 | DEBUG    | __main__:trials:24 - Trial = 10922/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.012 | DEBUG    | __main__:trials:29 - Trial = 10922/30000 | Total reward = 31.28
2022-01-26 14:17:18.016 | DEBUG    | __main__:trials:24 - Trial = 10923/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.018 | DEBUG    | __main__:trials:29 - Trial = 10923/30000 | Total reward = 29.58
2022-01-26 14:17:18.022 | DEBUG    | __main__:trials:24 - Trial = 10924/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.022 | DEBUG    | __main__:trials:29 - Trial = 10924/30000 | Total reward = 49.31
2022-01-26 14:17:18.026 | DEBUG    | __main__:trials:24 - Trial = 10925/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.028 | DEBUG    | __main__:trials:29 - Trial = 10925/30000 | Total reward = 41.32
2022-01-26 14:17:18.031 | DEBUG    | __main__:trials:24 - Trial = 10926/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.032 | DEBUG    | __main__:trials:29 - Trial = 10926/30000 | Total reward = 42.85
2022-01-26 14:17:18.036 | DEBUG    | __main__:trials:24 - Trial = 10927/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.037 | DEBUG    | __main__:trials:29 - Trial = 10927/30000 | Total reward = 49.29
2022-01-26 14:17:18.041 | DEBUG    | __main__:trials:24 - Trial = 10928/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.042 | DEBUG    | __main__:trials:29 - Trial = 10928/30000 | Total reward = 45.27
2022-01-26 14:17:18.046 | DEBUG    | __main__:trials:24 - Trial = 10929/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.047 | DEBUG    | __main__:trials:29 - Trial = 10929/30000 | Total reward = 32.59
2022-01-26 14:17:18.050 | DEBUG    | __main__:trials:24 - Trial = 10930/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.051 | DEBUG    | __main__:trials:29 - Trial = 10930/30000 | Total reward = 42.81
2022-01-26 14:17:18.055 | DEBUG    | __main__:trials:24 - Trial = 10931/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.057 | DEBUG    | __main__:trials:29 - Trial = 10931/30000 | Total reward = 32.94
2022-01-26 14:17:18.060 | DEBUG    | __main__:trials:24 - Trial = 10932/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.062 | DEBUG    | __main__:trials:29 - Trial = 10932/30000 | Total reward = 39.50
2022-01-26 14:17:18.065 | DEBUG    | __main__:trials:24 - Trial = 10933/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.066 | DEBUG    | __main__:trials:29 - Trial = 10933/30000 | Total reward = 29.63
2022-01-26 14:17:18.070 | DEBUG    | __main__:trials:24 - Trial = 10934/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.072 | DEBUG    | __main__:trials:29 - Trial = 10934/30000 | Total reward = 29.16
2022-01-26 14:17:18.076 | DEBUG    | __main__:trials:24 - Trial = 10935/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.076 | DEBUG    | __main__:trials:29 - Trial = 10935/30000 | Total reward = 29.35
2022-01-26 14:17:18.081 | DEBUG    | __main__:trials:26 - Trial = 10936/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.082 | DEBUG    | __main__:trials:29 - Trial = 10936/30000 | Total reward = 26.17
2022-01-26 14:17:18.086 | DEBUG    | __main__:trials:24 - Trial = 10937/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.088 | DEBUG    | __main__:trials:29 - Trial = 10937/30000 | Total reward = 28.58
2022-01-26 14:17:18.091 | DEBUG    | __main__:trials:24 - Trial = 10938/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.092 | DEBUG    | __main__:trials:29 - Trial = 10938/30000 | Total reward = 42.16
2022-01-26 14:17:18.096 | DEBUG    | __main__:trials:24 - Trial = 10939/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.098 | DEBUG    | __main__:trials:29 - Trial = 10939/30000 | Total reward = 29.39
2022-01-26 14:17:18.101 | DEBUG    | __main__:trials:26 - Trial = 10940/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.101 | DEBUG    | __main__:trials:29 - Trial = 10940/30000 | Total reward = 13.83
2022-01-26 14:17:18.106 | DEBUG    | __main__:trials:24 - Trial = 10941/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.106 | DEBUG    | __main__:trials:29 - Trial = 10941/30000 | Total reward = 29.89
2022-01-26 14:17:18.111 | DEBUG    | __main__:trials:24 - Trial = 10942/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.113 | DEBUG    | __main__:trials:29 - Trial = 10942/30000 | Total reward = 33.81
2022-01-26 14:17:18.116 | DEBUG    | __main__:trials:24 - Trial = 10943/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.117 | DEBUG    | __main__:trials:29 - Trial = 10943/30000 | Total reward = 26.56
2022-01-26 14:17:18.121 | DEBUG    | __main__:trials:26 - Trial = 10944/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.121 | DEBUG    | __main__:trials:29 - Trial = 10944/30000 | Total reward = 21.38
2022-01-26 14:17:18.124 | DEBUG    | __main__:trials:24 - Trial = 10945/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.126 | DEBUG    | __main__:trials:29 - Trial = 10945/30000 | Total reward = 51.60
2022-01-26 14:17:18.129 | DEBUG    | __main__:trials:24 - Trial = 10946/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.130 | DEBUG    | __main__:trials:29 - Trial = 10946/30000 | Total reward = 28.27
2022-01-26 14:17:18.133 | DEBUG    | __main__:trials:24 - Trial = 10947/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.134 | DEBUG    | __main__:trials:29 - Trial = 10947/30000 | Total reward = 24.18
2022-01-26 14:17:18.137 | DEBUG    | __main__:trials:24 - Trial = 10948/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.138 | DEBUG    | __main__:trials:29 - Trial = 10948/30000 | Total reward = 38.62
2022-01-26 14:17:18.141 | DEBUG    | __main__:trials:24 - Trial = 10949/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.143 | DEBUG    | __main__:trials:29 - Trial = 10949/30000 | Total reward = 37.65
2022-01-26 14:17:18.146 | DEBUG    | __main__:trials:24 - Trial = 10950/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.147 | DEBUG    | __main__:trials:29 - Trial = 10950/30000 | Total reward = 27.36
2022-01-26 14:17:18.150 | DEBUG    | __main__:trials:24 - Trial = 10951/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.152 | DEBUG    | __main__:trials:29 - Trial = 10951/30000 | Total reward = 27.17
2022-01-26 14:17:18.156 | DEBUG    | __main__:trials:24 - Trial = 10952/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.156 | DEBUG    | __main__:trials:29 - Trial = 10952/30000 | Total reward = 43.29
2022-01-26 14:17:18.161 | DEBUG    | __main__:trials:24 - Trial = 10953/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.161 | DEBUG    | __main__:trials:29 - Trial = 10953/30000 | Total reward = 43.92
2022-01-26 14:17:18.166 | DEBUG    | __main__:trials:26 - Trial = 10954/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.167 | DEBUG    | __main__:trials:29 - Trial = 10954/30000 | Total reward = 14.88
2022-01-26 14:17:18.169 | DEBUG    | __main__:trials:26 - Trial = 10955/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.170 | DEBUG    | __main__:trials:29 - Trial = 10955/30000 | Total reward = 8.98
2022-01-26 14:17:18.174 | DEBUG    | __main__:trials:24 - Trial = 10956/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.175 | DEBUG    | __main__:trials:29 - Trial = 10956/30000 | Total reward = 27.89
2022-01-26 14:17:18.177 | DEBUG    | __main__:trials:24 - Trial = 10957/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.178 | DEBUG    | __main__:trials:29 - Trial = 10957/30000 | Total reward = 16.13
2022-01-26 14:17:18.182 | DEBUG    | __main__:trials:24 - Trial = 10958/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.183 | DEBUG    | __main__:trials:29 - Trial = 10958/30000 | Total reward = 20.66
2022-01-26 14:17:18.186 | DEBUG    | __main__:trials:24 - Trial = 10959/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.187 | DEBUG    | __main__:trials:29 - Trial = 10959/30000 | Total reward = 27.21
2022-01-26 14:17:18.191 | DEBUG    | __main__:trials:24 - Trial = 10960/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.191 | DEBUG    | __main__:trials:29 - Trial = 10960/30000 | Total reward = 46.57
2022-01-26 14:17:18.195 | DEBUG    | __main__:trials:24 - Trial = 10961/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.196 | DEBUG    | __main__:trials:29 - Trial = 10961/30000 | Total reward = 22.48
2022-01-26 14:17:18.199 | DEBUG    | __main__:trials:24 - Trial = 10962/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.201 | DEBUG    | __main__:trials:29 - Trial = 10962/30000 | Total reward = 44.53
2022-01-26 14:17:18.204 | DEBUG    | __main__:trials:24 - Trial = 10963/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.205 | DEBUG    | __main__:trials:29 - Trial = 10963/30000 | Total reward = 47.21
2022-01-26 14:17:18.208 | DEBUG    | __main__:trials:26 - Trial = 10964/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.210 | DEBUG    | __main__:trials:29 - Trial = 10964/30000 | Total reward = 17.31
2022-01-26 14:17:18.213 | DEBUG    | __main__:trials:24 - Trial = 10965/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.214 | DEBUG    | __main__:trials:29 - Trial = 10965/30000 | Total reward = 25.17
2022-01-26 14:17:18.218 | DEBUG    | __main__:trials:24 - Trial = 10966/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.219 | DEBUG    | __main__:trials:29 - Trial = 10966/30000 | Total reward = 48.09
2022-01-26 14:17:18.222 | DEBUG    | __main__:trials:24 - Trial = 10967/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.224 | DEBUG    | __main__:trials:29 - Trial = 10967/30000 | Total reward = 26.71
2022-01-26 14:17:18.227 | DEBUG    | __main__:trials:24 - Trial = 10968/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.228 | DEBUG    | __main__:trials:29 - Trial = 10968/30000 | Total reward = 46.43
2022-01-26 14:17:18.231 | DEBUG    | __main__:trials:24 - Trial = 10969/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.233 | DEBUG    | __main__:trials:29 - Trial = 10969/30000 | Total reward = 26.59
2022-01-26 14:17:18.236 | DEBUG    | __main__:trials:24 - Trial = 10970/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.237 | DEBUG    | __main__:trials:29 - Trial = 10970/30000 | Total reward = 26.37
2022-01-26 14:17:18.240 | DEBUG    | __main__:trials:24 - Trial = 10971/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.241 | DEBUG    | __main__:trials:29 - Trial = 10971/30000 | Total reward = 59.31
2022-01-26 14:17:18.244 | DEBUG    | __main__:trials:24 - Trial = 10972/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.245 | DEBUG    | __main__:trials:29 - Trial = 10972/30000 | Total reward = 32.42
2022-01-26 14:17:18.247 | DEBUG    | __main__:trials:26 - Trial = 10973/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.248 | DEBUG    | __main__:trials:29 - Trial = 10973/30000 | Total reward = 8.39
2022-01-26 14:17:18.251 | DEBUG    | __main__:trials:24 - Trial = 10974/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.252 | DEBUG    | __main__:trials:29 - Trial = 10974/30000 | Total reward = 26.67
2022-01-26 14:17:18.255 | DEBUG    | __main__:trials:24 - Trial = 10975/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.257 | DEBUG    | __main__:trials:29 - Trial = 10975/30000 | Total reward = 25.67
2022-01-26 14:17:18.260 | DEBUG    | __main__:trials:24 - Trial = 10976/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.262 | DEBUG    | __main__:trials:29 - Trial = 10976/30000 | Total reward = 44.39
2022-01-26 14:17:18.265 | DEBUG    | __main__:trials:24 - Trial = 10977/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.266 | DEBUG    | __main__:trials:29 - Trial = 10977/30000 | Total reward = 61.51
2022-01-26 14:17:18.269 | DEBUG    | __main__:trials:26 - Trial = 10978/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.270 | DEBUG    | __main__:trials:29 - Trial = 10978/30000 | Total reward = 19.03
2022-01-26 14:17:18.272 | DEBUG    | __main__:trials:26 - Trial = 10979/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.274 | DEBUG    | __main__:trials:29 - Trial = 10979/30000 | Total reward = 7.44
2022-01-26 14:17:18.277 | DEBUG    | __main__:trials:24 - Trial = 10980/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.279 | DEBUG    | __main__:trials:29 - Trial = 10980/30000 | Total reward = 40.17
2022-01-26 14:17:18.282 | DEBUG    | __main__:trials:24 - Trial = 10981/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.282 | DEBUG    | __main__:trials:29 - Trial = 10981/30000 | Total reward = 47.18
2022-01-26 14:17:18.286 | DEBUG    | __main__:trials:24 - Trial = 10982/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.288 | DEBUG    | __main__:trials:29 - Trial = 10982/30000 | Total reward = 22.23
2022-01-26 14:17:18.290 | DEBUG    | __main__:trials:24 - Trial = 10983/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.291 | DEBUG    | __main__:trials:29 - Trial = 10983/30000 | Total reward = 42.14
2022-01-26 14:17:18.295 | DEBUG    | __main__:trials:24 - Trial = 10984/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.296 | DEBUG    | __main__:trials:29 - Trial = 10984/30000 | Total reward = 39.34
2022-01-26 14:17:18.299 | DEBUG    | __main__:trials:24 - Trial = 10985/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.301 | DEBUG    | __main__:trials:29 - Trial = 10985/30000 | Total reward = 44.28
2022-01-26 14:17:18.304 | DEBUG    | __main__:trials:24 - Trial = 10986/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.305 | DEBUG    | __main__:trials:29 - Trial = 10986/30000 | Total reward = 48.92
2022-01-26 14:17:18.310 | DEBUG    | __main__:trials:24 - Trial = 10987/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.311 | DEBUG    | __main__:trials:29 - Trial = 10987/30000 | Total reward = 35.00
2022-01-26 14:17:18.314 | DEBUG    | __main__:trials:24 - Trial = 10988/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.316 | DEBUG    | __main__:trials:29 - Trial = 10988/30000 | Total reward = 27.29
2022-01-26 14:17:18.319 | DEBUG    | __main__:trials:24 - Trial = 10989/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.320 | DEBUG    | __main__:trials:29 - Trial = 10989/30000 | Total reward = 48.46
2022-01-26 14:17:18.324 | DEBUG    | __main__:trials:24 - Trial = 10990/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.325 | DEBUG    | __main__:trials:29 - Trial = 10990/30000 | Total reward = 43.93
2022-01-26 14:17:18.328 | DEBUG    | __main__:trials:24 - Trial = 10991/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.330 | DEBUG    | __main__:trials:29 - Trial = 10991/30000 | Total reward = 45.52
2022-01-26 14:17:18.333 | DEBUG    | __main__:trials:24 - Trial = 10992/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.335 | DEBUG    | __main__:trials:29 - Trial = 10992/30000 | Total reward = 47.00
2022-01-26 14:17:18.339 | DEBUG    | __main__:trials:24 - Trial = 10993/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.340 | DEBUG    | __main__:trials:29 - Trial = 10993/30000 | Total reward = 32.90
2022-01-26 14:17:18.344 | DEBUG    | __main__:trials:24 - Trial = 10994/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.345 | DEBUG    | __main__:trials:29 - Trial = 10994/30000 | Total reward = 23.46
2022-01-26 14:17:18.349 | DEBUG    | __main__:trials:26 - Trial = 10995/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.350 | DEBUG    | __main__:trials:29 - Trial = 10995/30000 | Total reward = 17.99
2022-01-26 14:17:18.354 | DEBUG    | __main__:trials:26 - Trial = 10996/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.355 | DEBUG    | __main__:trials:29 - Trial = 10996/30000 | Total reward = 20.13
2022-01-26 14:17:18.359 | DEBUG    | __main__:trials:24 - Trial = 10997/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.360 | DEBUG    | __main__:trials:29 - Trial = 10997/30000 | Total reward = 38.49
2022-01-26 14:17:18.363 | DEBUG    | __main__:trials:24 - Trial = 10998/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.365 | DEBUG    | __main__:trials:29 - Trial = 10998/30000 | Total reward = 43.20
2022-01-26 14:17:18.369 | DEBUG    | __main__:trials:24 - Trial = 10999/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.370 | DEBUG    | __main__:trials:29 - Trial = 10999/30000 | Total reward = 47.62
2022-01-26 14:17:18.372 | DEBUG    | __main__:trials:26 - Trial = 11000/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.374 | DEBUG    | __main__:trials:29 - Trial = 11000/30000 | Total reward = 15.21
2022-01-26 14:17:18.377 | DEBUG    | __main__:trials:26 - Trial = 11001/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.377 | DEBUG    | __main__:trials:29 - Trial = 11001/30000 | Total reward = 7.44
2022-01-26 14:17:18.381 | DEBUG    | __main__:trials:24 - Trial = 11002/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.383 | DEBUG    | __main__:trials:29 - Trial = 11002/30000 | Total reward = 39.16
2022-01-26 14:17:18.385 | DEBUG    | __main__:trials:26 - Trial = 11003/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.387 | DEBUG    | __main__:trials:29 - Trial = 11003/30000 | Total reward = 9.98
2022-01-26 14:17:18.390 | DEBUG    | __main__:trials:24 - Trial = 11004/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.392 | DEBUG    | __main__:trials:29 - Trial = 11004/30000 | Total reward = 43.59
2022-01-26 14:17:18.395 | DEBUG    | __main__:trials:24 - Trial = 11005/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.397 | DEBUG    | __main__:trials:29 - Trial = 11005/30000 | Total reward = 30.81
2022-01-26 14:17:18.400 | DEBUG    | __main__:trials:24 - Trial = 11006/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.402 | DEBUG    | __main__:trials:29 - Trial = 11006/30000 | Total reward = 43.49
2022-01-26 14:17:18.406 | DEBUG    | __main__:trials:24 - Trial = 11007/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.407 | DEBUG    | __main__:trials:29 - Trial = 11007/30000 | Total reward = 21.49
2022-01-26 14:17:18.411 | DEBUG    | __main__:trials:24 - Trial = 11008/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.412 | DEBUG    | __main__:trials:29 - Trial = 11008/30000 | Total reward = 29.35
2022-01-26 14:17:18.416 | DEBUG    | __main__:trials:24 - Trial = 11009/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.418 | DEBUG    | __main__:trials:29 - Trial = 11009/30000 | Total reward = 28.58
2022-01-26 14:17:18.420 | DEBUG    | __main__:trials:26 - Trial = 11010/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.422 | DEBUG    | __main__:trials:29 - Trial = 11010/30000 | Total reward = 6.43
2022-01-26 14:17:18.426 | DEBUG    | __main__:trials:24 - Trial = 11011/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.427 | DEBUG    | __main__:trials:29 - Trial = 11011/30000 | Total reward = 25.67
2022-01-26 14:17:18.430 | DEBUG    | __main__:trials:26 - Trial = 11012/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.432 | DEBUG    | __main__:trials:29 - Trial = 11012/30000 | Total reward = 8.59
2022-01-26 14:17:18.435 | DEBUG    | __main__:trials:24 - Trial = 11013/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.437 | DEBUG    | __main__:trials:29 - Trial = 11013/30000 | Total reward = 43.09
2022-01-26 14:17:18.441 | DEBUG    | __main__:trials:24 - Trial = 11014/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.442 | DEBUG    | __main__:trials:29 - Trial = 11014/30000 | Total reward = 29.35
2022-01-26 14:17:18.446 | DEBUG    | __main__:trials:24 - Trial = 11015/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.447 | DEBUG    | __main__:trials:29 - Trial = 11015/30000 | Total reward = 20.02
2022-01-26 14:17:18.450 | DEBUG    | __main__:trials:24 - Trial = 11016/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.452 | DEBUG    | __main__:trials:29 - Trial = 11016/30000 | Total reward = 27.32
2022-01-26 14:17:18.456 | DEBUG    | __main__:trials:24 - Trial = 11017/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.457 | DEBUG    | __main__:trials:29 - Trial = 11017/30000 | Total reward = 24.06
2022-01-26 14:17:18.461 | DEBUG    | __main__:trials:24 - Trial = 11018/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.462 | DEBUG    | __main__:trials:29 - Trial = 11018/30000 | Total reward = 41.32
2022-01-26 14:17:18.466 | DEBUG    | __main__:trials:26 - Trial = 11019/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.467 | DEBUG    | __main__:trials:29 - Trial = 11019/30000 | Total reward = 24.68
2022-01-26 14:17:18.471 | DEBUG    | __main__:trials:24 - Trial = 11020/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.472 | DEBUG    | __main__:trials:29 - Trial = 11020/30000 | Total reward = 34.77
2022-01-26 14:17:18.475 | DEBUG    | __main__:trials:26 - Trial = 11021/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.477 | DEBUG    | __main__:trials:29 - Trial = 11021/30000 | Total reward = 15.71
2022-01-26 14:17:18.481 | DEBUG    | __main__:trials:24 - Trial = 11022/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.482 | DEBUG    | __main__:trials:29 - Trial = 11022/30000 | Total reward = 27.80
2022-01-26 14:17:18.485 | DEBUG    | __main__:trials:24 - Trial = 11023/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.486 | DEBUG    | __main__:trials:29 - Trial = 11023/30000 | Total reward = 38.46
2022-01-26 14:17:18.489 | DEBUG    | __main__:trials:24 - Trial = 11024/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.491 | DEBUG    | __main__:trials:29 - Trial = 11024/30000 | Total reward = 29.54
2022-01-26 14:17:18.495 | DEBUG    | __main__:trials:24 - Trial = 11025/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.496 | DEBUG    | __main__:trials:29 - Trial = 11025/30000 | Total reward = 33.05
2022-01-26 14:17:18.500 | DEBUG    | __main__:trials:24 - Trial = 11026/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.501 | DEBUG    | __main__:trials:29 - Trial = 11026/30000 | Total reward = 35.04
2022-01-26 14:17:18.505 | DEBUG    | __main__:trials:24 - Trial = 11027/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.507 | DEBUG    | __main__:trials:29 - Trial = 11027/30000 | Total reward = 48.82
2022-01-26 14:17:18.510 | DEBUG    | __main__:trials:24 - Trial = 11028/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.512 | DEBUG    | __main__:trials:29 - Trial = 11028/30000 | Total reward = 28.68
2022-01-26 14:17:18.515 | DEBUG    | __main__:trials:24 - Trial = 11029/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.517 | DEBUG    | __main__:trials:29 - Trial = 11029/30000 | Total reward = 41.88
2022-01-26 14:17:18.520 | DEBUG    | __main__:trials:24 - Trial = 11030/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.521 | DEBUG    | __main__:trials:29 - Trial = 11030/30000 | Total reward = 29.60
2022-01-26 14:17:18.525 | DEBUG    | __main__:trials:24 - Trial = 11031/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.527 | DEBUG    | __main__:trials:29 - Trial = 11031/30000 | Total reward = 46.47
2022-01-26 14:17:18.530 | DEBUG    | __main__:trials:24 - Trial = 11032/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.532 | DEBUG    | __main__:trials:29 - Trial = 11032/30000 | Total reward = 41.31
2022-01-26 14:17:18.536 | DEBUG    | __main__:trials:24 - Trial = 11033/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.537 | DEBUG    | __main__:trials:29 - Trial = 11033/30000 | Total reward = 42.88
2022-01-26 14:17:18.540 | DEBUG    | __main__:trials:24 - Trial = 11034/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.542 | DEBUG    | __main__:trials:29 - Trial = 11034/30000 | Total reward = 47.56
2022-01-26 14:17:18.546 | DEBUG    | __main__:trials:24 - Trial = 11035/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.548 | DEBUG    | __main__:trials:29 - Trial = 11035/30000 | Total reward = 25.99
2022-01-26 14:17:18.551 | DEBUG    | __main__:trials:24 - Trial = 11036/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.553 | DEBUG    | __main__:trials:29 - Trial = 11036/30000 | Total reward = 24.33
2022-01-26 14:17:18.556 | DEBUG    | __main__:trials:26 - Trial = 11037/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.557 | DEBUG    | __main__:trials:29 - Trial = 11037/30000 | Total reward = 21.29
2022-01-26 14:17:18.561 | DEBUG    | __main__:trials:24 - Trial = 11038/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.563 | DEBUG    | __main__:trials:29 - Trial = 11038/30000 | Total reward = 37.25
2022-01-26 14:17:18.565 | DEBUG    | __main__:trials:24 - Trial = 11039/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.567 | DEBUG    | __main__:trials:29 - Trial = 11039/30000 | Total reward = 29.01
2022-01-26 14:17:18.570 | DEBUG    | __main__:trials:24 - Trial = 11040/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.572 | DEBUG    | __main__:trials:29 - Trial = 11040/30000 | Total reward = 36.68
2022-01-26 14:17:18.575 | DEBUG    | __main__:trials:24 - Trial = 11041/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.577 | DEBUG    | __main__:trials:29 - Trial = 11041/30000 | Total reward = 29.95
2022-01-26 14:17:18.580 | DEBUG    | __main__:trials:24 - Trial = 11042/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.582 | DEBUG    | __main__:trials:29 - Trial = 11042/30000 | Total reward = 29.02
2022-01-26 14:17:18.586 | DEBUG    | __main__:trials:24 - Trial = 11043/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.586 | DEBUG    | __main__:trials:29 - Trial = 11043/30000 | Total reward = 32.38
2022-01-26 14:17:18.589 | DEBUG    | __main__:trials:26 - Trial = 11044/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.591 | DEBUG    | __main__:trials:29 - Trial = 11044/30000 | Total reward = 14.08
2022-01-26 14:17:18.595 | DEBUG    | __main__:trials:24 - Trial = 11045/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.596 | DEBUG    | __main__:trials:29 - Trial = 11045/30000 | Total reward = 26.40
2022-01-26 14:17:18.599 | DEBUG    | __main__:trials:26 - Trial = 11046/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.599 | DEBUG    | __main__:trials:29 - Trial = 11046/30000 | Total reward = 7.44
2022-01-26 14:17:18.604 | DEBUG    | __main__:trials:24 - Trial = 11047/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.605 | DEBUG    | __main__:trials:29 - Trial = 11047/30000 | Total reward = 32.28
2022-01-26 14:17:18.609 | DEBUG    | __main__:trials:24 - Trial = 11048/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.610 | DEBUG    | __main__:trials:29 - Trial = 11048/30000 | Total reward = 46.74
2022-01-26 14:17:18.613 | DEBUG    | __main__:trials:24 - Trial = 11049/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.615 | DEBUG    | __main__:trials:29 - Trial = 11049/30000 | Total reward = 25.65
2022-01-26 14:17:18.619 | DEBUG    | __main__:trials:24 - Trial = 11050/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.620 | DEBUG    | __main__:trials:29 - Trial = 11050/30000 | Total reward = 36.73
2022-01-26 14:17:18.624 | DEBUG    | __main__:trials:24 - Trial = 11051/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.625 | DEBUG    | __main__:trials:29 - Trial = 11051/30000 | Total reward = 27.94
2022-01-26 14:17:18.627 | DEBUG    | __main__:trials:26 - Trial = 11052/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.628 | DEBUG    | __main__:trials:29 - Trial = 11052/30000 | Total reward = 8.00
2022-01-26 14:17:18.631 | DEBUG    | __main__:trials:24 - Trial = 11053/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.632 | DEBUG    | __main__:trials:29 - Trial = 11053/30000 | Total reward = 60.38
2022-01-26 14:17:18.635 | DEBUG    | __main__:trials:26 - Trial = 11054/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.636 | DEBUG    | __main__:trials:29 - Trial = 11054/30000 | Total reward = 12.89
2022-01-26 14:17:18.640 | DEBUG    | __main__:trials:24 - Trial = 11055/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.643 | DEBUG    | __main__:trials:29 - Trial = 11055/30000 | Total reward = 29.49
2022-01-26 14:17:18.646 | DEBUG    | __main__:trials:24 - Trial = 11056/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.647 | DEBUG    | __main__:trials:29 - Trial = 11056/30000 | Total reward = 29.98
2022-01-26 14:17:18.651 | DEBUG    | __main__:trials:24 - Trial = 11057/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.653 | DEBUG    | __main__:trials:29 - Trial = 11057/30000 | Total reward = 32.20
2022-01-26 14:17:18.656 | DEBUG    | __main__:trials:24 - Trial = 11058/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.657 | DEBUG    | __main__:trials:29 - Trial = 11058/30000 | Total reward = 29.36
2022-01-26 14:17:18.661 | DEBUG    | __main__:trials:24 - Trial = 11059/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.662 | DEBUG    | __main__:trials:29 - Trial = 11059/30000 | Total reward = 35.55
2022-01-26 14:17:18.666 | DEBUG    | __main__:trials:24 - Trial = 11060/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.668 | DEBUG    | __main__:trials:29 - Trial = 11060/30000 | Total reward = 30.66
2022-01-26 14:17:18.671 | DEBUG    | __main__:trials:24 - Trial = 11061/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.673 | DEBUG    | __main__:trials:29 - Trial = 11061/30000 | Total reward = 47.21
2022-01-26 14:17:18.676 | DEBUG    | __main__:trials:24 - Trial = 11062/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.678 | DEBUG    | __main__:trials:29 - Trial = 11062/30000 | Total reward = 36.14
2022-01-26 14:17:18.681 | DEBUG    | __main__:trials:24 - Trial = 11063/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.683 | DEBUG    | __main__:trials:29 - Trial = 11063/30000 | Total reward = 26.46
2022-01-26 14:17:18.686 | DEBUG    | __main__:trials:24 - Trial = 11064/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.687 | DEBUG    | __main__:trials:29 - Trial = 11064/30000 | Total reward = 28.68
2022-01-26 14:17:18.690 | DEBUG    | __main__:trials:26 - Trial = 11065/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.692 | DEBUG    | __main__:trials:29 - Trial = 11065/30000 | Total reward = 23.08
2022-01-26 14:17:18.696 | DEBUG    | __main__:trials:24 - Trial = 11066/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.697 | DEBUG    | __main__:trials:29 - Trial = 11066/30000 | Total reward = 46.18
2022-01-26 14:17:18.700 | DEBUG    | __main__:trials:26 - Trial = 11067/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.701 | DEBUG    | __main__:trials:29 - Trial = 11067/30000 | Total reward = 7.00
2022-01-26 14:17:18.705 | DEBUG    | __main__:trials:24 - Trial = 11068/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.706 | DEBUG    | __main__:trials:29 - Trial = 11068/30000 | Total reward = 27.36
2022-01-26 14:17:18.710 | DEBUG    | __main__:trials:24 - Trial = 11069/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.711 | DEBUG    | __main__:trials:29 - Trial = 11069/30000 | Total reward = 30.40
2022-01-26 14:17:18.715 | DEBUG    | __main__:trials:24 - Trial = 11070/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.716 | DEBUG    | __main__:trials:29 - Trial = 11070/30000 | Total reward = 36.50
2022-01-26 14:17:18.719 | DEBUG    | __main__:trials:26 - Trial = 11071/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.721 | DEBUG    | __main__:trials:29 - Trial = 11071/30000 | Total reward = 12.67
2022-01-26 14:17:18.723 | DEBUG    | __main__:trials:26 - Trial = 11072/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.724 | DEBUG    | __main__:trials:29 - Trial = 11072/30000 | Total reward = 10.89
2022-01-26 14:17:18.728 | DEBUG    | __main__:trials:24 - Trial = 11073/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.730 | DEBUG    | __main__:trials:29 - Trial = 11073/30000 | Total reward = 27.04
2022-01-26 14:17:18.734 | DEBUG    | __main__:trials:24 - Trial = 11074/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.735 | DEBUG    | __main__:trials:29 - Trial = 11074/30000 | Total reward = 42.98
2022-01-26 14:17:18.738 | DEBUG    | __main__:trials:24 - Trial = 11075/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.740 | DEBUG    | __main__:trials:29 - Trial = 11075/30000 | Total reward = 29.37
2022-01-26 14:17:18.744 | DEBUG    | __main__:trials:24 - Trial = 11076/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.744 | DEBUG    | __main__:trials:29 - Trial = 11076/30000 | Total reward = 45.53
2022-01-26 14:17:18.748 | DEBUG    | __main__:trials:24 - Trial = 11077/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.750 | DEBUG    | __main__:trials:29 - Trial = 11077/30000 | Total reward = 29.71
2022-01-26 14:17:18.754 | DEBUG    | __main__:trials:24 - Trial = 11078/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.755 | DEBUG    | __main__:trials:29 - Trial = 11078/30000 | Total reward = 41.84
2022-01-26 14:17:18.759 | DEBUG    | __main__:trials:24 - Trial = 11079/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.761 | DEBUG    | __main__:trials:29 - Trial = 11079/30000 | Total reward = 33.80
2022-01-26 14:17:18.764 | DEBUG    | __main__:trials:24 - Trial = 11080/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.766 | DEBUG    | __main__:trials:29 - Trial = 11080/30000 | Total reward = 37.66
2022-01-26 14:17:18.770 | DEBUG    | __main__:trials:24 - Trial = 11081/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.771 | DEBUG    | __main__:trials:29 - Trial = 11081/30000 | Total reward = 29.61
2022-01-26 14:17:18.774 | DEBUG    | __main__:trials:26 - Trial = 11082/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.776 | DEBUG    | __main__:trials:29 - Trial = 11082/30000 | Total reward = 13.27
2022-01-26 14:17:18.779 | DEBUG    | __main__:trials:24 - Trial = 11083/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.781 | DEBUG    | __main__:trials:29 - Trial = 11083/30000 | Total reward = 45.66
2022-01-26 14:17:18.785 | DEBUG    | __main__:trials:24 - Trial = 11084/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.786 | DEBUG    | __main__:trials:29 - Trial = 11084/30000 | Total reward = 24.16
2022-01-26 14:17:18.790 | DEBUG    | __main__:trials:24 - Trial = 11085/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.792 | DEBUG    | __main__:trials:29 - Trial = 11085/30000 | Total reward = 39.22
2022-01-26 14:17:18.795 | DEBUG    | __main__:trials:24 - Trial = 11086/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.796 | DEBUG    | __main__:trials:29 - Trial = 11086/30000 | Total reward = 31.20
2022-01-26 14:17:18.800 | DEBUG    | __main__:trials:24 - Trial = 11087/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.802 | DEBUG    | __main__:trials:29 - Trial = 11087/30000 | Total reward = 27.40
2022-01-26 14:17:18.805 | DEBUG    | __main__:trials:24 - Trial = 11088/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.807 | DEBUG    | __main__:trials:29 - Trial = 11088/30000 | Total reward = 58.21
2022-01-26 14:17:18.811 | DEBUG    | __main__:trials:24 - Trial = 11089/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.812 | DEBUG    | __main__:trials:29 - Trial = 11089/30000 | Total reward = 30.25
2022-01-26 14:17:18.816 | DEBUG    | __main__:trials:24 - Trial = 11090/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.817 | DEBUG    | __main__:trials:29 - Trial = 11090/30000 | Total reward = 29.37
2022-01-26 14:17:18.821 | DEBUG    | __main__:trials:24 - Trial = 11091/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.823 | DEBUG    | __main__:trials:29 - Trial = 11091/30000 | Total reward = 49.69
2022-01-26 14:17:18.825 | DEBUG    | __main__:trials:26 - Trial = 11092/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.826 | DEBUG    | __main__:trials:29 - Trial = 11092/30000 | Total reward = 19.11
2022-01-26 14:17:18.829 | DEBUG    | __main__:trials:24 - Trial = 11093/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.831 | DEBUG    | __main__:trials:29 - Trial = 11093/30000 | Total reward = 37.42
2022-01-26 14:17:18.835 | DEBUG    | __main__:trials:24 - Trial = 11094/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.836 | DEBUG    | __main__:trials:29 - Trial = 11094/30000 | Total reward = 29.15
2022-01-26 14:17:18.840 | DEBUG    | __main__:trials:24 - Trial = 11095/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.841 | DEBUG    | __main__:trials:29 - Trial = 11095/30000 | Total reward = 29.63
2022-01-26 14:17:18.844 | DEBUG    | __main__:trials:26 - Trial = 11096/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.844 | DEBUG    | __main__:trials:29 - Trial = 11096/30000 | Total reward = 8.84
2022-01-26 14:17:18.848 | DEBUG    | __main__:trials:24 - Trial = 11097/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.849 | DEBUG    | __main__:trials:29 - Trial = 11097/30000 | Total reward = 55.11
2022-01-26 14:17:18.853 | DEBUG    | __main__:trials:24 - Trial = 11098/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.854 | DEBUG    | __main__:trials:29 - Trial = 11098/30000 | Total reward = 25.78
2022-01-26 14:17:18.858 | DEBUG    | __main__:trials:24 - Trial = 11099/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.858 | DEBUG    | __main__:trials:29 - Trial = 11099/30000 | Total reward = 29.52
2022-01-26 14:17:18.862 | DEBUG    | __main__:trials:24 - Trial = 11100/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.864 | DEBUG    | __main__:trials:29 - Trial = 11100/30000 | Total reward = 41.52
2022-01-26 14:17:18.867 | DEBUG    | __main__:trials:24 - Trial = 11101/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.869 | DEBUG    | __main__:trials:29 - Trial = 11101/30000 | Total reward = 29.37
2022-01-26 14:17:18.872 | DEBUG    | __main__:trials:26 - Trial = 11102/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.872 | DEBUG    | __main__:trials:29 - Trial = 11102/30000 | Total reward = 13.27
2022-01-26 14:17:18.876 | DEBUG    | __main__:trials:24 - Trial = 11103/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.877 | DEBUG    | __main__:trials:29 - Trial = 11103/30000 | Total reward = 11.84
2022-01-26 14:17:18.881 | DEBUG    | __main__:trials:24 - Trial = 11104/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.882 | DEBUG    | __main__:trials:29 - Trial = 11104/30000 | Total reward = 36.11
2022-01-26 14:17:18.885 | DEBUG    | __main__:trials:24 - Trial = 11105/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.886 | DEBUG    | __main__:trials:29 - Trial = 11105/30000 | Total reward = 43.46
2022-01-26 14:17:18.890 | DEBUG    | __main__:trials:24 - Trial = 11106/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.890 | DEBUG    | __main__:trials:29 - Trial = 11106/30000 | Total reward = 43.69
2022-01-26 14:17:18.894 | DEBUG    | __main__:trials:24 - Trial = 11107/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.896 | DEBUG    | __main__:trials:29 - Trial = 11107/30000 | Total reward = 41.99
2022-01-26 14:17:18.900 | DEBUG    | __main__:trials:24 - Trial = 11108/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.901 | DEBUG    | __main__:trials:29 - Trial = 11108/30000 | Total reward = 41.13
2022-01-26 14:17:18.904 | DEBUG    | __main__:trials:24 - Trial = 11109/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.905 | DEBUG    | __main__:trials:29 - Trial = 11109/30000 | Total reward = 29.33
2022-01-26 14:17:18.908 | DEBUG    | __main__:trials:24 - Trial = 11110/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.909 | DEBUG    | __main__:trials:29 - Trial = 11110/30000 | Total reward = 35.50
2022-01-26 14:17:18.911 | DEBUG    | __main__:trials:26 - Trial = 11111/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.912 | DEBUG    | __main__:trials:29 - Trial = 11111/30000 | Total reward = 8.89
2022-01-26 14:17:18.916 | DEBUG    | __main__:trials:24 - Trial = 11112/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.917 | DEBUG    | __main__:trials:29 - Trial = 11112/30000 | Total reward = 50.33
2022-01-26 14:17:18.920 | DEBUG    | __main__:trials:24 - Trial = 11113/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.921 | DEBUG    | __main__:trials:29 - Trial = 11113/30000 | Total reward = 50.23
2022-01-26 14:17:18.924 | DEBUG    | __main__:trials:24 - Trial = 11114/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.925 | DEBUG    | __main__:trials:29 - Trial = 11114/30000 | Total reward = 29.37
2022-01-26 14:17:18.929 | DEBUG    | __main__:trials:24 - Trial = 11115/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.929 | DEBUG    | __main__:trials:29 - Trial = 11115/30000 | Total reward = 62.40
2022-01-26 14:17:18.933 | DEBUG    | __main__:trials:24 - Trial = 11116/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.934 | DEBUG    | __main__:trials:29 - Trial = 11116/30000 | Total reward = 42.21
2022-01-26 14:17:18.937 | DEBUG    | __main__:trials:24 - Trial = 11117/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.938 | DEBUG    | __main__:trials:29 - Trial = 11117/30000 | Total reward = 32.70
2022-01-26 14:17:18.941 | DEBUG    | __main__:trials:24 - Trial = 11118/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.941 | DEBUG    | __main__:trials:29 - Trial = 11118/30000 | Total reward = 39.25
2022-01-26 14:17:18.945 | DEBUG    | __main__:trials:24 - Trial = 11119/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.945 | DEBUG    | __main__:trials:29 - Trial = 11119/30000 | Total reward = 57.61
2022-01-26 14:17:18.950 | DEBUG    | __main__:trials:24 - Trial = 11120/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.950 | DEBUG    | __main__:trials:29 - Trial = 11120/30000 | Total reward = 42.77
2022-01-26 14:17:18.954 | DEBUG    | __main__:trials:24 - Trial = 11121/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.955 | DEBUG    | __main__:trials:29 - Trial = 11121/30000 | Total reward = 33.70
2022-01-26 14:17:18.958 | DEBUG    | __main__:trials:24 - Trial = 11122/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.959 | DEBUG    | __main__:trials:29 - Trial = 11122/30000 | Total reward = 41.35
2022-01-26 14:17:18.963 | DEBUG    | __main__:trials:26 - Trial = 11123/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.964 | DEBUG    | __main__:trials:29 - Trial = 11123/30000 | Total reward = 25.95
2022-01-26 14:17:18.966 | DEBUG    | __main__:trials:26 - Trial = 11124/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:18.967 | DEBUG    | __main__:trials:29 - Trial = 11124/30000 | Total reward = 6.44
2022-01-26 14:17:18.970 | DEBUG    | __main__:trials:24 - Trial = 11125/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.971 | DEBUG    | __main__:trials:29 - Trial = 11125/30000 | Total reward = 41.29
2022-01-26 14:17:18.974 | DEBUG    | __main__:trials:24 - Trial = 11126/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.975 | DEBUG    | __main__:trials:29 - Trial = 11126/30000 | Total reward = 23.19
2022-01-26 14:17:18.978 | DEBUG    | __main__:trials:24 - Trial = 11127/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.980 | DEBUG    | __main__:trials:29 - Trial = 11127/30000 | Total reward = 45.61
2022-01-26 14:17:18.984 | DEBUG    | __main__:trials:24 - Trial = 11128/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.986 | DEBUG    | __main__:trials:29 - Trial = 11128/30000 | Total reward = 17.96
2022-01-26 14:17:18.989 | DEBUG    | __main__:trials:24 - Trial = 11129/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.991 | DEBUG    | __main__:trials:29 - Trial = 11129/30000 | Total reward = 39.21
2022-01-26 14:17:18.995 | DEBUG    | __main__:trials:24 - Trial = 11130/30000 | Max number of steps (20) reached
2022-01-26 14:17:18.996 | DEBUG    | __main__:trials:29 - Trial = 11130/30000 | Total reward = 39.29
2022-01-26 14:17:19.000 | DEBUG    | __main__:trials:24 - Trial = 11131/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.001 | DEBUG    | __main__:trials:29 - Trial = 11131/30000 | Total reward = 36.48
2022-01-26 14:17:19.005 | DEBUG    | __main__:trials:24 - Trial = 11132/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.007 | DEBUG    | __main__:trials:29 - Trial = 11132/30000 | Total reward = 36.27
2022-01-26 14:17:19.010 | DEBUG    | __main__:trials:24 - Trial = 11133/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.012 | DEBUG    | __main__:trials:29 - Trial = 11133/30000 | Total reward = 34.30
2022-01-26 14:17:19.016 | DEBUG    | __main__:trials:24 - Trial = 11134/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.017 | DEBUG    | __main__:trials:29 - Trial = 11134/30000 | Total reward = 41.23
2022-01-26 14:17:19.021 | DEBUG    | __main__:trials:24 - Trial = 11135/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.023 | DEBUG    | __main__:trials:29 - Trial = 11135/30000 | Total reward = 27.66
2022-01-26 14:17:19.026 | DEBUG    | __main__:trials:24 - Trial = 11136/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.028 | DEBUG    | __main__:trials:29 - Trial = 11136/30000 | Total reward = 45.23
2022-01-26 14:17:19.029 | DEBUG    | __main__:trials:26 - Trial = 11137/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.030 | DEBUG    | __main__:trials:29 - Trial = 11137/30000 | Total reward = 7.84
2022-01-26 14:17:19.033 | DEBUG    | __main__:trials:24 - Trial = 11138/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.035 | DEBUG    | __main__:trials:29 - Trial = 11138/30000 | Total reward = 29.63
2022-01-26 14:17:19.038 | DEBUG    | __main__:trials:24 - Trial = 11139/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.040 | DEBUG    | __main__:trials:29 - Trial = 11139/30000 | Total reward = 43.10
2022-01-26 14:17:19.044 | DEBUG    | __main__:trials:24 - Trial = 11140/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.045 | DEBUG    | __main__:trials:29 - Trial = 11140/30000 | Total reward = 26.84
2022-01-26 14:17:19.048 | DEBUG    | __main__:trials:24 - Trial = 11141/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.050 | DEBUG    | __main__:trials:29 - Trial = 11141/30000 | Total reward = 27.86
2022-01-26 14:17:19.053 | DEBUG    | __main__:trials:26 - Trial = 11142/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.053 | DEBUG    | __main__:trials:29 - Trial = 11142/30000 | Total reward = 12.77
2022-01-26 14:17:19.058 | DEBUG    | __main__:trials:24 - Trial = 11143/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.059 | DEBUG    | __main__:trials:29 - Trial = 11143/30000 | Total reward = 31.82
2022-01-26 14:17:19.063 | DEBUG    | __main__:trials:24 - Trial = 11144/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.064 | DEBUG    | __main__:trials:29 - Trial = 11144/30000 | Total reward = 49.38
2022-01-26 14:17:19.068 | DEBUG    | __main__:trials:24 - Trial = 11145/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.070 | DEBUG    | __main__:trials:29 - Trial = 11145/30000 | Total reward = 26.40
2022-01-26 14:17:19.073 | DEBUG    | __main__:trials:24 - Trial = 11146/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.075 | DEBUG    | __main__:trials:29 - Trial = 11146/30000 | Total reward = 42.20
2022-01-26 14:17:19.079 | DEBUG    | __main__:trials:24 - Trial = 11147/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.080 | DEBUG    | __main__:trials:29 - Trial = 11147/30000 | Total reward = 28.67
2022-01-26 14:17:19.084 | DEBUG    | __main__:trials:24 - Trial = 11148/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.086 | DEBUG    | __main__:trials:29 - Trial = 11148/30000 | Total reward = 26.89
2022-01-26 14:17:19.089 | DEBUG    | __main__:trials:24 - Trial = 11149/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.091 | DEBUG    | __main__:trials:29 - Trial = 11149/30000 | Total reward = 41.59
2022-01-26 14:17:19.095 | DEBUG    | __main__:trials:24 - Trial = 11150/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.096 | DEBUG    | __main__:trials:29 - Trial = 11150/30000 | Total reward = 47.62
2022-01-26 14:17:19.100 | DEBUG    | __main__:trials:24 - Trial = 11151/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.102 | DEBUG    | __main__:trials:29 - Trial = 11151/30000 | Total reward = 49.12
2022-01-26 14:17:19.104 | DEBUG    | __main__:trials:26 - Trial = 11152/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.105 | DEBUG    | __main__:trials:29 - Trial = 11152/30000 | Total reward = 8.80
2022-01-26 14:17:19.109 | DEBUG    | __main__:trials:24 - Trial = 11153/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.110 | DEBUG    | __main__:trials:29 - Trial = 11153/30000 | Total reward = 28.91
2022-01-26 14:17:19.114 | DEBUG    | __main__:trials:24 - Trial = 11154/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.116 | DEBUG    | __main__:trials:29 - Trial = 11154/30000 | Total reward = 29.33
2022-01-26 14:17:19.119 | DEBUG    | __main__:trials:24 - Trial = 11155/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.121 | DEBUG    | __main__:trials:29 - Trial = 11155/30000 | Total reward = 45.98
2022-01-26 14:17:19.125 | DEBUG    | __main__:trials:24 - Trial = 11156/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.125 | DEBUG    | __main__:trials:29 - Trial = 11156/30000 | Total reward = 39.69
2022-01-26 14:17:19.130 | DEBUG    | __main__:trials:24 - Trial = 11157/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.131 | DEBUG    | __main__:trials:29 - Trial = 11157/30000 | Total reward = 48.83
2022-01-26 14:17:19.135 | DEBUG    | __main__:trials:26 - Trial = 11158/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.136 | DEBUG    | __main__:trials:29 - Trial = 11158/30000 | Total reward = 8.00
2022-01-26 14:17:19.140 | DEBUG    | __main__:trials:24 - Trial = 11159/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.142 | DEBUG    | __main__:trials:29 - Trial = 11159/30000 | Total reward = 31.15
2022-01-26 14:17:19.146 | DEBUG    | __main__:trials:24 - Trial = 11160/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.147 | DEBUG    | __main__:trials:29 - Trial = 11160/30000 | Total reward = 30.63
2022-01-26 14:17:19.151 | DEBUG    | __main__:trials:24 - Trial = 11161/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.151 | DEBUG    | __main__:trials:29 - Trial = 11161/30000 | Total reward = 38.68
2022-01-26 14:17:19.156 | DEBUG    | __main__:trials:24 - Trial = 11162/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.157 | DEBUG    | __main__:trials:29 - Trial = 11162/30000 | Total reward = 26.75
2022-01-26 14:17:19.161 | DEBUG    | __main__:trials:24 - Trial = 11163/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.163 | DEBUG    | __main__:trials:29 - Trial = 11163/30000 | Total reward = 29.48
2022-01-26 14:17:19.167 | DEBUG    | __main__:trials:24 - Trial = 11164/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.167 | DEBUG    | __main__:trials:29 - Trial = 11164/30000 | Total reward = 41.73
2022-01-26 14:17:19.171 | DEBUG    | __main__:trials:24 - Trial = 11165/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.172 | DEBUG    | __main__:trials:29 - Trial = 11165/30000 | Total reward = 30.93
2022-01-26 14:17:19.176 | DEBUG    | __main__:trials:24 - Trial = 11166/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.177 | DEBUG    | __main__:trials:29 - Trial = 11166/30000 | Total reward = 15.37
2022-01-26 14:17:19.180 | DEBUG    | __main__:trials:26 - Trial = 11167/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.181 | DEBUG    | __main__:trials:29 - Trial = 11167/30000 | Total reward = 18.08
2022-01-26 14:17:19.184 | DEBUG    | __main__:trials:24 - Trial = 11168/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.186 | DEBUG    | __main__:trials:29 - Trial = 11168/30000 | Total reward = 35.41
2022-01-26 14:17:19.190 | DEBUG    | __main__:trials:24 - Trial = 11169/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.192 | DEBUG    | __main__:trials:29 - Trial = 11169/30000 | Total reward = 56.05
2022-01-26 14:17:19.195 | DEBUG    | __main__:trials:24 - Trial = 11170/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.196 | DEBUG    | __main__:trials:29 - Trial = 11170/30000 | Total reward = 51.26
2022-01-26 14:17:19.199 | DEBUG    | __main__:trials:24 - Trial = 11171/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.201 | DEBUG    | __main__:trials:29 - Trial = 11171/30000 | Total reward = 32.61
2022-01-26 14:17:19.204 | DEBUG    | __main__:trials:24 - Trial = 11172/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.207 | DEBUG    | __main__:trials:29 - Trial = 11172/30000 | Total reward = 48.96
2022-01-26 14:17:19.210 | DEBUG    | __main__:trials:24 - Trial = 11173/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.210 | DEBUG    | __main__:trials:29 - Trial = 11173/30000 | Total reward = 26.31
2022-01-26 14:17:19.215 | DEBUG    | __main__:trials:24 - Trial = 11174/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.215 | DEBUG    | __main__:trials:29 - Trial = 11174/30000 | Total reward = 48.85
2022-01-26 14:17:19.219 | DEBUG    | __main__:trials:24 - Trial = 11175/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.220 | DEBUG    | __main__:trials:29 - Trial = 11175/30000 | Total reward = 29.44
2022-01-26 14:17:19.223 | DEBUG    | __main__:trials:24 - Trial = 11176/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.224 | DEBUG    | __main__:trials:29 - Trial = 11176/30000 | Total reward = 33.50
2022-01-26 14:17:19.228 | DEBUG    | __main__:trials:24 - Trial = 11177/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.229 | DEBUG    | __main__:trials:29 - Trial = 11177/30000 | Total reward = 29.18
2022-01-26 14:17:19.231 | DEBUG    | __main__:trials:26 - Trial = 11178/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.233 | DEBUG    | __main__:trials:29 - Trial = 11178/30000 | Total reward = 6.39
2022-01-26 14:17:19.236 | DEBUG    | __main__:trials:24 - Trial = 11179/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.238 | DEBUG    | __main__:trials:29 - Trial = 11179/30000 | Total reward = 54.77
2022-01-26 14:17:19.241 | DEBUG    | __main__:trials:24 - Trial = 11180/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.241 | DEBUG    | __main__:trials:29 - Trial = 11180/30000 | Total reward = 36.07
2022-01-26 14:17:19.243 | DEBUG    | __main__:trials:26 - Trial = 11181/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.245 | DEBUG    | __main__:trials:29 - Trial = 11181/30000 | Total reward = 8.84
2022-01-26 14:17:19.247 | DEBUG    | __main__:trials:26 - Trial = 11182/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.249 | DEBUG    | __main__:trials:29 - Trial = 11182/30000 | Total reward = 7.84
2022-01-26 14:17:19.252 | DEBUG    | __main__:trials:24 - Trial = 11183/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.253 | DEBUG    | __main__:trials:29 - Trial = 11183/30000 | Total reward = 36.99
2022-01-26 14:17:19.257 | DEBUG    | __main__:trials:24 - Trial = 11184/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.258 | DEBUG    | __main__:trials:29 - Trial = 11184/30000 | Total reward = 29.39
2022-01-26 14:17:19.261 | DEBUG    | __main__:trials:24 - Trial = 11185/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.263 | DEBUG    | __main__:trials:29 - Trial = 11185/30000 | Total reward = 41.40
2022-01-26 14:17:19.267 | DEBUG    | __main__:trials:24 - Trial = 11186/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.267 | DEBUG    | __main__:trials:29 - Trial = 11186/30000 | Total reward = 31.95
2022-01-26 14:17:19.271 | DEBUG    | __main__:trials:24 - Trial = 11187/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.273 | DEBUG    | __main__:trials:29 - Trial = 11187/30000 | Total reward = 59.97
2022-01-26 14:17:19.276 | DEBUG    | __main__:trials:24 - Trial = 11188/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.277 | DEBUG    | __main__:trials:29 - Trial = 11188/30000 | Total reward = 29.32
2022-01-26 14:17:19.281 | DEBUG    | __main__:trials:24 - Trial = 11189/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.282 | DEBUG    | __main__:trials:29 - Trial = 11189/30000 | Total reward = 35.41
2022-01-26 14:17:19.285 | DEBUG    | __main__:trials:24 - Trial = 11190/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.287 | DEBUG    | __main__:trials:29 - Trial = 11190/30000 | Total reward = 31.59
2022-01-26 14:17:19.290 | DEBUG    | __main__:trials:24 - Trial = 11191/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.290 | DEBUG    | __main__:trials:29 - Trial = 11191/30000 | Total reward = 18.31
2022-01-26 14:17:19.294 | DEBUG    | __main__:trials:24 - Trial = 11192/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.295 | DEBUG    | __main__:trials:29 - Trial = 11192/30000 | Total reward = 45.71
2022-01-26 14:17:19.298 | DEBUG    | __main__:trials:24 - Trial = 11193/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.300 | DEBUG    | __main__:trials:29 - Trial = 11193/30000 | Total reward = 39.59
2022-01-26 14:17:19.303 | DEBUG    | __main__:trials:24 - Trial = 11194/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.304 | DEBUG    | __main__:trials:29 - Trial = 11194/30000 | Total reward = 13.63
2022-01-26 14:17:19.308 | DEBUG    | __main__:trials:24 - Trial = 11195/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.310 | DEBUG    | __main__:trials:29 - Trial = 11195/30000 | Total reward = 32.93
2022-01-26 14:17:19.313 | DEBUG    | __main__:trials:24 - Trial = 11196/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.314 | DEBUG    | __main__:trials:29 - Trial = 11196/30000 | Total reward = 59.22
2022-01-26 14:17:19.317 | DEBUG    | __main__:trials:24 - Trial = 11197/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.319 | DEBUG    | __main__:trials:29 - Trial = 11197/30000 | Total reward = 30.07
2022-01-26 14:17:19.322 | DEBUG    | __main__:trials:24 - Trial = 11198/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.323 | DEBUG    | __main__:trials:29 - Trial = 11198/30000 | Total reward = 33.57
2022-01-26 14:17:19.325 | DEBUG    | __main__:trials:26 - Trial = 11199/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.327 | DEBUG    | __main__:trials:29 - Trial = 11199/30000 | Total reward = 7.44
2022-01-26 14:17:19.331 | DEBUG    | __main__:trials:24 - Trial = 11200/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.332 | DEBUG    | __main__:trials:29 - Trial = 11200/30000 | Total reward = 31.22
2022-01-26 14:17:19.335 | DEBUG    | __main__:trials:24 - Trial = 11201/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.337 | DEBUG    | __main__:trials:29 - Trial = 11201/30000 | Total reward = 33.99
2022-01-26 14:17:19.340 | DEBUG    | __main__:trials:24 - Trial = 11202/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.342 | DEBUG    | __main__:trials:29 - Trial = 11202/30000 | Total reward = 43.84
2022-01-26 14:17:19.345 | DEBUG    | __main__:trials:24 - Trial = 11203/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.345 | DEBUG    | __main__:trials:29 - Trial = 11203/30000 | Total reward = 29.82
2022-01-26 14:17:19.350 | DEBUG    | __main__:trials:24 - Trial = 11204/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.351 | DEBUG    | __main__:trials:29 - Trial = 11204/30000 | Total reward = 25.87
2022-01-26 14:17:19.353 | DEBUG    | __main__:trials:26 - Trial = 11205/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.355 | DEBUG    | __main__:trials:29 - Trial = 11205/30000 | Total reward = 10.08
2022-01-26 14:17:19.358 | DEBUG    | __main__:trials:24 - Trial = 11206/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.360 | DEBUG    | __main__:trials:29 - Trial = 11206/30000 | Total reward = 36.47
2022-01-26 14:17:19.363 | DEBUG    | __main__:trials:24 - Trial = 11207/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.365 | DEBUG    | __main__:trials:29 - Trial = 11207/30000 | Total reward = 27.05
2022-01-26 14:17:19.368 | DEBUG    | __main__:trials:24 - Trial = 11208/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.368 | DEBUG    | __main__:trials:29 - Trial = 11208/30000 | Total reward = 29.18
2022-01-26 14:17:19.371 | DEBUG    | __main__:trials:26 - Trial = 11209/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.373 | DEBUG    | __main__:trials:29 - Trial = 11209/30000 | Total reward = 18.61
2022-01-26 14:17:19.377 | DEBUG    | __main__:trials:24 - Trial = 11210/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.378 | DEBUG    | __main__:trials:29 - Trial = 11210/30000 | Total reward = 25.66
2022-01-26 14:17:19.382 | DEBUG    | __main__:trials:24 - Trial = 11211/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.384 | DEBUG    | __main__:trials:29 - Trial = 11211/30000 | Total reward = 29.71
2022-01-26 14:17:19.387 | DEBUG    | __main__:trials:26 - Trial = 11212/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.388 | DEBUG    | __main__:trials:29 - Trial = 11212/30000 | Total reward = 18.75
2022-01-26 14:17:19.392 | DEBUG    | __main__:trials:24 - Trial = 11213/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.393 | DEBUG    | __main__:trials:29 - Trial = 11213/30000 | Total reward = 28.82
2022-01-26 14:17:19.397 | DEBUG    | __main__:trials:24 - Trial = 11214/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.399 | DEBUG    | __main__:trials:29 - Trial = 11214/30000 | Total reward = 28.41
2022-01-26 14:17:19.402 | DEBUG    | __main__:trials:24 - Trial = 11215/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.404 | DEBUG    | __main__:trials:29 - Trial = 11215/30000 | Total reward = 26.97
2022-01-26 14:17:19.407 | DEBUG    | __main__:trials:24 - Trial = 11216/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.408 | DEBUG    | __main__:trials:29 - Trial = 11216/30000 | Total reward = 32.34
2022-01-26 14:17:19.412 | DEBUG    | __main__:trials:24 - Trial = 11217/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.414 | DEBUG    | __main__:trials:29 - Trial = 11217/30000 | Total reward = 27.35
2022-01-26 14:17:19.417 | DEBUG    | __main__:trials:24 - Trial = 11218/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.419 | DEBUG    | __main__:trials:29 - Trial = 11218/30000 | Total reward = 22.27
2022-01-26 14:17:19.423 | DEBUG    | __main__:trials:24 - Trial = 11219/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.424 | DEBUG    | __main__:trials:29 - Trial = 11219/30000 | Total reward = 45.26
2022-01-26 14:17:19.428 | DEBUG    | __main__:trials:24 - Trial = 11220/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.430 | DEBUG    | __main__:trials:29 - Trial = 11220/30000 | Total reward = 28.87
2022-01-26 14:17:19.434 | DEBUG    | __main__:trials:24 - Trial = 11221/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.435 | DEBUG    | __main__:trials:29 - Trial = 11221/30000 | Total reward = 52.09
2022-01-26 14:17:19.438 | DEBUG    | __main__:trials:26 - Trial = 11222/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.439 | DEBUG    | __main__:trials:29 - Trial = 11222/30000 | Total reward = 10.09
2022-01-26 14:17:19.443 | DEBUG    | __main__:trials:24 - Trial = 11223/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.444 | DEBUG    | __main__:trials:29 - Trial = 11223/30000 | Total reward = 31.09
2022-01-26 14:17:19.448 | DEBUG    | __main__:trials:24 - Trial = 11224/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.450 | DEBUG    | __main__:trials:29 - Trial = 11224/30000 | Total reward = 40.03
2022-01-26 14:17:19.453 | DEBUG    | __main__:trials:24 - Trial = 11225/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.455 | DEBUG    | __main__:trials:29 - Trial = 11225/30000 | Total reward = 60.42
2022-01-26 14:17:19.459 | DEBUG    | __main__:trials:24 - Trial = 11226/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.460 | DEBUG    | __main__:trials:29 - Trial = 11226/30000 | Total reward = 18.00
2022-01-26 14:17:19.463 | DEBUG    | __main__:trials:24 - Trial = 11227/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.465 | DEBUG    | __main__:trials:29 - Trial = 11227/30000 | Total reward = 28.84
2022-01-26 14:17:19.468 | DEBUG    | __main__:trials:24 - Trial = 11228/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.470 | DEBUG    | __main__:trials:29 - Trial = 11228/30000 | Total reward = 36.03
2022-01-26 14:17:19.474 | DEBUG    | __main__:trials:24 - Trial = 11229/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.476 | DEBUG    | __main__:trials:29 - Trial = 11229/30000 | Total reward = 37.30
2022-01-26 14:17:19.478 | DEBUG    | __main__:trials:24 - Trial = 11230/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.480 | DEBUG    | __main__:trials:29 - Trial = 11230/30000 | Total reward = 33.66
2022-01-26 14:17:19.483 | DEBUG    | __main__:trials:24 - Trial = 11231/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.485 | DEBUG    | __main__:trials:29 - Trial = 11231/30000 | Total reward = 33.33
2022-01-26 14:17:19.489 | DEBUG    | __main__:trials:24 - Trial = 11232/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.491 | DEBUG    | __main__:trials:29 - Trial = 11232/30000 | Total reward = 34.44
2022-01-26 14:17:19.494 | DEBUG    | __main__:trials:24 - Trial = 11233/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.496 | DEBUG    | __main__:trials:29 - Trial = 11233/30000 | Total reward = 61.88
2022-01-26 14:17:19.500 | DEBUG    | __main__:trials:24 - Trial = 11234/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.501 | DEBUG    | __main__:trials:29 - Trial = 11234/30000 | Total reward = 23.90
2022-01-26 14:17:19.505 | DEBUG    | __main__:trials:24 - Trial = 11235/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.506 | DEBUG    | __main__:trials:29 - Trial = 11235/30000 | Total reward = 29.28
2022-01-26 14:17:19.508 | DEBUG    | __main__:trials:26 - Trial = 11236/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.509 | DEBUG    | __main__:trials:29 - Trial = 11236/30000 | Total reward = 13.38
2022-01-26 14:17:19.512 | DEBUG    | __main__:trials:24 - Trial = 11237/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.514 | DEBUG    | __main__:trials:29 - Trial = 11237/30000 | Total reward = 37.35
2022-01-26 14:17:19.518 | DEBUG    | __main__:trials:24 - Trial = 11238/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.520 | DEBUG    | __main__:trials:29 - Trial = 11238/30000 | Total reward = 38.18
2022-01-26 14:17:19.523 | DEBUG    | __main__:trials:24 - Trial = 11239/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.525 | DEBUG    | __main__:trials:29 - Trial = 11239/30000 | Total reward = 28.19
2022-01-26 14:17:19.529 | DEBUG    | __main__:trials:24 - Trial = 11240/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.529 | DEBUG    | __main__:trials:29 - Trial = 11240/30000 | Total reward = 31.12
2022-01-26 14:17:19.534 | DEBUG    | __main__:trials:24 - Trial = 11241/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.535 | DEBUG    | __main__:trials:29 - Trial = 11241/30000 | Total reward = 29.28
2022-01-26 14:17:19.539 | DEBUG    | __main__:trials:24 - Trial = 11242/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.541 | DEBUG    | __main__:trials:29 - Trial = 11242/30000 | Total reward = 29.26
2022-01-26 14:17:19.545 | DEBUG    | __main__:trials:24 - Trial = 11243/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.546 | DEBUG    | __main__:trials:29 - Trial = 11243/30000 | Total reward = 49.23
2022-01-26 14:17:19.550 | DEBUG    | __main__:trials:24 - Trial = 11244/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.551 | DEBUG    | __main__:trials:29 - Trial = 11244/30000 | Total reward = 29.21
2022-01-26 14:17:19.554 | DEBUG    | __main__:trials:24 - Trial = 11245/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.556 | DEBUG    | __main__:trials:29 - Trial = 11245/30000 | Total reward = 33.60
2022-01-26 14:17:19.560 | DEBUG    | __main__:trials:24 - Trial = 11246/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.561 | DEBUG    | __main__:trials:29 - Trial = 11246/30000 | Total reward = 33.94
2022-01-26 14:17:19.565 | DEBUG    | __main__:trials:24 - Trial = 11247/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.566 | DEBUG    | __main__:trials:29 - Trial = 11247/30000 | Total reward = 34.72
2022-01-26 14:17:19.569 | DEBUG    | __main__:trials:24 - Trial = 11248/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.571 | DEBUG    | __main__:trials:29 - Trial = 11248/30000 | Total reward = 62.28
2022-01-26 14:17:19.575 | DEBUG    | __main__:trials:24 - Trial = 11249/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.577 | DEBUG    | __main__:trials:29 - Trial = 11249/30000 | Total reward = 33.75
2022-01-26 14:17:19.581 | DEBUG    | __main__:trials:24 - Trial = 11250/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.581 | DEBUG    | __main__:trials:29 - Trial = 11250/30000 | Total reward = 25.79
2022-01-26 14:17:19.586 | DEBUG    | __main__:trials:24 - Trial = 11251/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.587 | DEBUG    | __main__:trials:29 - Trial = 11251/30000 | Total reward = 29.26
2022-01-26 14:17:19.591 | DEBUG    | __main__:trials:24 - Trial = 11252/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.593 | DEBUG    | __main__:trials:29 - Trial = 11252/30000 | Total reward = 29.51
2022-01-26 14:17:19.596 | DEBUG    | __main__:trials:26 - Trial = 11253/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.597 | DEBUG    | __main__:trials:29 - Trial = 11253/30000 | Total reward = 16.79
2022-01-26 14:17:19.600 | DEBUG    | __main__:trials:24 - Trial = 11254/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.602 | DEBUG    | __main__:trials:29 - Trial = 11254/30000 | Total reward = 29.26
2022-01-26 14:17:19.605 | DEBUG    | __main__:trials:24 - Trial = 11255/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.606 | DEBUG    | __main__:trials:29 - Trial = 11255/30000 | Total reward = 38.42
2022-01-26 14:17:19.610 | DEBUG    | __main__:trials:24 - Trial = 11256/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.611 | DEBUG    | __main__:trials:29 - Trial = 11256/30000 | Total reward = 33.08
2022-01-26 14:17:19.614 | DEBUG    | __main__:trials:24 - Trial = 11257/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.615 | DEBUG    | __main__:trials:29 - Trial = 11257/30000 | Total reward = 29.02
2022-01-26 14:17:19.620 | DEBUG    | __main__:trials:24 - Trial = 11258/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.621 | DEBUG    | __main__:trials:29 - Trial = 11258/30000 | Total reward = 29.84
2022-01-26 14:17:19.625 | DEBUG    | __main__:trials:24 - Trial = 11259/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.627 | DEBUG    | __main__:trials:29 - Trial = 11259/30000 | Total reward = 37.24
2022-01-26 14:17:19.631 | DEBUG    | __main__:trials:24 - Trial = 11260/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.633 | DEBUG    | __main__:trials:29 - Trial = 11260/30000 | Total reward = 34.32
2022-01-26 14:17:19.636 | DEBUG    | __main__:trials:26 - Trial = 11261/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.637 | DEBUG    | __main__:trials:29 - Trial = 11261/30000 | Total reward = 15.29
2022-01-26 14:17:19.641 | DEBUG    | __main__:trials:24 - Trial = 11262/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.641 | DEBUG    | __main__:trials:29 - Trial = 11262/30000 | Total reward = 30.23
2022-01-26 14:17:19.645 | DEBUG    | __main__:trials:24 - Trial = 11263/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.647 | DEBUG    | __main__:trials:29 - Trial = 11263/30000 | Total reward = 42.10
2022-01-26 14:17:19.650 | DEBUG    | __main__:trials:26 - Trial = 11264/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.651 | DEBUG    | __main__:trials:29 - Trial = 11264/30000 | Total reward = 11.44
2022-01-26 14:17:19.654 | DEBUG    | __main__:trials:24 - Trial = 11265/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.656 | DEBUG    | __main__:trials:29 - Trial = 11265/30000 | Total reward = 32.81
2022-01-26 14:17:19.660 | DEBUG    | __main__:trials:24 - Trial = 11266/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.662 | DEBUG    | __main__:trials:29 - Trial = 11266/30000 | Total reward = 40.39
2022-01-26 14:17:19.665 | DEBUG    | __main__:trials:26 - Trial = 11267/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.667 | DEBUG    | __main__:trials:29 - Trial = 11267/30000 | Total reward = 19.62
2022-01-26 14:17:19.671 | DEBUG    | __main__:trials:24 - Trial = 11268/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.672 | DEBUG    | __main__:trials:29 - Trial = 11268/30000 | Total reward = 39.17
2022-01-26 14:17:19.676 | DEBUG    | __main__:trials:24 - Trial = 11269/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.678 | DEBUG    | __main__:trials:29 - Trial = 11269/30000 | Total reward = 41.78
2022-01-26 14:17:19.682 | DEBUG    | __main__:trials:24 - Trial = 11270/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.682 | DEBUG    | __main__:trials:29 - Trial = 11270/30000 | Total reward = 41.43
2022-01-26 14:17:19.686 | DEBUG    | __main__:trials:24 - Trial = 11271/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.688 | DEBUG    | __main__:trials:29 - Trial = 11271/30000 | Total reward = 32.08
2022-01-26 14:17:19.692 | DEBUG    | __main__:trials:24 - Trial = 11272/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.692 | DEBUG    | __main__:trials:29 - Trial = 11272/30000 | Total reward = 40.11
2022-01-26 14:17:19.697 | DEBUG    | __main__:trials:24 - Trial = 11273/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.698 | DEBUG    | __main__:trials:29 - Trial = 11273/30000 | Total reward = 59.14
2022-01-26 14:17:19.701 | DEBUG    | __main__:trials:24 - Trial = 11274/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.702 | DEBUG    | __main__:trials:29 - Trial = 11274/30000 | Total reward = 29.50
2022-01-26 14:17:19.705 | DEBUG    | __main__:trials:24 - Trial = 11275/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.706 | DEBUG    | __main__:trials:29 - Trial = 11275/30000 | Total reward = 27.18
2022-01-26 14:17:19.709 | DEBUG    | __main__:trials:24 - Trial = 11276/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.711 | DEBUG    | __main__:trials:29 - Trial = 11276/30000 | Total reward = 34.68
2022-01-26 14:17:19.714 | DEBUG    | __main__:trials:24 - Trial = 11277/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.716 | DEBUG    | __main__:trials:29 - Trial = 11277/30000 | Total reward = 38.60
2022-01-26 14:17:19.719 | DEBUG    | __main__:trials:24 - Trial = 11278/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.720 | DEBUG    | __main__:trials:29 - Trial = 11278/30000 | Total reward = 37.19
2022-01-26 14:17:19.723 | DEBUG    | __main__:trials:24 - Trial = 11279/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.725 | DEBUG    | __main__:trials:29 - Trial = 11279/30000 | Total reward = 21.95
2022-01-26 14:17:19.729 | DEBUG    | __main__:trials:24 - Trial = 11280/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.731 | DEBUG    | __main__:trials:29 - Trial = 11280/30000 | Total reward = 59.37
2022-01-26 14:17:19.733 | DEBUG    | __main__:trials:24 - Trial = 11281/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.734 | DEBUG    | __main__:trials:29 - Trial = 11281/30000 | Total reward = 53.85
2022-01-26 14:17:19.737 | DEBUG    | __main__:trials:24 - Trial = 11282/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.739 | DEBUG    | __main__:trials:29 - Trial = 11282/30000 | Total reward = 42.03
2022-01-26 14:17:19.743 | DEBUG    | __main__:trials:24 - Trial = 11283/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.744 | DEBUG    | __main__:trials:29 - Trial = 11283/30000 | Total reward = 26.30
2022-01-26 14:17:19.748 | DEBUG    | __main__:trials:24 - Trial = 11284/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.750 | DEBUG    | __main__:trials:29 - Trial = 11284/30000 | Total reward = 65.51
2022-01-26 14:17:19.754 | DEBUG    | __main__:trials:24 - Trial = 11285/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.755 | DEBUG    | __main__:trials:29 - Trial = 11285/30000 | Total reward = 40.87
2022-01-26 14:17:19.759 | DEBUG    | __main__:trials:24 - Trial = 11286/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.760 | DEBUG    | __main__:trials:29 - Trial = 11286/30000 | Total reward = 37.71
2022-01-26 14:17:19.764 | DEBUG    | __main__:trials:24 - Trial = 11287/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.764 | DEBUG    | __main__:trials:29 - Trial = 11287/30000 | Total reward = 36.18
2022-01-26 14:17:19.768 | DEBUG    | __main__:trials:24 - Trial = 11288/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.770 | DEBUG    | __main__:trials:29 - Trial = 11288/30000 | Total reward = 33.04
2022-01-26 14:17:19.774 | DEBUG    | __main__:trials:24 - Trial = 11289/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.775 | DEBUG    | __main__:trials:29 - Trial = 11289/30000 | Total reward = 39.53
2022-01-26 14:17:19.779 | DEBUG    | __main__:trials:24 - Trial = 11290/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.780 | DEBUG    | __main__:trials:29 - Trial = 11290/30000 | Total reward = 36.54
2022-01-26 14:17:19.784 | DEBUG    | __main__:trials:24 - Trial = 11291/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.785 | DEBUG    | __main__:trials:29 - Trial = 11291/30000 | Total reward = 34.04
2022-01-26 14:17:19.789 | DEBUG    | __main__:trials:24 - Trial = 11292/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.790 | DEBUG    | __main__:trials:29 - Trial = 11292/30000 | Total reward = 33.80
2022-01-26 14:17:19.793 | DEBUG    | __main__:trials:24 - Trial = 11293/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.794 | DEBUG    | __main__:trials:29 - Trial = 11293/30000 | Total reward = 38.19
2022-01-26 14:17:19.797 | DEBUG    | __main__:trials:24 - Trial = 11294/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.799 | DEBUG    | __main__:trials:29 - Trial = 11294/30000 | Total reward = 36.35
2022-01-26 14:17:19.802 | DEBUG    | __main__:trials:24 - Trial = 11295/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.804 | DEBUG    | __main__:trials:29 - Trial = 11295/30000 | Total reward = 32.75
2022-01-26 14:17:19.807 | DEBUG    | __main__:trials:26 - Trial = 11296/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.808 | DEBUG    | __main__:trials:29 - Trial = 11296/30000 | Total reward = 11.92
2022-01-26 14:17:19.812 | DEBUG    | __main__:trials:24 - Trial = 11297/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.812 | DEBUG    | __main__:trials:29 - Trial = 11297/30000 | Total reward = 36.97
2022-01-26 14:17:19.816 | DEBUG    | __main__:trials:24 - Trial = 11298/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.817 | DEBUG    | __main__:trials:29 - Trial = 11298/30000 | Total reward = 37.70
2022-01-26 14:17:19.821 | DEBUG    | __main__:trials:24 - Trial = 11299/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.823 | DEBUG    | __main__:trials:29 - Trial = 11299/30000 | Total reward = 42.16
2022-01-26 14:17:19.827 | DEBUG    | __main__:trials:24 - Trial = 11300/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.828 | DEBUG    | __main__:trials:29 - Trial = 11300/30000 | Total reward = 25.88
2022-01-26 14:17:19.832 | DEBUG    | __main__:trials:24 - Trial = 11301/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.834 | DEBUG    | __main__:trials:29 - Trial = 11301/30000 | Total reward = 47.37
2022-01-26 14:17:19.837 | DEBUG    | __main__:trials:24 - Trial = 11302/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.838 | DEBUG    | __main__:trials:29 - Trial = 11302/30000 | Total reward = 43.32
2022-01-26 14:17:19.842 | DEBUG    | __main__:trials:26 - Trial = 11303/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.844 | DEBUG    | __main__:trials:29 - Trial = 11303/30000 | Total reward = 14.25
2022-01-26 14:17:19.847 | DEBUG    | __main__:trials:24 - Trial = 11304/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.848 | DEBUG    | __main__:trials:29 - Trial = 11304/30000 | Total reward = 32.15
2022-01-26 14:17:19.852 | DEBUG    | __main__:trials:24 - Trial = 11305/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.853 | DEBUG    | __main__:trials:29 - Trial = 11305/30000 | Total reward = 31.94
2022-01-26 14:17:19.858 | DEBUG    | __main__:trials:24 - Trial = 11306/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.858 | DEBUG    | __main__:trials:29 - Trial = 11306/30000 | Total reward = 30.02
2022-01-26 14:17:19.862 | DEBUG    | __main__:trials:24 - Trial = 11307/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.864 | DEBUG    | __main__:trials:29 - Trial = 11307/30000 | Total reward = 28.73
2022-01-26 14:17:19.868 | DEBUG    | __main__:trials:26 - Trial = 11308/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.868 | DEBUG    | __main__:trials:29 - Trial = 11308/30000 | Total reward = 25.87
2022-01-26 14:17:19.872 | DEBUG    | __main__:trials:24 - Trial = 11309/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.874 | DEBUG    | __main__:trials:29 - Trial = 11309/30000 | Total reward = 29.26
2022-01-26 14:17:19.877 | DEBUG    | __main__:trials:24 - Trial = 11310/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.879 | DEBUG    | __main__:trials:29 - Trial = 11310/30000 | Total reward = 38.83
2022-01-26 14:17:19.883 | DEBUG    | __main__:trials:24 - Trial = 11311/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.884 | DEBUG    | __main__:trials:29 - Trial = 11311/30000 | Total reward = 38.72
2022-01-26 14:17:19.887 | DEBUG    | __main__:trials:26 - Trial = 11312/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.888 | DEBUG    | __main__:trials:29 - Trial = 11312/30000 | Total reward = 19.74
2022-01-26 14:17:19.892 | DEBUG    | __main__:trials:24 - Trial = 11313/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.893 | DEBUG    | __main__:trials:29 - Trial = 11313/30000 | Total reward = 29.26
2022-01-26 14:17:19.898 | DEBUG    | __main__:trials:24 - Trial = 11314/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.899 | DEBUG    | __main__:trials:29 - Trial = 11314/30000 | Total reward = 38.72
2022-01-26 14:17:19.903 | DEBUG    | __main__:trials:24 - Trial = 11315/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.904 | DEBUG    | __main__:trials:29 - Trial = 11315/30000 | Total reward = 26.23
2022-01-26 14:17:19.907 | DEBUG    | __main__:trials:26 - Trial = 11316/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.909 | DEBUG    | __main__:trials:29 - Trial = 11316/30000 | Total reward = 15.92
2022-01-26 14:17:19.912 | DEBUG    | __main__:trials:24 - Trial = 11317/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.914 | DEBUG    | __main__:trials:29 - Trial = 11317/30000 | Total reward = 41.97
2022-01-26 14:17:19.918 | DEBUG    | __main__:trials:24 - Trial = 11318/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.919 | DEBUG    | __main__:trials:29 - Trial = 11318/30000 | Total reward = 28.05
2022-01-26 14:17:19.923 | DEBUG    | __main__:trials:24 - Trial = 11319/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.924 | DEBUG    | __main__:trials:29 - Trial = 11319/30000 | Total reward = 29.26
2022-01-26 14:17:19.928 | DEBUG    | __main__:trials:24 - Trial = 11320/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.929 | DEBUG    | __main__:trials:29 - Trial = 11320/30000 | Total reward = 29.02
2022-01-26 14:17:19.933 | DEBUG    | __main__:trials:24 - Trial = 11321/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.935 | DEBUG    | __main__:trials:29 - Trial = 11321/30000 | Total reward = 50.08
2022-01-26 14:17:19.938 | DEBUG    | __main__:trials:24 - Trial = 11322/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.940 | DEBUG    | __main__:trials:29 - Trial = 11322/30000 | Total reward = 37.89
2022-01-26 14:17:19.942 | DEBUG    | __main__:trials:26 - Trial = 11323/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.943 | DEBUG    | __main__:trials:29 - Trial = 11323/30000 | Total reward = 14.66
2022-01-26 14:17:19.947 | DEBUG    | __main__:trials:26 - Trial = 11324/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:19.948 | DEBUG    | __main__:trials:29 - Trial = 11324/30000 | Total reward = 9.29
2022-01-26 14:17:19.952 | DEBUG    | __main__:trials:24 - Trial = 11325/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.953 | DEBUG    | __main__:trials:29 - Trial = 11325/30000 | Total reward = 29.57
2022-01-26 14:17:19.957 | DEBUG    | __main__:trials:24 - Trial = 11326/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.957 | DEBUG    | __main__:trials:29 - Trial = 11326/30000 | Total reward = 52.45
2022-01-26 14:17:19.961 | DEBUG    | __main__:trials:24 - Trial = 11327/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.962 | DEBUG    | __main__:trials:29 - Trial = 11327/30000 | Total reward = 25.11
2022-01-26 14:17:19.966 | DEBUG    | __main__:trials:24 - Trial = 11328/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.966 | DEBUG    | __main__:trials:29 - Trial = 11328/30000 | Total reward = 29.10
2022-01-26 14:17:19.970 | DEBUG    | __main__:trials:24 - Trial = 11329/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.972 | DEBUG    | __main__:trials:29 - Trial = 11329/30000 | Total reward = 59.19
2022-01-26 14:17:19.976 | DEBUG    | __main__:trials:24 - Trial = 11330/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.977 | DEBUG    | __main__:trials:29 - Trial = 11330/30000 | Total reward = 31.50
2022-01-26 14:17:19.981 | DEBUG    | __main__:trials:24 - Trial = 11331/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.982 | DEBUG    | __main__:trials:29 - Trial = 11331/30000 | Total reward = 43.85
2022-01-26 14:17:19.987 | DEBUG    | __main__:trials:24 - Trial = 11332/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.989 | DEBUG    | __main__:trials:29 - Trial = 11332/30000 | Total reward = 30.23
2022-01-26 14:17:19.992 | DEBUG    | __main__:trials:24 - Trial = 11333/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.994 | DEBUG    | __main__:trials:29 - Trial = 11333/30000 | Total reward = 29.08
2022-01-26 14:17:19.998 | DEBUG    | __main__:trials:24 - Trial = 11334/30000 | Max number of steps (20) reached
2022-01-26 14:17:19.999 | DEBUG    | __main__:trials:29 - Trial = 11334/30000 | Total reward = 43.69
2022-01-26 14:17:20.003 | DEBUG    | __main__:trials:24 - Trial = 11335/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.005 | DEBUG    | __main__:trials:29 - Trial = 11335/30000 | Total reward = 35.63
2022-01-26 14:17:20.008 | DEBUG    | __main__:trials:24 - Trial = 11336/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.010 | DEBUG    | __main__:trials:29 - Trial = 11336/30000 | Total reward = 28.99
2022-01-26 14:17:20.014 | DEBUG    | __main__:trials:24 - Trial = 11337/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.016 | DEBUG    | __main__:trials:29 - Trial = 11337/30000 | Total reward = 29.49
2022-01-26 14:17:20.020 | DEBUG    | __main__:trials:24 - Trial = 11338/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.021 | DEBUG    | __main__:trials:29 - Trial = 11338/30000 | Total reward = 44.68
2022-01-26 14:17:20.024 | DEBUG    | __main__:trials:24 - Trial = 11339/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.026 | DEBUG    | __main__:trials:29 - Trial = 11339/30000 | Total reward = 55.99
2022-01-26 14:17:20.030 | DEBUG    | __main__:trials:24 - Trial = 11340/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.030 | DEBUG    | __main__:trials:29 - Trial = 11340/30000 | Total reward = 29.58
2022-01-26 14:17:20.035 | DEBUG    | __main__:trials:24 - Trial = 11341/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.036 | DEBUG    | __main__:trials:29 - Trial = 11341/30000 | Total reward = 28.05
2022-01-26 14:17:20.040 | DEBUG    | __main__:trials:24 - Trial = 11342/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.042 | DEBUG    | __main__:trials:29 - Trial = 11342/30000 | Total reward = 39.29
2022-01-26 14:17:20.046 | DEBUG    | __main__:trials:24 - Trial = 11343/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.047 | DEBUG    | __main__:trials:29 - Trial = 11343/30000 | Total reward = 29.02
2022-01-26 14:17:20.050 | DEBUG    | __main__:trials:24 - Trial = 11344/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.052 | DEBUG    | __main__:trials:29 - Trial = 11344/30000 | Total reward = 25.15
2022-01-26 14:17:20.055 | DEBUG    | __main__:trials:24 - Trial = 11345/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.057 | DEBUG    | __main__:trials:29 - Trial = 11345/30000 | Total reward = 29.20
2022-01-26 14:17:20.060 | DEBUG    | __main__:trials:24 - Trial = 11346/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.061 | DEBUG    | __main__:trials:29 - Trial = 11346/30000 | Total reward = 41.04
2022-01-26 14:17:20.065 | DEBUG    | __main__:trials:24 - Trial = 11347/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.066 | DEBUG    | __main__:trials:29 - Trial = 11347/30000 | Total reward = 58.73
2022-01-26 14:17:20.070 | DEBUG    | __main__:trials:24 - Trial = 11348/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.071 | DEBUG    | __main__:trials:29 - Trial = 11348/30000 | Total reward = 37.42
2022-01-26 14:17:20.075 | DEBUG    | __main__:trials:24 - Trial = 11349/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.077 | DEBUG    | __main__:trials:29 - Trial = 11349/30000 | Total reward = 27.90
2022-01-26 14:17:20.082 | DEBUG    | __main__:trials:24 - Trial = 11350/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.084 | DEBUG    | __main__:trials:29 - Trial = 11350/30000 | Total reward = 28.54
2022-01-26 14:17:20.089 | DEBUG    | __main__:trials:24 - Trial = 11351/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.090 | DEBUG    | __main__:trials:29 - Trial = 11351/30000 | Total reward = 39.16
2022-01-26 14:17:20.095 | DEBUG    | __main__:trials:24 - Trial = 11352/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.097 | DEBUG    | __main__:trials:29 - Trial = 11352/30000 | Total reward = 29.05
2022-01-26 14:17:20.103 | DEBUG    | __main__:trials:24 - Trial = 11353/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.104 | DEBUG    | __main__:trials:29 - Trial = 11353/30000 | Total reward = 35.36
2022-01-26 14:17:20.109 | DEBUG    | __main__:trials:24 - Trial = 11354/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.110 | DEBUG    | __main__:trials:29 - Trial = 11354/30000 | Total reward = 29.30
2022-01-26 14:17:20.115 | DEBUG    | __main__:trials:24 - Trial = 11355/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.116 | DEBUG    | __main__:trials:29 - Trial = 11355/30000 | Total reward = 29.26
2022-01-26 14:17:20.121 | DEBUG    | __main__:trials:24 - Trial = 11356/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.123 | DEBUG    | __main__:trials:29 - Trial = 11356/30000 | Total reward = 30.85
2022-01-26 14:17:20.128 | DEBUG    | __main__:trials:24 - Trial = 11357/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.129 | DEBUG    | __main__:trials:29 - Trial = 11357/30000 | Total reward = 40.58
2022-01-26 14:17:20.134 | DEBUG    | __main__:trials:24 - Trial = 11358/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.134 | DEBUG    | __main__:trials:29 - Trial = 11358/30000 | Total reward = 29.16
2022-01-26 14:17:20.138 | DEBUG    | __main__:trials:26 - Trial = 11359/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.138 | DEBUG    | __main__:trials:29 - Trial = 11359/30000 | Total reward = 11.73
2022-01-26 14:17:20.143 | DEBUG    | __main__:trials:24 - Trial = 11360/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.144 | DEBUG    | __main__:trials:29 - Trial = 11360/30000 | Total reward = 43.61
2022-01-26 14:17:20.147 | DEBUG    | __main__:trials:24 - Trial = 11361/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.149 | DEBUG    | __main__:trials:29 - Trial = 11361/30000 | Total reward = 29.26
2022-01-26 14:17:20.152 | DEBUG    | __main__:trials:24 - Trial = 11362/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.154 | DEBUG    | __main__:trials:29 - Trial = 11362/30000 | Total reward = 29.34
2022-01-26 14:17:20.157 | DEBUG    | __main__:trials:24 - Trial = 11363/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.158 | DEBUG    | __main__:trials:29 - Trial = 11363/30000 | Total reward = 37.48
2022-01-26 14:17:20.161 | DEBUG    | __main__:trials:24 - Trial = 11364/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.164 | DEBUG    | __main__:trials:29 - Trial = 11364/30000 | Total reward = 23.94
2022-01-26 14:17:20.167 | DEBUG    | __main__:trials:24 - Trial = 11365/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.168 | DEBUG    | __main__:trials:29 - Trial = 11365/30000 | Total reward = 28.39
2022-01-26 14:17:20.172 | DEBUG    | __main__:trials:24 - Trial = 11366/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.174 | DEBUG    | __main__:trials:29 - Trial = 11366/30000 | Total reward = 29.22
2022-01-26 14:17:20.177 | DEBUG    | __main__:trials:24 - Trial = 11367/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.177 | DEBUG    | __main__:trials:29 - Trial = 11367/30000 | Total reward = 29.38
2022-01-26 14:17:20.181 | DEBUG    | __main__:trials:24 - Trial = 11368/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.183 | DEBUG    | __main__:trials:29 - Trial = 11368/30000 | Total reward = 29.38
2022-01-26 14:17:20.186 | DEBUG    | __main__:trials:24 - Trial = 11369/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.188 | DEBUG    | __main__:trials:29 - Trial = 11369/30000 | Total reward = 59.40
2022-01-26 14:17:20.192 | DEBUG    | __main__:trials:24 - Trial = 11370/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.192 | DEBUG    | __main__:trials:29 - Trial = 11370/30000 | Total reward = 29.08
2022-01-26 14:17:20.196 | DEBUG    | __main__:trials:24 - Trial = 11371/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.197 | DEBUG    | __main__:trials:29 - Trial = 11371/30000 | Total reward = 24.49
2022-01-26 14:17:20.200 | DEBUG    | __main__:trials:24 - Trial = 11372/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.201 | DEBUG    | __main__:trials:29 - Trial = 11372/30000 | Total reward = 39.49
2022-01-26 14:17:20.205 | DEBUG    | __main__:trials:24 - Trial = 11373/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.206 | DEBUG    | __main__:trials:29 - Trial = 11373/30000 | Total reward = 32.54
2022-01-26 14:17:20.210 | DEBUG    | __main__:trials:24 - Trial = 11374/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.211 | DEBUG    | __main__:trials:29 - Trial = 11374/30000 | Total reward = 35.67
2022-01-26 14:17:20.214 | DEBUG    | __main__:trials:24 - Trial = 11375/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.215 | DEBUG    | __main__:trials:29 - Trial = 11375/30000 | Total reward = 51.87
2022-01-26 14:17:20.218 | DEBUG    | __main__:trials:24 - Trial = 11376/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.220 | DEBUG    | __main__:trials:29 - Trial = 11376/30000 | Total reward = 39.70
2022-01-26 14:17:20.223 | DEBUG    | __main__:trials:24 - Trial = 11377/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.224 | DEBUG    | __main__:trials:29 - Trial = 11377/30000 | Total reward = 33.12
2022-01-26 14:17:20.227 | DEBUG    | __main__:trials:24 - Trial = 11378/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.229 | DEBUG    | __main__:trials:29 - Trial = 11378/30000 | Total reward = 42.86
2022-01-26 14:17:20.232 | DEBUG    | __main__:trials:24 - Trial = 11379/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.234 | DEBUG    | __main__:trials:29 - Trial = 11379/30000 | Total reward = 45.11
2022-01-26 14:17:20.237 | DEBUG    | __main__:trials:24 - Trial = 11380/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.238 | DEBUG    | __main__:trials:29 - Trial = 11380/30000 | Total reward = 40.25
2022-01-26 14:17:20.241 | DEBUG    | __main__:trials:24 - Trial = 11381/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.243 | DEBUG    | __main__:trials:29 - Trial = 11381/30000 | Total reward = 19.41
2022-01-26 14:17:20.246 | DEBUG    | __main__:trials:24 - Trial = 11382/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.247 | DEBUG    | __main__:trials:29 - Trial = 11382/30000 | Total reward = 34.66
2022-01-26 14:17:20.251 | DEBUG    | __main__:trials:24 - Trial = 11383/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.252 | DEBUG    | __main__:trials:29 - Trial = 11383/30000 | Total reward = 38.82
2022-01-26 14:17:20.255 | DEBUG    | __main__:trials:24 - Trial = 11384/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.256 | DEBUG    | __main__:trials:29 - Trial = 11384/30000 | Total reward = 39.00
2022-01-26 14:17:20.259 | DEBUG    | __main__:trials:24 - Trial = 11385/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.261 | DEBUG    | __main__:trials:29 - Trial = 11385/30000 | Total reward = 59.12
2022-01-26 14:17:20.264 | DEBUG    | __main__:trials:24 - Trial = 11386/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.265 | DEBUG    | __main__:trials:29 - Trial = 11386/30000 | Total reward = 15.34
2022-01-26 14:17:20.267 | DEBUG    | __main__:trials:26 - Trial = 11387/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.268 | DEBUG    | __main__:trials:29 - Trial = 11387/30000 | Total reward = 8.80
2022-01-26 14:17:20.271 | DEBUG    | __main__:trials:24 - Trial = 11388/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.273 | DEBUG    | __main__:trials:29 - Trial = 11388/30000 | Total reward = 41.75
2022-01-26 14:17:20.276 | DEBUG    | __main__:trials:24 - Trial = 11389/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.278 | DEBUG    | __main__:trials:29 - Trial = 11389/30000 | Total reward = 34.69
2022-01-26 14:17:20.281 | DEBUG    | __main__:trials:24 - Trial = 11390/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.282 | DEBUG    | __main__:trials:29 - Trial = 11390/30000 | Total reward = 42.45
2022-01-26 14:17:20.285 | DEBUG    | __main__:trials:24 - Trial = 11391/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.287 | DEBUG    | __main__:trials:29 - Trial = 11391/30000 | Total reward = 59.10
2022-01-26 14:17:20.289 | DEBUG    | __main__:trials:24 - Trial = 11392/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.291 | DEBUG    | __main__:trials:29 - Trial = 11392/30000 | Total reward = 36.83
2022-01-26 14:17:20.294 | DEBUG    | __main__:trials:24 - Trial = 11393/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.296 | DEBUG    | __main__:trials:29 - Trial = 11393/30000 | Total reward = 40.40
2022-01-26 14:17:20.299 | DEBUG    | __main__:trials:24 - Trial = 11394/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.301 | DEBUG    | __main__:trials:29 - Trial = 11394/30000 | Total reward = 54.38
2022-01-26 14:17:20.304 | DEBUG    | __main__:trials:24 - Trial = 11395/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.306 | DEBUG    | __main__:trials:29 - Trial = 11395/30000 | Total reward = 52.64
2022-01-26 14:17:20.309 | DEBUG    | __main__:trials:24 - Trial = 11396/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.310 | DEBUG    | __main__:trials:29 - Trial = 11396/30000 | Total reward = 38.04
2022-01-26 14:17:20.313 | DEBUG    | __main__:trials:24 - Trial = 11397/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.315 | DEBUG    | __main__:trials:29 - Trial = 11397/30000 | Total reward = 46.28
2022-01-26 14:17:20.318 | DEBUG    | __main__:trials:24 - Trial = 11398/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.320 | DEBUG    | __main__:trials:29 - Trial = 11398/30000 | Total reward = 34.68
2022-01-26 14:17:20.323 | DEBUG    | __main__:trials:24 - Trial = 11399/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.324 | DEBUG    | __main__:trials:29 - Trial = 11399/30000 | Total reward = 43.98
2022-01-26 14:17:20.328 | DEBUG    | __main__:trials:24 - Trial = 11400/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.329 | DEBUG    | __main__:trials:29 - Trial = 11400/30000 | Total reward = 34.88
2022-01-26 14:17:20.332 | DEBUG    | __main__:trials:24 - Trial = 11401/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.334 | DEBUG    | __main__:trials:29 - Trial = 11401/30000 | Total reward = 60.36
2022-01-26 14:17:20.338 | DEBUG    | __main__:trials:26 - Trial = 11402/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.339 | DEBUG    | __main__:trials:29 - Trial = 11402/30000 | Total reward = 27.78
2022-01-26 14:17:20.342 | DEBUG    | __main__:trials:24 - Trial = 11403/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.343 | DEBUG    | __main__:trials:29 - Trial = 11403/30000 | Total reward = 46.70
2022-01-26 14:17:20.346 | DEBUG    | __main__:trials:24 - Trial = 11404/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.347 | DEBUG    | __main__:trials:29 - Trial = 11404/30000 | Total reward = 36.63
2022-01-26 14:17:20.350 | DEBUG    | __main__:trials:24 - Trial = 11405/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.353 | DEBUG    | __main__:trials:29 - Trial = 11405/30000 | Total reward = 37.53
2022-01-26 14:17:20.356 | DEBUG    | __main__:trials:24 - Trial = 11406/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.357 | DEBUG    | __main__:trials:29 - Trial = 11406/30000 | Total reward = 47.77
2022-01-26 14:17:20.360 | DEBUG    | __main__:trials:24 - Trial = 11407/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.362 | DEBUG    | __main__:trials:29 - Trial = 11407/30000 | Total reward = 32.37
2022-01-26 14:17:20.365 | DEBUG    | __main__:trials:24 - Trial = 11408/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.366 | DEBUG    | __main__:trials:29 - Trial = 11408/30000 | Total reward = 35.75
2022-01-26 14:17:20.369 | DEBUG    | __main__:trials:24 - Trial = 11409/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.370 | DEBUG    | __main__:trials:29 - Trial = 11409/30000 | Total reward = 25.82
2022-01-26 14:17:20.373 | DEBUG    | __main__:trials:24 - Trial = 11410/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.374 | DEBUG    | __main__:trials:29 - Trial = 11410/30000 | Total reward = 44.94
2022-01-26 14:17:20.377 | DEBUG    | __main__:trials:24 - Trial = 11411/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.379 | DEBUG    | __main__:trials:29 - Trial = 11411/30000 | Total reward = 15.21
2022-01-26 14:17:20.382 | DEBUG    | __main__:trials:24 - Trial = 11412/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.384 | DEBUG    | __main__:trials:29 - Trial = 11412/30000 | Total reward = 36.87
2022-01-26 14:17:20.388 | DEBUG    | __main__:trials:24 - Trial = 11413/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.389 | DEBUG    | __main__:trials:29 - Trial = 11413/30000 | Total reward = 42.55
2022-01-26 14:17:20.392 | DEBUG    | __main__:trials:24 - Trial = 11414/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.393 | DEBUG    | __main__:trials:29 - Trial = 11414/30000 | Total reward = 33.61
2022-01-26 14:17:20.397 | DEBUG    | __main__:trials:24 - Trial = 11415/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.397 | DEBUG    | __main__:trials:29 - Trial = 11415/30000 | Total reward = 29.16
2022-01-26 14:17:20.401 | DEBUG    | __main__:trials:24 - Trial = 11416/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.402 | DEBUG    | __main__:trials:29 - Trial = 11416/30000 | Total reward = 35.75
2022-01-26 14:17:20.406 | DEBUG    | __main__:trials:24 - Trial = 11417/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.407 | DEBUG    | __main__:trials:29 - Trial = 11417/30000 | Total reward = 39.68
2022-01-26 14:17:20.409 | DEBUG    | __main__:trials:26 - Trial = 11418/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.410 | DEBUG    | __main__:trials:29 - Trial = 11418/30000 | Total reward = 13.86
2022-01-26 14:17:20.413 | DEBUG    | __main__:trials:24 - Trial = 11419/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.415 | DEBUG    | __main__:trials:29 - Trial = 11419/30000 | Total reward = 31.36
2022-01-26 14:17:20.418 | DEBUG    | __main__:trials:24 - Trial = 11420/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.419 | DEBUG    | __main__:trials:29 - Trial = 11420/30000 | Total reward = 31.23
2022-01-26 14:17:20.423 | DEBUG    | __main__:trials:24 - Trial = 11421/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.424 | DEBUG    | __main__:trials:29 - Trial = 11421/30000 | Total reward = 33.25
2022-01-26 14:17:20.427 | DEBUG    | __main__:trials:24 - Trial = 11422/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.428 | DEBUG    | __main__:trials:29 - Trial = 11422/30000 | Total reward = 32.55
2022-01-26 14:17:20.432 | DEBUG    | __main__:trials:24 - Trial = 11423/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.434 | DEBUG    | __main__:trials:29 - Trial = 11423/30000 | Total reward = 34.17
2022-01-26 14:17:20.437 | DEBUG    | __main__:trials:24 - Trial = 11424/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.438 | DEBUG    | __main__:trials:29 - Trial = 11424/30000 | Total reward = 45.23
2022-01-26 14:17:20.441 | DEBUG    | __main__:trials:26 - Trial = 11425/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.443 | DEBUG    | __main__:trials:29 - Trial = 11425/30000 | Total reward = 27.92
2022-01-26 14:17:20.447 | DEBUG    | __main__:trials:24 - Trial = 11426/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.448 | DEBUG    | __main__:trials:29 - Trial = 11426/30000 | Total reward = 33.03
2022-01-26 14:17:20.451 | DEBUG    | __main__:trials:24 - Trial = 11427/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.452 | DEBUG    | __main__:trials:29 - Trial = 11427/30000 | Total reward = 34.64
2022-01-26 14:17:20.456 | DEBUG    | __main__:trials:24 - Trial = 11428/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.457 | DEBUG    | __main__:trials:29 - Trial = 11428/30000 | Total reward = 43.72
2022-01-26 14:17:20.460 | DEBUG    | __main__:trials:24 - Trial = 11429/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.462 | DEBUG    | __main__:trials:29 - Trial = 11429/30000 | Total reward = 46.48
2022-01-26 14:17:20.465 | DEBUG    | __main__:trials:24 - Trial = 11430/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.466 | DEBUG    | __main__:trials:29 - Trial = 11430/30000 | Total reward = 34.37
2022-01-26 14:17:20.470 | DEBUG    | __main__:trials:24 - Trial = 11431/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.471 | DEBUG    | __main__:trials:29 - Trial = 11431/30000 | Total reward = 33.89
2022-01-26 14:17:20.474 | DEBUG    | __main__:trials:24 - Trial = 11432/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.475 | DEBUG    | __main__:trials:29 - Trial = 11432/30000 | Total reward = 26.68
2022-01-26 14:17:20.479 | DEBUG    | __main__:trials:24 - Trial = 11433/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.480 | DEBUG    | __main__:trials:29 - Trial = 11433/30000 | Total reward = 45.04
2022-01-26 14:17:20.482 | DEBUG    | __main__:trials:26 - Trial = 11434/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.483 | DEBUG    | __main__:trials:29 - Trial = 11434/30000 | Total reward = 10.25
2022-01-26 14:17:20.487 | DEBUG    | __main__:trials:24 - Trial = 11435/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.488 | DEBUG    | __main__:trials:29 - Trial = 11435/30000 | Total reward = 35.00
2022-01-26 14:17:20.491 | DEBUG    | __main__:trials:24 - Trial = 11436/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.492 | DEBUG    | __main__:trials:29 - Trial = 11436/30000 | Total reward = 32.91
2022-01-26 14:17:20.496 | DEBUG    | __main__:trials:24 - Trial = 11437/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.496 | DEBUG    | __main__:trials:29 - Trial = 11437/30000 | Total reward = 35.31
2022-01-26 14:17:20.500 | DEBUG    | __main__:trials:24 - Trial = 11438/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.501 | DEBUG    | __main__:trials:29 - Trial = 11438/30000 | Total reward = 44.91
2022-01-26 14:17:20.504 | DEBUG    | __main__:trials:24 - Trial = 11439/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.506 | DEBUG    | __main__:trials:29 - Trial = 11439/30000 | Total reward = 60.53
2022-01-26 14:17:20.510 | DEBUG    | __main__:trials:24 - Trial = 11440/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.510 | DEBUG    | __main__:trials:29 - Trial = 11440/30000 | Total reward = 51.56
2022-01-26 14:17:20.514 | DEBUG    | __main__:trials:24 - Trial = 11441/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.516 | DEBUG    | __main__:trials:29 - Trial = 11441/30000 | Total reward = 33.12
2022-01-26 14:17:20.519 | DEBUG    | __main__:trials:24 - Trial = 11442/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.521 | DEBUG    | __main__:trials:29 - Trial = 11442/30000 | Total reward = 34.76
2022-01-26 14:17:20.524 | DEBUG    | __main__:trials:24 - Trial = 11443/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.525 | DEBUG    | __main__:trials:29 - Trial = 11443/30000 | Total reward = 34.34
2022-01-26 14:17:20.528 | DEBUG    | __main__:trials:24 - Trial = 11444/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.530 | DEBUG    | __main__:trials:29 - Trial = 11444/30000 | Total reward = 37.51
2022-01-26 14:17:20.533 | DEBUG    | __main__:trials:24 - Trial = 11445/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.533 | DEBUG    | __main__:trials:29 - Trial = 11445/30000 | Total reward = 46.92
2022-01-26 14:17:20.537 | DEBUG    | __main__:trials:24 - Trial = 11446/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.538 | DEBUG    | __main__:trials:29 - Trial = 11446/30000 | Total reward = 31.43
2022-01-26 14:17:20.541 | DEBUG    | __main__:trials:24 - Trial = 11447/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.542 | DEBUG    | __main__:trials:29 - Trial = 11447/30000 | Total reward = 32.87
2022-01-26 14:17:20.546 | DEBUG    | __main__:trials:24 - Trial = 11448/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.547 | DEBUG    | __main__:trials:29 - Trial = 11448/30000 | Total reward = 36.18
2022-01-26 14:17:20.550 | DEBUG    | __main__:trials:24 - Trial = 11449/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.552 | DEBUG    | __main__:trials:29 - Trial = 11449/30000 | Total reward = 34.85
2022-01-26 14:17:20.555 | DEBUG    | __main__:trials:24 - Trial = 11450/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.555 | DEBUG    | __main__:trials:29 - Trial = 11450/30000 | Total reward = 33.51
2022-01-26 14:17:20.559 | DEBUG    | __main__:trials:24 - Trial = 11451/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.561 | DEBUG    | __main__:trials:29 - Trial = 11451/30000 | Total reward = 35.79
2022-01-26 14:17:20.564 | DEBUG    | __main__:trials:24 - Trial = 11452/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.564 | DEBUG    | __main__:trials:29 - Trial = 11452/30000 | Total reward = 43.84
2022-01-26 14:17:20.568 | DEBUG    | __main__:trials:24 - Trial = 11453/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.568 | DEBUG    | __main__:trials:29 - Trial = 11453/30000 | Total reward = 37.26
2022-01-26 14:17:20.572 | DEBUG    | __main__:trials:24 - Trial = 11454/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.574 | DEBUG    | __main__:trials:29 - Trial = 11454/30000 | Total reward = 34.06
2022-01-26 14:17:20.577 | DEBUG    | __main__:trials:24 - Trial = 11455/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.578 | DEBUG    | __main__:trials:29 - Trial = 11455/30000 | Total reward = 30.46
2022-01-26 14:17:20.582 | DEBUG    | __main__:trials:24 - Trial = 11456/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.582 | DEBUG    | __main__:trials:29 - Trial = 11456/30000 | Total reward = 40.58
2022-01-26 14:17:20.586 | DEBUG    | __main__:trials:24 - Trial = 11457/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.587 | DEBUG    | __main__:trials:29 - Trial = 11457/30000 | Total reward = 38.10
2022-01-26 14:17:20.590 | DEBUG    | __main__:trials:24 - Trial = 11458/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.592 | DEBUG    | __main__:trials:29 - Trial = 11458/30000 | Total reward = 31.24
2022-01-26 14:17:20.595 | DEBUG    | __main__:trials:24 - Trial = 11459/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.595 | DEBUG    | __main__:trials:29 - Trial = 11459/30000 | Total reward = 26.30
2022-01-26 14:17:20.599 | DEBUG    | __main__:trials:24 - Trial = 11460/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.599 | DEBUG    | __main__:trials:29 - Trial = 11460/30000 | Total reward = 40.28
2022-01-26 14:17:20.603 | DEBUG    | __main__:trials:24 - Trial = 11461/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.605 | DEBUG    | __main__:trials:29 - Trial = 11461/30000 | Total reward = 56.35
2022-01-26 14:17:20.608 | DEBUG    | __main__:trials:24 - Trial = 11462/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.609 | DEBUG    | __main__:trials:29 - Trial = 11462/30000 | Total reward = 39.27
2022-01-26 14:17:20.612 | DEBUG    | __main__:trials:24 - Trial = 11463/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.614 | DEBUG    | __main__:trials:29 - Trial = 11463/30000 | Total reward = 29.45
2022-01-26 14:17:20.617 | DEBUG    | __main__:trials:24 - Trial = 11464/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.618 | DEBUG    | __main__:trials:29 - Trial = 11464/30000 | Total reward = 29.69
2022-01-26 14:17:20.621 | DEBUG    | __main__:trials:24 - Trial = 11465/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.621 | DEBUG    | __main__:trials:29 - Trial = 11465/30000 | Total reward = 39.90
2022-01-26 14:17:20.626 | DEBUG    | __main__:trials:24 - Trial = 11466/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.627 | DEBUG    | __main__:trials:29 - Trial = 11466/30000 | Total reward = 48.10
2022-01-26 14:17:20.630 | DEBUG    | __main__:trials:24 - Trial = 11467/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.632 | DEBUG    | __main__:trials:29 - Trial = 11467/30000 | Total reward = 29.45
2022-01-26 14:17:20.635 | DEBUG    | __main__:trials:24 - Trial = 11468/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.637 | DEBUG    | __main__:trials:29 - Trial = 11468/30000 | Total reward = 33.70
2022-01-26 14:17:20.640 | DEBUG    | __main__:trials:24 - Trial = 11469/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.641 | DEBUG    | __main__:trials:29 - Trial = 11469/30000 | Total reward = 28.74
2022-01-26 14:17:20.644 | DEBUG    | __main__:trials:24 - Trial = 11470/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.645 | DEBUG    | __main__:trials:29 - Trial = 11470/30000 | Total reward = 43.23
2022-01-26 14:17:20.649 | DEBUG    | __main__:trials:24 - Trial = 11471/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.650 | DEBUG    | __main__:trials:29 - Trial = 11471/30000 | Total reward = 30.78
2022-01-26 14:17:20.654 | DEBUG    | __main__:trials:24 - Trial = 11472/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.655 | DEBUG    | __main__:trials:29 - Trial = 11472/30000 | Total reward = 58.45
2022-01-26 14:17:20.658 | DEBUG    | __main__:trials:24 - Trial = 11473/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.660 | DEBUG    | __main__:trials:29 - Trial = 11473/30000 | Total reward = 33.53
2022-01-26 14:17:20.664 | DEBUG    | __main__:trials:24 - Trial = 11474/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.666 | DEBUG    | __main__:trials:29 - Trial = 11474/30000 | Total reward = 23.53
2022-01-26 14:17:20.669 | DEBUG    | __main__:trials:24 - Trial = 11475/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.671 | DEBUG    | __main__:trials:29 - Trial = 11475/30000 | Total reward = 49.73
2022-01-26 14:17:20.674 | DEBUG    | __main__:trials:24 - Trial = 11476/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.676 | DEBUG    | __main__:trials:29 - Trial = 11476/30000 | Total reward = 41.84
2022-01-26 14:17:20.679 | DEBUG    | __main__:trials:24 - Trial = 11477/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.681 | DEBUG    | __main__:trials:29 - Trial = 11477/30000 | Total reward = 39.29
2022-01-26 14:17:20.684 | DEBUG    | __main__:trials:24 - Trial = 11478/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.686 | DEBUG    | __main__:trials:29 - Trial = 11478/30000 | Total reward = 55.35
2022-01-26 14:17:20.690 | DEBUG    | __main__:trials:24 - Trial = 11479/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.691 | DEBUG    | __main__:trials:29 - Trial = 11479/30000 | Total reward = 29.15
2022-01-26 14:17:20.695 | DEBUG    | __main__:trials:24 - Trial = 11480/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.697 | DEBUG    | __main__:trials:29 - Trial = 11480/30000 | Total reward = 36.73
2022-01-26 14:17:20.700 | DEBUG    | __main__:trials:24 - Trial = 11481/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.702 | DEBUG    | __main__:trials:29 - Trial = 11481/30000 | Total reward = 34.49
2022-01-26 14:17:20.705 | DEBUG    | __main__:trials:24 - Trial = 11482/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.707 | DEBUG    | __main__:trials:29 - Trial = 11482/30000 | Total reward = 39.91
2022-01-26 14:17:20.710 | DEBUG    | __main__:trials:24 - Trial = 11483/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.712 | DEBUG    | __main__:trials:29 - Trial = 11483/30000 | Total reward = 33.08
2022-01-26 14:17:20.716 | DEBUG    | __main__:trials:24 - Trial = 11484/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.717 | DEBUG    | __main__:trials:29 - Trial = 11484/30000 | Total reward = 44.57
2022-01-26 14:17:20.720 | DEBUG    | __main__:trials:24 - Trial = 11485/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.721 | DEBUG    | __main__:trials:29 - Trial = 11485/30000 | Total reward = 35.37
2022-01-26 14:17:20.724 | DEBUG    | __main__:trials:24 - Trial = 11486/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.725 | DEBUG    | __main__:trials:29 - Trial = 11486/30000 | Total reward = 36.84
2022-01-26 14:17:20.729 | DEBUG    | __main__:trials:26 - Trial = 11487/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.730 | DEBUG    | __main__:trials:29 - Trial = 11487/30000 | Total reward = 30.30
2022-01-26 14:17:20.733 | DEBUG    | __main__:trials:24 - Trial = 11488/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.735 | DEBUG    | __main__:trials:29 - Trial = 11488/30000 | Total reward = 35.12
2022-01-26 14:17:20.737 | DEBUG    | __main__:trials:24 - Trial = 11489/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.739 | DEBUG    | __main__:trials:29 - Trial = 11489/30000 | Total reward = 28.36
2022-01-26 14:17:20.743 | DEBUG    | __main__:trials:24 - Trial = 11490/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.745 | DEBUG    | __main__:trials:29 - Trial = 11490/30000 | Total reward = 32.05
2022-01-26 14:17:20.748 | DEBUG    | __main__:trials:24 - Trial = 11491/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.750 | DEBUG    | __main__:trials:29 - Trial = 11491/30000 | Total reward = 34.19
2022-01-26 14:17:20.753 | DEBUG    | __main__:trials:24 - Trial = 11492/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.755 | DEBUG    | __main__:trials:29 - Trial = 11492/30000 | Total reward = 58.04
2022-01-26 14:17:20.759 | DEBUG    | __main__:trials:24 - Trial = 11493/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.760 | DEBUG    | __main__:trials:29 - Trial = 11493/30000 | Total reward = 21.28
2022-01-26 14:17:20.764 | DEBUG    | __main__:trials:24 - Trial = 11494/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.765 | DEBUG    | __main__:trials:29 - Trial = 11494/30000 | Total reward = 57.36
2022-01-26 14:17:20.768 | DEBUG    | __main__:trials:26 - Trial = 11495/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.770 | DEBUG    | __main__:trials:29 - Trial = 11495/30000 | Total reward = 3.28
2022-01-26 14:17:20.773 | DEBUG    | __main__:trials:24 - Trial = 11496/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.775 | DEBUG    | __main__:trials:29 - Trial = 11496/30000 | Total reward = 34.71
2022-01-26 14:17:20.779 | DEBUG    | __main__:trials:24 - Trial = 11497/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.780 | DEBUG    | __main__:trials:29 - Trial = 11497/30000 | Total reward = 37.25
2022-01-26 14:17:20.784 | DEBUG    | __main__:trials:24 - Trial = 11498/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.785 | DEBUG    | __main__:trials:29 - Trial = 11498/30000 | Total reward = 42.98
2022-01-26 14:17:20.789 | DEBUG    | __main__:trials:24 - Trial = 11499/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.791 | DEBUG    | __main__:trials:29 - Trial = 11499/30000 | Total reward = 47.62
2022-01-26 14:17:20.794 | DEBUG    | __main__:trials:24 - Trial = 11500/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.796 | DEBUG    | __main__:trials:29 - Trial = 11500/30000 | Total reward = 33.36
2022-01-26 14:17:20.800 | DEBUG    | __main__:trials:24 - Trial = 11501/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.801 | DEBUG    | __main__:trials:29 - Trial = 11501/30000 | Total reward = 32.48
2022-01-26 14:17:20.805 | DEBUG    | __main__:trials:24 - Trial = 11502/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.806 | DEBUG    | __main__:trials:29 - Trial = 11502/30000 | Total reward = 33.36
2022-01-26 14:17:20.810 | DEBUG    | __main__:trials:24 - Trial = 11503/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.811 | DEBUG    | __main__:trials:29 - Trial = 11503/30000 | Total reward = 17.15
2022-01-26 14:17:20.815 | DEBUG    | __main__:trials:26 - Trial = 11504/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.817 | DEBUG    | __main__:trials:29 - Trial = 11504/30000 | Total reward = 24.55
2022-01-26 14:17:20.820 | DEBUG    | __main__:trials:24 - Trial = 11505/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.822 | DEBUG    | __main__:trials:29 - Trial = 11505/30000 | Total reward = 25.71
2022-01-26 14:17:20.826 | DEBUG    | __main__:trials:24 - Trial = 11506/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.827 | DEBUG    | __main__:trials:29 - Trial = 11506/30000 | Total reward = 36.09
2022-01-26 14:17:20.830 | DEBUG    | __main__:trials:24 - Trial = 11507/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.831 | DEBUG    | __main__:trials:29 - Trial = 11507/30000 | Total reward = 32.84
2022-01-26 14:17:20.835 | DEBUG    | __main__:trials:24 - Trial = 11508/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.836 | DEBUG    | __main__:trials:29 - Trial = 11508/30000 | Total reward = 29.22
2022-01-26 14:17:20.840 | DEBUG    | __main__:trials:24 - Trial = 11509/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.842 | DEBUG    | __main__:trials:29 - Trial = 11509/30000 | Total reward = 38.18
2022-01-26 14:17:20.845 | DEBUG    | __main__:trials:26 - Trial = 11510/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.847 | DEBUG    | __main__:trials:29 - Trial = 11510/30000 | Total reward = 19.35
2022-01-26 14:17:20.850 | DEBUG    | __main__:trials:24 - Trial = 11511/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.852 | DEBUG    | __main__:trials:29 - Trial = 11511/30000 | Total reward = 57.24
2022-01-26 14:17:20.856 | DEBUG    | __main__:trials:24 - Trial = 11512/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.857 | DEBUG    | __main__:trials:29 - Trial = 11512/30000 | Total reward = 29.32
2022-01-26 14:17:20.860 | DEBUG    | __main__:trials:24 - Trial = 11513/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.862 | DEBUG    | __main__:trials:29 - Trial = 11513/30000 | Total reward = 46.67
2022-01-26 14:17:20.866 | DEBUG    | __main__:trials:24 - Trial = 11514/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.868 | DEBUG    | __main__:trials:29 - Trial = 11514/30000 | Total reward = 48.76
2022-01-26 14:17:20.871 | DEBUG    | __main__:trials:24 - Trial = 11515/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.873 | DEBUG    | __main__:trials:29 - Trial = 11515/30000 | Total reward = 40.31
2022-01-26 14:17:20.877 | DEBUG    | __main__:trials:24 - Trial = 11516/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.878 | DEBUG    | __main__:trials:29 - Trial = 11516/30000 | Total reward = 24.40
2022-01-26 14:17:20.882 | DEBUG    | __main__:trials:24 - Trial = 11517/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.883 | DEBUG    | __main__:trials:29 - Trial = 11517/30000 | Total reward = 31.53
2022-01-26 14:17:20.886 | DEBUG    | __main__:trials:24 - Trial = 11518/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.888 | DEBUG    | __main__:trials:29 - Trial = 11518/30000 | Total reward = 29.10
2022-01-26 14:17:20.891 | DEBUG    | __main__:trials:24 - Trial = 11519/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.893 | DEBUG    | __main__:trials:29 - Trial = 11519/30000 | Total reward = 29.10
2022-01-26 14:17:20.897 | DEBUG    | __main__:trials:24 - Trial = 11520/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.899 | DEBUG    | __main__:trials:29 - Trial = 11520/30000 | Total reward = 29.22
2022-01-26 14:17:20.902 | DEBUG    | __main__:trials:24 - Trial = 11521/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.904 | DEBUG    | __main__:trials:29 - Trial = 11521/30000 | Total reward = 29.22
2022-01-26 14:17:20.907 | DEBUG    | __main__:trials:24 - Trial = 11522/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.909 | DEBUG    | __main__:trials:29 - Trial = 11522/30000 | Total reward = 24.97
2022-01-26 14:17:20.912 | DEBUG    | __main__:trials:24 - Trial = 11523/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.914 | DEBUG    | __main__:trials:29 - Trial = 11523/30000 | Total reward = 37.41
2022-01-26 14:17:20.917 | DEBUG    | __main__:trials:24 - Trial = 11524/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.919 | DEBUG    | __main__:trials:29 - Trial = 11524/30000 | Total reward = 27.34
2022-01-26 14:17:20.922 | DEBUG    | __main__:trials:24 - Trial = 11525/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.924 | DEBUG    | __main__:trials:29 - Trial = 11525/30000 | Total reward = 33.56
2022-01-26 14:17:20.927 | DEBUG    | __main__:trials:24 - Trial = 11526/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.928 | DEBUG    | __main__:trials:29 - Trial = 11526/30000 | Total reward = 45.96
2022-01-26 14:17:20.932 | DEBUG    | __main__:trials:24 - Trial = 11527/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.934 | DEBUG    | __main__:trials:29 - Trial = 11527/30000 | Total reward = 29.10
2022-01-26 14:17:20.937 | DEBUG    | __main__:trials:24 - Trial = 11528/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.939 | DEBUG    | __main__:trials:29 - Trial = 11528/30000 | Total reward = 27.08
2022-01-26 14:17:20.942 | DEBUG    | __main__:trials:26 - Trial = 11529/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.944 | DEBUG    | __main__:trials:29 - Trial = 11529/30000 | Total reward = 16.68
2022-01-26 14:17:20.947 | DEBUG    | __main__:trials:24 - Trial = 11530/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.949 | DEBUG    | __main__:trials:29 - Trial = 11530/30000 | Total reward = 27.32
2022-01-26 14:17:20.952 | DEBUG    | __main__:trials:24 - Trial = 11531/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.953 | DEBUG    | __main__:trials:29 - Trial = 11531/30000 | Total reward = 24.96
2022-01-26 14:17:20.958 | DEBUG    | __main__:trials:24 - Trial = 11532/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.959 | DEBUG    | __main__:trials:29 - Trial = 11532/30000 | Total reward = 25.48
2022-01-26 14:17:20.963 | DEBUG    | __main__:trials:26 - Trial = 11533/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:20.964 | DEBUG    | __main__:trials:29 - Trial = 11533/30000 | Total reward = -5.30
2022-01-26 14:17:20.968 | DEBUG    | __main__:trials:24 - Trial = 11534/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.969 | DEBUG    | __main__:trials:29 - Trial = 11534/30000 | Total reward = 46.63
2022-01-26 14:17:20.973 | DEBUG    | __main__:trials:24 - Trial = 11535/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.974 | DEBUG    | __main__:trials:29 - Trial = 11535/30000 | Total reward = 30.98
2022-01-26 14:17:20.978 | DEBUG    | __main__:trials:24 - Trial = 11536/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.979 | DEBUG    | __main__:trials:29 - Trial = 11536/30000 | Total reward = 29.05
2022-01-26 14:17:20.982 | DEBUG    | __main__:trials:24 - Trial = 11537/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.984 | DEBUG    | __main__:trials:29 - Trial = 11537/30000 | Total reward = 49.78
2022-01-26 14:17:20.988 | DEBUG    | __main__:trials:24 - Trial = 11538/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.989 | DEBUG    | __main__:trials:29 - Trial = 11538/30000 | Total reward = 29.85
2022-01-26 14:17:20.992 | DEBUG    | __main__:trials:24 - Trial = 11539/30000 | Max number of steps (20) reached
2022-01-26 14:17:20.994 | DEBUG    | __main__:trials:29 - Trial = 11539/30000 | Total reward = 35.27
2022-01-26 14:17:20.998 | DEBUG    | __main__:trials:24 - Trial = 11540/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.000 | DEBUG    | __main__:trials:29 - Trial = 11540/30000 | Total reward = 42.87
2022-01-26 14:17:21.003 | DEBUG    | __main__:trials:26 - Trial = 11541/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.005 | DEBUG    | __main__:trials:29 - Trial = 11541/30000 | Total reward = 13.87
2022-01-26 14:17:21.008 | DEBUG    | __main__:trials:24 - Trial = 11542/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.010 | DEBUG    | __main__:trials:29 - Trial = 11542/30000 | Total reward = 27.91
2022-01-26 14:17:21.013 | DEBUG    | __main__:trials:24 - Trial = 11543/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.014 | DEBUG    | __main__:trials:29 - Trial = 11543/30000 | Total reward = 37.03
2022-01-26 14:17:21.017 | DEBUG    | __main__:trials:24 - Trial = 11544/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.018 | DEBUG    | __main__:trials:29 - Trial = 11544/30000 | Total reward = 34.87
2022-01-26 14:17:21.022 | DEBUG    | __main__:trials:24 - Trial = 11545/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.023 | DEBUG    | __main__:trials:29 - Trial = 11545/30000 | Total reward = 36.22
2022-01-26 14:17:21.026 | DEBUG    | __main__:trials:24 - Trial = 11546/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.028 | DEBUG    | __main__:trials:29 - Trial = 11546/30000 | Total reward = 29.23
2022-01-26 14:17:21.032 | DEBUG    | __main__:trials:24 - Trial = 11547/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.032 | DEBUG    | __main__:trials:29 - Trial = 11547/30000 | Total reward = 55.83
2022-01-26 14:17:21.036 | DEBUG    | __main__:trials:26 - Trial = 11548/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.038 | DEBUG    | __main__:trials:29 - Trial = 11548/30000 | Total reward = 3.57
2022-01-26 14:17:21.041 | DEBUG    | __main__:trials:24 - Trial = 11549/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.042 | DEBUG    | __main__:trials:29 - Trial = 11549/30000 | Total reward = 29.26
2022-01-26 14:17:21.046 | DEBUG    | __main__:trials:24 - Trial = 11550/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.047 | DEBUG    | __main__:trials:29 - Trial = 11550/30000 | Total reward = 29.26
2022-01-26 14:17:21.051 | DEBUG    | __main__:trials:24 - Trial = 11551/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.051 | DEBUG    | __main__:trials:29 - Trial = 11551/30000 | Total reward = 33.33
2022-01-26 14:17:21.055 | DEBUG    | __main__:trials:24 - Trial = 11552/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.056 | DEBUG    | __main__:trials:29 - Trial = 11552/30000 | Total reward = 29.25
2022-01-26 14:17:21.060 | DEBUG    | __main__:trials:24 - Trial = 11553/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.062 | DEBUG    | __main__:trials:29 - Trial = 11553/30000 | Total reward = 29.36
2022-01-26 14:17:21.066 | DEBUG    | __main__:trials:24 - Trial = 11554/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.067 | DEBUG    | __main__:trials:29 - Trial = 11554/30000 | Total reward = 26.83
2022-01-26 14:17:21.070 | DEBUG    | __main__:trials:24 - Trial = 11555/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.072 | DEBUG    | __main__:trials:29 - Trial = 11555/30000 | Total reward = 36.82
2022-01-26 14:17:21.076 | DEBUG    | __main__:trials:24 - Trial = 11556/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.077 | DEBUG    | __main__:trials:29 - Trial = 11556/30000 | Total reward = 29.22
2022-01-26 14:17:21.081 | DEBUG    | __main__:trials:24 - Trial = 11557/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.082 | DEBUG    | __main__:trials:29 - Trial = 11557/30000 | Total reward = 25.35
2022-01-26 14:17:21.085 | DEBUG    | __main__:trials:24 - Trial = 11558/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.087 | DEBUG    | __main__:trials:29 - Trial = 11558/30000 | Total reward = 56.51
2022-01-26 14:17:21.091 | DEBUG    | __main__:trials:24 - Trial = 11559/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.093 | DEBUG    | __main__:trials:29 - Trial = 11559/30000 | Total reward = 29.22
2022-01-26 14:17:21.096 | DEBUG    | __main__:trials:24 - Trial = 11560/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.098 | DEBUG    | __main__:trials:29 - Trial = 11560/30000 | Total reward = 29.37
2022-01-26 14:17:21.101 | DEBUG    | __main__:trials:24 - Trial = 11561/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.103 | DEBUG    | __main__:trials:29 - Trial = 11561/30000 | Total reward = 29.98
2022-01-26 14:17:21.107 | DEBUG    | __main__:trials:24 - Trial = 11562/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.108 | DEBUG    | __main__:trials:29 - Trial = 11562/30000 | Total reward = 29.06
2022-01-26 14:17:21.112 | DEBUG    | __main__:trials:24 - Trial = 11563/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.113 | DEBUG    | __main__:trials:29 - Trial = 11563/30000 | Total reward = 29.22
2022-01-26 14:17:21.116 | DEBUG    | __main__:trials:24 - Trial = 11564/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.118 | DEBUG    | __main__:trials:29 - Trial = 11564/30000 | Total reward = 30.97
2022-01-26 14:17:21.122 | DEBUG    | __main__:trials:24 - Trial = 11565/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.123 | DEBUG    | __main__:trials:29 - Trial = 11565/30000 | Total reward = 17.53
2022-01-26 14:17:21.127 | DEBUG    | __main__:trials:24 - Trial = 11566/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.129 | DEBUG    | __main__:trials:29 - Trial = 11566/30000 | Total reward = 29.34
2022-01-26 14:17:21.132 | DEBUG    | __main__:trials:24 - Trial = 11567/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.133 | DEBUG    | __main__:trials:29 - Trial = 11567/30000 | Total reward = 55.93
2022-01-26 14:17:21.137 | DEBUG    | __main__:trials:24 - Trial = 11568/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.138 | DEBUG    | __main__:trials:29 - Trial = 11568/30000 | Total reward = 37.68
2022-01-26 14:17:21.142 | DEBUG    | __main__:trials:24 - Trial = 11569/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.143 | DEBUG    | __main__:trials:29 - Trial = 11569/30000 | Total reward = 41.80
2022-01-26 14:17:21.147 | DEBUG    | __main__:trials:24 - Trial = 11570/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.148 | DEBUG    | __main__:trials:29 - Trial = 11570/30000 | Total reward = 62.97
2022-01-26 14:17:21.152 | DEBUG    | __main__:trials:24 - Trial = 11571/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.153 | DEBUG    | __main__:trials:29 - Trial = 11571/30000 | Total reward = 39.04
2022-01-26 14:17:21.157 | DEBUG    | __main__:trials:24 - Trial = 11572/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.157 | DEBUG    | __main__:trials:29 - Trial = 11572/30000 | Total reward = 29.26
2022-01-26 14:17:21.161 | DEBUG    | __main__:trials:24 - Trial = 11573/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.163 | DEBUG    | __main__:trials:29 - Trial = 11573/30000 | Total reward = 36.04
2022-01-26 14:17:21.166 | DEBUG    | __main__:trials:26 - Trial = 11574/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.168 | DEBUG    | __main__:trials:29 - Trial = 11574/30000 | Total reward = 17.40
2022-01-26 14:17:21.171 | DEBUG    | __main__:trials:24 - Trial = 11575/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.173 | DEBUG    | __main__:trials:29 - Trial = 11575/30000 | Total reward = 40.79
2022-01-26 14:17:21.176 | DEBUG    | __main__:trials:24 - Trial = 11576/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.176 | DEBUG    | __main__:trials:29 - Trial = 11576/30000 | Total reward = 37.41
2022-01-26 14:17:21.180 | DEBUG    | __main__:trials:24 - Trial = 11577/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.181 | DEBUG    | __main__:trials:29 - Trial = 11577/30000 | Total reward = 37.03
2022-01-26 14:17:21.185 | DEBUG    | __main__:trials:26 - Trial = 11578/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.186 | DEBUG    | __main__:trials:29 - Trial = 11578/30000 | Total reward = 15.85
2022-01-26 14:17:21.189 | DEBUG    | __main__:trials:24 - Trial = 11579/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.190 | DEBUG    | __main__:trials:29 - Trial = 11579/30000 | Total reward = 32.12
2022-01-26 14:17:21.193 | DEBUG    | __main__:trials:24 - Trial = 11580/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.194 | DEBUG    | __main__:trials:29 - Trial = 11580/30000 | Total reward = 43.36
2022-01-26 14:17:21.196 | DEBUG    | __main__:trials:26 - Trial = 11581/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.197 | DEBUG    | __main__:trials:29 - Trial = 11581/30000 | Total reward = 12.11
2022-01-26 14:17:21.200 | DEBUG    | __main__:trials:24 - Trial = 11582/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.201 | DEBUG    | __main__:trials:29 - Trial = 11582/30000 | Total reward = 29.18
2022-01-26 14:17:21.204 | DEBUG    | __main__:trials:24 - Trial = 11583/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.206 | DEBUG    | __main__:trials:29 - Trial = 11583/30000 | Total reward = 33.02
2022-01-26 14:17:21.209 | DEBUG    | __main__:trials:24 - Trial = 11584/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.210 | DEBUG    | __main__:trials:29 - Trial = 11584/30000 | Total reward = 43.19
2022-01-26 14:17:21.213 | DEBUG    | __main__:trials:24 - Trial = 11585/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.214 | DEBUG    | __main__:trials:29 - Trial = 11585/30000 | Total reward = 37.68
2022-01-26 14:17:21.217 | DEBUG    | __main__:trials:24 - Trial = 11586/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.218 | DEBUG    | __main__:trials:29 - Trial = 11586/30000 | Total reward = 36.81
2022-01-26 14:17:21.221 | DEBUG    | __main__:trials:24 - Trial = 11587/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.222 | DEBUG    | __main__:trials:29 - Trial = 11587/30000 | Total reward = 28.75
2022-01-26 14:17:21.225 | DEBUG    | __main__:trials:24 - Trial = 11588/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.227 | DEBUG    | __main__:trials:29 - Trial = 11588/30000 | Total reward = 29.37
2022-01-26 14:17:21.231 | DEBUG    | __main__:trials:24 - Trial = 11589/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.231 | DEBUG    | __main__:trials:29 - Trial = 11589/30000 | Total reward = 29.69
2022-01-26 14:17:21.235 | DEBUG    | __main__:trials:24 - Trial = 11590/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.236 | DEBUG    | __main__:trials:29 - Trial = 11590/30000 | Total reward = 29.09
2022-01-26 14:17:21.238 | DEBUG    | __main__:trials:26 - Trial = 11591/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.240 | DEBUG    | __main__:trials:29 - Trial = 11591/30000 | Total reward = 7.00
2022-01-26 14:17:21.243 | DEBUG    | __main__:trials:24 - Trial = 11592/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.244 | DEBUG    | __main__:trials:29 - Trial = 11592/30000 | Total reward = 37.35
2022-01-26 14:17:21.248 | DEBUG    | __main__:trials:24 - Trial = 11593/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.249 | DEBUG    | __main__:trials:29 - Trial = 11593/30000 | Total reward = 36.08
2022-01-26 14:17:21.252 | DEBUG    | __main__:trials:24 - Trial = 11594/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.254 | DEBUG    | __main__:trials:29 - Trial = 11594/30000 | Total reward = 28.66
2022-01-26 14:17:21.258 | DEBUG    | __main__:trials:24 - Trial = 11595/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.260 | DEBUG    | __main__:trials:29 - Trial = 11595/30000 | Total reward = 41.22
2022-01-26 14:17:21.263 | DEBUG    | __main__:trials:24 - Trial = 11596/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.263 | DEBUG    | __main__:trials:29 - Trial = 11596/30000 | Total reward = 25.08
2022-01-26 14:17:21.267 | DEBUG    | __main__:trials:24 - Trial = 11597/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.268 | DEBUG    | __main__:trials:29 - Trial = 11597/30000 | Total reward = 29.26
2022-01-26 14:17:21.272 | DEBUG    | __main__:trials:26 - Trial = 11598/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.273 | DEBUG    | __main__:trials:29 - Trial = 11598/30000 | Total reward = 23.72
2022-01-26 14:17:21.277 | DEBUG    | __main__:trials:26 - Trial = 11599/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.278 | DEBUG    | __main__:trials:29 - Trial = 11599/30000 | Total reward = 14.59
2022-01-26 14:17:21.282 | DEBUG    | __main__:trials:24 - Trial = 11600/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.283 | DEBUG    | __main__:trials:29 - Trial = 11600/30000 | Total reward = 36.57
2022-01-26 14:17:21.287 | DEBUG    | __main__:trials:24 - Trial = 11601/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.289 | DEBUG    | __main__:trials:29 - Trial = 11601/30000 | Total reward = 24.70
2022-01-26 14:17:21.292 | DEBUG    | __main__:trials:24 - Trial = 11602/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.294 | DEBUG    | __main__:trials:29 - Trial = 11602/30000 | Total reward = 33.73
2022-01-26 14:17:21.297 | DEBUG    | __main__:trials:24 - Trial = 11603/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.299 | DEBUG    | __main__:trials:29 - Trial = 11603/30000 | Total reward = 37.23
2022-01-26 14:17:21.302 | DEBUG    | __main__:trials:24 - Trial = 11604/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.304 | DEBUG    | __main__:trials:29 - Trial = 11604/30000 | Total reward = 29.26
2022-01-26 14:17:21.308 | DEBUG    | __main__:trials:24 - Trial = 11605/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.309 | DEBUG    | __main__:trials:29 - Trial = 11605/30000 | Total reward = 24.35
2022-01-26 14:17:21.313 | DEBUG    | __main__:trials:24 - Trial = 11606/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.315 | DEBUG    | __main__:trials:29 - Trial = 11606/30000 | Total reward = 21.09
2022-01-26 14:17:21.318 | DEBUG    | __main__:trials:24 - Trial = 11607/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.320 | DEBUG    | __main__:trials:29 - Trial = 11607/30000 | Total reward = 40.68
2022-01-26 14:17:21.324 | DEBUG    | __main__:trials:24 - Trial = 11608/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.325 | DEBUG    | __main__:trials:29 - Trial = 11608/30000 | Total reward = 26.52
2022-01-26 14:17:21.328 | DEBUG    | __main__:trials:24 - Trial = 11609/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.330 | DEBUG    | __main__:trials:29 - Trial = 11609/30000 | Total reward = 53.89
2022-01-26 14:17:21.333 | DEBUG    | __main__:trials:24 - Trial = 11610/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.334 | DEBUG    | __main__:trials:29 - Trial = 11610/30000 | Total reward = 29.30
2022-01-26 14:17:21.338 | DEBUG    | __main__:trials:24 - Trial = 11611/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.339 | DEBUG    | __main__:trials:29 - Trial = 11611/30000 | Total reward = 29.22
2022-01-26 14:17:21.343 | DEBUG    | __main__:trials:24 - Trial = 11612/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.345 | DEBUG    | __main__:trials:29 - Trial = 11612/30000 | Total reward = 29.90
2022-01-26 14:17:21.349 | DEBUG    | __main__:trials:24 - Trial = 11613/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.351 | DEBUG    | __main__:trials:29 - Trial = 11613/30000 | Total reward = 25.03
2022-01-26 14:17:21.352 | DEBUG    | __main__:trials:26 - Trial = 11614/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.354 | DEBUG    | __main__:trials:29 - Trial = 11614/30000 | Total reward = 7.56
2022-01-26 14:17:21.358 | DEBUG    | __main__:trials:24 - Trial = 11615/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.358 | DEBUG    | __main__:trials:29 - Trial = 11615/30000 | Total reward = 31.77
2022-01-26 14:17:21.362 | DEBUG    | __main__:trials:24 - Trial = 11616/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.364 | DEBUG    | __main__:trials:29 - Trial = 11616/30000 | Total reward = 29.73
2022-01-26 14:17:21.368 | DEBUG    | __main__:trials:24 - Trial = 11617/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.369 | DEBUG    | __main__:trials:29 - Trial = 11617/30000 | Total reward = 31.72
2022-01-26 14:17:21.373 | DEBUG    | __main__:trials:24 - Trial = 11618/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.374 | DEBUG    | __main__:trials:29 - Trial = 11618/30000 | Total reward = 29.82
2022-01-26 14:17:21.378 | DEBUG    | __main__:trials:24 - Trial = 11619/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.380 | DEBUG    | __main__:trials:29 - Trial = 11619/30000 | Total reward = 25.09
2022-01-26 14:17:21.383 | DEBUG    | __main__:trials:26 - Trial = 11620/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.385 | DEBUG    | __main__:trials:29 - Trial = 11620/30000 | Total reward = 20.95
2022-01-26 14:17:21.388 | DEBUG    | __main__:trials:26 - Trial = 11621/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.390 | DEBUG    | __main__:trials:29 - Trial = 11621/30000 | Total reward = 16.05
2022-01-26 14:17:21.393 | DEBUG    | __main__:trials:26 - Trial = 11622/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.394 | DEBUG    | __main__:trials:29 - Trial = 11622/30000 | Total reward = 20.97
2022-01-26 14:17:21.398 | DEBUG    | __main__:trials:24 - Trial = 11623/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.399 | DEBUG    | __main__:trials:29 - Trial = 11623/30000 | Total reward = 48.80
2022-01-26 14:17:21.403 | DEBUG    | __main__:trials:24 - Trial = 11624/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.405 | DEBUG    | __main__:trials:29 - Trial = 11624/30000 | Total reward = 25.18
2022-01-26 14:17:21.408 | DEBUG    | __main__:trials:26 - Trial = 11625/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.410 | DEBUG    | __main__:trials:29 - Trial = 11625/30000 | Total reward = 23.07
2022-01-26 14:17:21.414 | DEBUG    | __main__:trials:24 - Trial = 11626/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.415 | DEBUG    | __main__:trials:29 - Trial = 11626/30000 | Total reward = 55.90
2022-01-26 14:17:21.418 | DEBUG    | __main__:trials:24 - Trial = 11627/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.420 | DEBUG    | __main__:trials:29 - Trial = 11627/30000 | Total reward = 24.97
2022-01-26 14:17:21.424 | DEBUG    | __main__:trials:24 - Trial = 11628/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.425 | DEBUG    | __main__:trials:29 - Trial = 11628/30000 | Total reward = 30.28
2022-01-26 14:17:21.428 | DEBUG    | __main__:trials:24 - Trial = 11629/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.430 | DEBUG    | __main__:trials:29 - Trial = 11629/30000 | Total reward = 29.26
2022-01-26 14:17:21.434 | DEBUG    | __main__:trials:24 - Trial = 11630/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.435 | DEBUG    | __main__:trials:29 - Trial = 11630/30000 | Total reward = 29.05
2022-01-26 14:17:21.438 | DEBUG    | __main__:trials:24 - Trial = 11631/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.440 | DEBUG    | __main__:trials:29 - Trial = 11631/30000 | Total reward = 25.80
2022-01-26 14:17:21.444 | DEBUG    | __main__:trials:24 - Trial = 11632/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.445 | DEBUG    | __main__:trials:29 - Trial = 11632/30000 | Total reward = 29.27
2022-01-26 14:17:21.449 | DEBUG    | __main__:trials:24 - Trial = 11633/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.450 | DEBUG    | __main__:trials:29 - Trial = 11633/30000 | Total reward = 60.59
2022-01-26 14:17:21.454 | DEBUG    | __main__:trials:24 - Trial = 11634/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.455 | DEBUG    | __main__:trials:29 - Trial = 11634/30000 | Total reward = 29.53
2022-01-26 14:17:21.459 | DEBUG    | __main__:trials:24 - Trial = 11635/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.460 | DEBUG    | __main__:trials:29 - Trial = 11635/30000 | Total reward = 30.17
2022-01-26 14:17:21.464 | DEBUG    | __main__:trials:24 - Trial = 11636/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.466 | DEBUG    | __main__:trials:29 - Trial = 11636/30000 | Total reward = 35.77
2022-01-26 14:17:21.470 | DEBUG    | __main__:trials:24 - Trial = 11637/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.471 | DEBUG    | __main__:trials:29 - Trial = 11637/30000 | Total reward = 11.06
2022-01-26 14:17:21.474 | DEBUG    | __main__:trials:24 - Trial = 11638/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.476 | DEBUG    | __main__:trials:29 - Trial = 11638/30000 | Total reward = 58.63
2022-01-26 14:17:21.479 | DEBUG    | __main__:trials:26 - Trial = 11639/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.480 | DEBUG    | __main__:trials:29 - Trial = 11639/30000 | Total reward = 10.09
2022-01-26 14:17:21.484 | DEBUG    | __main__:trials:24 - Trial = 11640/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.486 | DEBUG    | __main__:trials:29 - Trial = 11640/30000 | Total reward = 42.40
2022-01-26 14:17:21.489 | DEBUG    | __main__:trials:24 - Trial = 11641/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.491 | DEBUG    | __main__:trials:29 - Trial = 11641/30000 | Total reward = 46.22
2022-01-26 14:17:21.494 | DEBUG    | __main__:trials:24 - Trial = 11642/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.496 | DEBUG    | __main__:trials:29 - Trial = 11642/30000 | Total reward = 25.23
2022-01-26 14:17:21.500 | DEBUG    | __main__:trials:24 - Trial = 11643/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.501 | DEBUG    | __main__:trials:29 - Trial = 11643/30000 | Total reward = -3.27
2022-01-26 14:17:21.504 | DEBUG    | __main__:trials:24 - Trial = 11644/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.506 | DEBUG    | __main__:trials:29 - Trial = 11644/30000 | Total reward = 51.82
2022-01-26 14:17:21.510 | DEBUG    | __main__:trials:24 - Trial = 11645/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.511 | DEBUG    | __main__:trials:29 - Trial = 11645/30000 | Total reward = 21.33
2022-01-26 14:17:21.515 | DEBUG    | __main__:trials:24 - Trial = 11646/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.517 | DEBUG    | __main__:trials:29 - Trial = 11646/30000 | Total reward = 41.31
2022-01-26 14:17:21.520 | DEBUG    | __main__:trials:24 - Trial = 11647/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.521 | DEBUG    | __main__:trials:29 - Trial = 11647/30000 | Total reward = 29.61
2022-01-26 14:17:21.525 | DEBUG    | __main__:trials:24 - Trial = 11648/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.527 | DEBUG    | __main__:trials:29 - Trial = 11648/30000 | Total reward = 26.99
2022-01-26 14:17:21.531 | DEBUG    | __main__:trials:24 - Trial = 11649/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.532 | DEBUG    | __main__:trials:29 - Trial = 11649/30000 | Total reward = 43.09
2022-01-26 14:17:21.535 | DEBUG    | __main__:trials:24 - Trial = 11650/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.537 | DEBUG    | __main__:trials:29 - Trial = 11650/30000 | Total reward = 42.82
2022-01-26 14:17:21.541 | DEBUG    | __main__:trials:24 - Trial = 11651/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.542 | DEBUG    | __main__:trials:29 - Trial = 11651/30000 | Total reward = 29.22
2022-01-26 14:17:21.546 | DEBUG    | __main__:trials:24 - Trial = 11652/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.548 | DEBUG    | __main__:trials:29 - Trial = 11652/30000 | Total reward = 29.22
2022-01-26 14:17:21.552 | DEBUG    | __main__:trials:24 - Trial = 11653/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.553 | DEBUG    | __main__:trials:29 - Trial = 11653/30000 | Total reward = 30.09
2022-01-26 14:17:21.556 | DEBUG    | __main__:trials:24 - Trial = 11654/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.557 | DEBUG    | __main__:trials:29 - Trial = 11654/30000 | Total reward = 29.22
2022-01-26 14:17:21.561 | DEBUG    | __main__:trials:24 - Trial = 11655/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.562 | DEBUG    | __main__:trials:29 - Trial = 11655/30000 | Total reward = 27.86
2022-01-26 14:17:21.565 | DEBUG    | __main__:trials:24 - Trial = 11656/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.567 | DEBUG    | __main__:trials:29 - Trial = 11656/30000 | Total reward = 29.57
2022-01-26 14:17:21.571 | DEBUG    | __main__:trials:24 - Trial = 11657/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.573 | DEBUG    | __main__:trials:29 - Trial = 11657/30000 | Total reward = 27.41
2022-01-26 14:17:21.576 | DEBUG    | __main__:trials:24 - Trial = 11658/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.578 | DEBUG    | __main__:trials:29 - Trial = 11658/30000 | Total reward = 63.36
2022-01-26 14:17:21.581 | DEBUG    | __main__:trials:24 - Trial = 11659/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.583 | DEBUG    | __main__:trials:29 - Trial = 11659/30000 | Total reward = 29.85
2022-01-26 14:17:21.587 | DEBUG    | __main__:trials:24 - Trial = 11660/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.588 | DEBUG    | __main__:trials:29 - Trial = 11660/30000 | Total reward = 29.46
2022-01-26 14:17:21.592 | DEBUG    | __main__:trials:24 - Trial = 11661/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.593 | DEBUG    | __main__:trials:29 - Trial = 11661/30000 | Total reward = 33.02
2022-01-26 14:17:21.597 | DEBUG    | __main__:trials:24 - Trial = 11662/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.598 | DEBUG    | __main__:trials:29 - Trial = 11662/30000 | Total reward = 23.56
2022-01-26 14:17:21.602 | DEBUG    | __main__:trials:24 - Trial = 11663/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.604 | DEBUG    | __main__:trials:29 - Trial = 11663/30000 | Total reward = 52.54
2022-01-26 14:17:21.607 | DEBUG    | __main__:trials:24 - Trial = 11664/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.609 | DEBUG    | __main__:trials:29 - Trial = 11664/30000 | Total reward = 31.85
2022-01-26 14:17:21.612 | DEBUG    | __main__:trials:24 - Trial = 11665/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.613 | DEBUG    | __main__:trials:29 - Trial = 11665/30000 | Total reward = 59.28
2022-01-26 14:17:21.616 | DEBUG    | __main__:trials:24 - Trial = 11666/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.618 | DEBUG    | __main__:trials:29 - Trial = 11666/30000 | Total reward = 35.34
2022-01-26 14:17:21.622 | DEBUG    | __main__:trials:24 - Trial = 11667/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.623 | DEBUG    | __main__:trials:29 - Trial = 11667/30000 | Total reward = 32.15
2022-01-26 14:17:21.626 | DEBUG    | __main__:trials:24 - Trial = 11668/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.628 | DEBUG    | __main__:trials:29 - Trial = 11668/30000 | Total reward = 28.16
2022-01-26 14:17:21.631 | DEBUG    | __main__:trials:24 - Trial = 11669/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.633 | DEBUG    | __main__:trials:29 - Trial = 11669/30000 | Total reward = 42.93
2022-01-26 14:17:21.636 | DEBUG    | __main__:trials:24 - Trial = 11670/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.638 | DEBUG    | __main__:trials:29 - Trial = 11670/30000 | Total reward = 36.03
2022-01-26 14:17:21.642 | DEBUG    | __main__:trials:24 - Trial = 11671/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.643 | DEBUG    | __main__:trials:29 - Trial = 11671/30000 | Total reward = 28.68
2022-01-26 14:17:21.647 | DEBUG    | __main__:trials:24 - Trial = 11672/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.649 | DEBUG    | __main__:trials:29 - Trial = 11672/30000 | Total reward = 29.26
2022-01-26 14:17:21.652 | DEBUG    | __main__:trials:24 - Trial = 11673/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.654 | DEBUG    | __main__:trials:29 - Trial = 11673/30000 | Total reward = 34.50
2022-01-26 14:17:21.658 | DEBUG    | __main__:trials:24 - Trial = 11674/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.659 | DEBUG    | __main__:trials:29 - Trial = 11674/30000 | Total reward = 41.42
2022-01-26 14:17:21.663 | DEBUG    | __main__:trials:24 - Trial = 11675/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.664 | DEBUG    | __main__:trials:29 - Trial = 11675/30000 | Total reward = 45.53
2022-01-26 14:17:21.667 | DEBUG    | __main__:trials:26 - Trial = 11676/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.668 | DEBUG    | __main__:trials:29 - Trial = 11676/30000 | Total reward = 12.15
2022-01-26 14:17:21.672 | DEBUG    | __main__:trials:24 - Trial = 11677/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.674 | DEBUG    | __main__:trials:29 - Trial = 11677/30000 | Total reward = 27.57
2022-01-26 14:17:21.677 | DEBUG    | __main__:trials:26 - Trial = 11678/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.679 | DEBUG    | __main__:trials:29 - Trial = 11678/30000 | Total reward = 24.15
2022-01-26 14:17:21.683 | DEBUG    | __main__:trials:24 - Trial = 11679/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.684 | DEBUG    | __main__:trials:29 - Trial = 11679/30000 | Total reward = 24.06
2022-01-26 14:17:21.688 | DEBUG    | __main__:trials:26 - Trial = 11680/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.689 | DEBUG    | __main__:trials:29 - Trial = 11680/30000 | Total reward = 25.96
2022-01-26 14:17:21.693 | DEBUG    | __main__:trials:24 - Trial = 11681/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.695 | DEBUG    | __main__:trials:29 - Trial = 11681/30000 | Total reward = 33.19
2022-01-26 14:17:21.697 | DEBUG    | __main__:trials:26 - Trial = 11682/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.698 | DEBUG    | __main__:trials:29 - Trial = 11682/30000 | Total reward = 16.46
2022-01-26 14:17:21.701 | DEBUG    | __main__:trials:24 - Trial = 11683/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.703 | DEBUG    | __main__:trials:29 - Trial = 11683/30000 | Total reward = 31.97
2022-01-26 14:17:21.706 | DEBUG    | __main__:trials:24 - Trial = 11684/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.708 | DEBUG    | __main__:trials:29 - Trial = 11684/30000 | Total reward = 28.34
2022-01-26 14:17:21.712 | DEBUG    | __main__:trials:24 - Trial = 11685/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.713 | DEBUG    | __main__:trials:29 - Trial = 11685/30000 | Total reward = 28.98
2022-01-26 14:17:21.716 | DEBUG    | __main__:trials:26 - Trial = 11686/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.717 | DEBUG    | __main__:trials:29 - Trial = 11686/30000 | Total reward = 5.12
2022-01-26 14:17:21.720 | DEBUG    | __main__:trials:24 - Trial = 11687/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.722 | DEBUG    | __main__:trials:29 - Trial = 11687/30000 | Total reward = 28.74
2022-01-26 14:17:21.726 | DEBUG    | __main__:trials:24 - Trial = 11688/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.727 | DEBUG    | __main__:trials:29 - Trial = 11688/30000 | Total reward = 29.85
2022-01-26 14:17:21.731 | DEBUG    | __main__:trials:24 - Trial = 11689/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.733 | DEBUG    | __main__:trials:29 - Trial = 11689/30000 | Total reward = 26.67
2022-01-26 14:17:21.736 | DEBUG    | __main__:trials:24 - Trial = 11690/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.737 | DEBUG    | __main__:trials:29 - Trial = 11690/30000 | Total reward = 27.70
2022-01-26 14:17:21.740 | DEBUG    | __main__:trials:26 - Trial = 11691/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.741 | DEBUG    | __main__:trials:29 - Trial = 11691/30000 | Total reward = 7.12
2022-01-26 14:17:21.745 | DEBUG    | __main__:trials:24 - Trial = 11692/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.746 | DEBUG    | __main__:trials:29 - Trial = 11692/30000 | Total reward = 31.73
2022-01-26 14:17:21.749 | DEBUG    | __main__:trials:24 - Trial = 11693/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.750 | DEBUG    | __main__:trials:29 - Trial = 11693/30000 | Total reward = 50.58
2022-01-26 14:17:21.753 | DEBUG    | __main__:trials:24 - Trial = 11694/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.755 | DEBUG    | __main__:trials:29 - Trial = 11694/30000 | Total reward = 35.23
2022-01-26 14:17:21.758 | DEBUG    | __main__:trials:24 - Trial = 11695/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.759 | DEBUG    | __main__:trials:29 - Trial = 11695/30000 | Total reward = 47.01
2022-01-26 14:17:21.763 | DEBUG    | __main__:trials:24 - Trial = 11696/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.765 | DEBUG    | __main__:trials:29 - Trial = 11696/30000 | Total reward = 59.10
2022-01-26 14:17:21.768 | DEBUG    | __main__:trials:24 - Trial = 11697/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.770 | DEBUG    | __main__:trials:29 - Trial = 11697/30000 | Total reward = 29.07
2022-01-26 14:17:21.774 | DEBUG    | __main__:trials:24 - Trial = 11698/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.775 | DEBUG    | __main__:trials:29 - Trial = 11698/30000 | Total reward = 38.23
2022-01-26 14:17:21.779 | DEBUG    | __main__:trials:24 - Trial = 11699/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.780 | DEBUG    | __main__:trials:29 - Trial = 11699/30000 | Total reward = 58.70
2022-01-26 14:17:21.784 | DEBUG    | __main__:trials:24 - Trial = 11700/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.786 | DEBUG    | __main__:trials:29 - Trial = 11700/30000 | Total reward = 67.07
2022-01-26 14:17:21.789 | DEBUG    | __main__:trials:24 - Trial = 11701/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.791 | DEBUG    | __main__:trials:29 - Trial = 11701/30000 | Total reward = 65.80
2022-01-26 14:17:21.795 | DEBUG    | __main__:trials:24 - Trial = 11702/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.796 | DEBUG    | __main__:trials:29 - Trial = 11702/30000 | Total reward = 53.70
2022-01-26 14:17:21.800 | DEBUG    | __main__:trials:24 - Trial = 11703/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.801 | DEBUG    | __main__:trials:29 - Trial = 11703/30000 | Total reward = 42.92
2022-01-26 14:17:21.805 | DEBUG    | __main__:trials:24 - Trial = 11704/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.807 | DEBUG    | __main__:trials:29 - Trial = 11704/30000 | Total reward = 60.59
2022-01-26 14:17:21.810 | DEBUG    | __main__:trials:24 - Trial = 11705/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.812 | DEBUG    | __main__:trials:29 - Trial = 11705/30000 | Total reward = 53.56
2022-01-26 14:17:21.816 | DEBUG    | __main__:trials:24 - Trial = 11706/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.818 | DEBUG    | __main__:trials:29 - Trial = 11706/30000 | Total reward = 43.52
2022-01-26 14:17:21.821 | DEBUG    | __main__:trials:24 - Trial = 11707/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.822 | DEBUG    | __main__:trials:29 - Trial = 11707/30000 | Total reward = 27.11
2022-01-26 14:17:21.826 | DEBUG    | __main__:trials:24 - Trial = 11708/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.828 | DEBUG    | __main__:trials:29 - Trial = 11708/30000 | Total reward = 25.11
2022-01-26 14:17:21.831 | DEBUG    | __main__:trials:24 - Trial = 11709/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.833 | DEBUG    | __main__:trials:29 - Trial = 11709/30000 | Total reward = 29.22
2022-01-26 14:17:21.837 | DEBUG    | __main__:trials:24 - Trial = 11710/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.837 | DEBUG    | __main__:trials:29 - Trial = 11710/30000 | Total reward = 35.71
2022-01-26 14:17:21.842 | DEBUG    | __main__:trials:24 - Trial = 11711/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.842 | DEBUG    | __main__:trials:29 - Trial = 11711/30000 | Total reward = 29.30
2022-01-26 14:17:21.847 | DEBUG    | __main__:trials:24 - Trial = 11712/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.848 | DEBUG    | __main__:trials:29 - Trial = 11712/30000 | Total reward = 40.80
2022-01-26 14:17:21.852 | DEBUG    | __main__:trials:24 - Trial = 11713/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.853 | DEBUG    | __main__:trials:29 - Trial = 11713/30000 | Total reward = 28.62
2022-01-26 14:17:21.857 | DEBUG    | __main__:trials:24 - Trial = 11714/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.859 | DEBUG    | __main__:trials:29 - Trial = 11714/30000 | Total reward = 29.14
2022-01-26 14:17:21.862 | DEBUG    | __main__:trials:26 - Trial = 11715/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.864 | DEBUG    | __main__:trials:29 - Trial = 11715/30000 | Total reward = 21.76
2022-01-26 14:17:21.868 | DEBUG    | __main__:trials:24 - Trial = 11716/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.869 | DEBUG    | __main__:trials:29 - Trial = 11716/30000 | Total reward = 24.52
2022-01-26 14:17:21.873 | DEBUG    | __main__:trials:24 - Trial = 11717/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.874 | DEBUG    | __main__:trials:29 - Trial = 11717/30000 | Total reward = 47.05
2022-01-26 14:17:21.878 | DEBUG    | __main__:trials:24 - Trial = 11718/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.880 | DEBUG    | __main__:trials:29 - Trial = 11718/30000 | Total reward = 41.43
2022-01-26 14:17:21.883 | DEBUG    | __main__:trials:24 - Trial = 11719/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.885 | DEBUG    | __main__:trials:29 - Trial = 11719/30000 | Total reward = 25.30
2022-01-26 14:17:21.888 | DEBUG    | __main__:trials:24 - Trial = 11720/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.890 | DEBUG    | __main__:trials:29 - Trial = 11720/30000 | Total reward = 29.08
2022-01-26 14:17:21.894 | DEBUG    | __main__:trials:24 - Trial = 11721/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.894 | DEBUG    | __main__:trials:29 - Trial = 11721/30000 | Total reward = 61.16
2022-01-26 14:17:21.898 | DEBUG    | __main__:trials:24 - Trial = 11722/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.899 | DEBUG    | __main__:trials:29 - Trial = 11722/30000 | Total reward = 40.78
2022-01-26 14:17:21.903 | DEBUG    | __main__:trials:24 - Trial = 11723/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.905 | DEBUG    | __main__:trials:29 - Trial = 11723/30000 | Total reward = 41.08
2022-01-26 14:17:21.908 | DEBUG    | __main__:trials:24 - Trial = 11724/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.910 | DEBUG    | __main__:trials:29 - Trial = 11724/30000 | Total reward = 40.31
2022-01-26 14:17:21.914 | DEBUG    | __main__:trials:24 - Trial = 11725/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.915 | DEBUG    | __main__:trials:29 - Trial = 11725/30000 | Total reward = 43.00
2022-01-26 14:17:21.919 | DEBUG    | __main__:trials:24 - Trial = 11726/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.920 | DEBUG    | __main__:trials:29 - Trial = 11726/30000 | Total reward = 34.19
2022-01-26 14:17:21.924 | DEBUG    | __main__:trials:24 - Trial = 11727/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.926 | DEBUG    | __main__:trials:29 - Trial = 11727/30000 | Total reward = 32.40
2022-01-26 14:17:21.929 | DEBUG    | __main__:trials:24 - Trial = 11728/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.931 | DEBUG    | __main__:trials:29 - Trial = 11728/30000 | Total reward = 29.62
2022-01-26 14:17:21.935 | DEBUG    | __main__:trials:24 - Trial = 11729/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.936 | DEBUG    | __main__:trials:29 - Trial = 11729/30000 | Total reward = 38.79
2022-01-26 14:17:21.940 | DEBUG    | __main__:trials:24 - Trial = 11730/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.941 | DEBUG    | __main__:trials:29 - Trial = 11730/30000 | Total reward = 25.61
2022-01-26 14:17:21.945 | DEBUG    | __main__:trials:24 - Trial = 11731/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.946 | DEBUG    | __main__:trials:29 - Trial = 11731/30000 | Total reward = 30.51
2022-01-26 14:17:21.950 | DEBUG    | __main__:trials:24 - Trial = 11732/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.951 | DEBUG    | __main__:trials:29 - Trial = 11732/30000 | Total reward = 31.03
2022-01-26 14:17:21.955 | DEBUG    | __main__:trials:24 - Trial = 11733/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.957 | DEBUG    | __main__:trials:29 - Trial = 11733/30000 | Total reward = 46.81
2022-01-26 14:17:21.960 | DEBUG    | __main__:trials:24 - Trial = 11734/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.962 | DEBUG    | __main__:trials:29 - Trial = 11734/30000 | Total reward = 29.22
2022-01-26 14:17:21.966 | DEBUG    | __main__:trials:24 - Trial = 11735/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.967 | DEBUG    | __main__:trials:29 - Trial = 11735/30000 | Total reward = 31.69
2022-01-26 14:17:21.971 | DEBUG    | __main__:trials:26 - Trial = 11736/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:21.972 | DEBUG    | __main__:trials:29 - Trial = 11736/30000 | Total reward = 18.94
2022-01-26 14:17:21.976 | DEBUG    | __main__:trials:24 - Trial = 11737/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.977 | DEBUG    | __main__:trials:29 - Trial = 11737/30000 | Total reward = 42.88
2022-01-26 14:17:21.981 | DEBUG    | __main__:trials:24 - Trial = 11738/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.983 | DEBUG    | __main__:trials:29 - Trial = 11738/30000 | Total reward = 36.63
2022-01-26 14:17:21.986 | DEBUG    | __main__:trials:24 - Trial = 11739/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.988 | DEBUG    | __main__:trials:29 - Trial = 11739/30000 | Total reward = 29.44
2022-01-26 14:17:21.991 | DEBUG    | __main__:trials:24 - Trial = 11740/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.993 | DEBUG    | __main__:trials:29 - Trial = 11740/30000 | Total reward = 30.92
2022-01-26 14:17:21.996 | DEBUG    | __main__:trials:24 - Trial = 11741/30000 | Max number of steps (20) reached
2022-01-26 14:17:21.998 | DEBUG    | __main__:trials:29 - Trial = 11741/30000 | Total reward = 53.81
2022-01-26 14:17:22.001 | DEBUG    | __main__:trials:24 - Trial = 11742/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.003 | DEBUG    | __main__:trials:29 - Trial = 11742/30000 | Total reward = 43.94
2022-01-26 14:17:22.006 | DEBUG    | __main__:trials:24 - Trial = 11743/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.007 | DEBUG    | __main__:trials:29 - Trial = 11743/30000 | Total reward = 38.57
2022-01-26 14:17:22.011 | DEBUG    | __main__:trials:24 - Trial = 11744/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.012 | DEBUG    | __main__:trials:29 - Trial = 11744/30000 | Total reward = 27.26
2022-01-26 14:17:22.016 | DEBUG    | __main__:trials:24 - Trial = 11745/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.018 | DEBUG    | __main__:trials:29 - Trial = 11745/30000 | Total reward = 22.95
2022-01-26 14:17:22.021 | DEBUG    | __main__:trials:24 - Trial = 11746/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.022 | DEBUG    | __main__:trials:29 - Trial = 11746/30000 | Total reward = 30.23
2022-01-26 14:17:22.026 | DEBUG    | __main__:trials:24 - Trial = 11747/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.028 | DEBUG    | __main__:trials:29 - Trial = 11747/30000 | Total reward = 32.22
2022-01-26 14:17:22.031 | DEBUG    | __main__:trials:24 - Trial = 11748/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.033 | DEBUG    | __main__:trials:29 - Trial = 11748/30000 | Total reward = 40.74
2022-01-26 14:17:22.037 | DEBUG    | __main__:trials:24 - Trial = 11749/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.038 | DEBUG    | __main__:trials:29 - Trial = 11749/30000 | Total reward = 47.79
2022-01-26 14:17:22.042 | DEBUG    | __main__:trials:24 - Trial = 11750/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.043 | DEBUG    | __main__:trials:29 - Trial = 11750/30000 | Total reward = 58.79
2022-01-26 14:17:22.047 | DEBUG    | __main__:trials:24 - Trial = 11751/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.049 | DEBUG    | __main__:trials:29 - Trial = 11751/30000 | Total reward = 51.11
2022-01-26 14:17:22.053 | DEBUG    | __main__:trials:24 - Trial = 11752/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.055 | DEBUG    | __main__:trials:29 - Trial = 11752/30000 | Total reward = 58.10
2022-01-26 14:17:22.058 | DEBUG    | __main__:trials:24 - Trial = 11753/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.059 | DEBUG    | __main__:trials:29 - Trial = 11753/30000 | Total reward = 46.78
2022-01-26 14:17:22.063 | DEBUG    | __main__:trials:24 - Trial = 11754/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.064 | DEBUG    | __main__:trials:29 - Trial = 11754/30000 | Total reward = 36.85
2022-01-26 14:17:22.068 | DEBUG    | __main__:trials:24 - Trial = 11755/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.070 | DEBUG    | __main__:trials:29 - Trial = 11755/30000 | Total reward = 62.32
2022-01-26 14:17:22.073 | DEBUG    | __main__:trials:24 - Trial = 11756/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.075 | DEBUG    | __main__:trials:29 - Trial = 11756/30000 | Total reward = 39.92
2022-01-26 14:17:22.079 | DEBUG    | __main__:trials:24 - Trial = 11757/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.080 | DEBUG    | __main__:trials:29 - Trial = 11757/30000 | Total reward = 33.35
2022-01-26 14:17:22.084 | DEBUG    | __main__:trials:24 - Trial = 11758/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.086 | DEBUG    | __main__:trials:29 - Trial = 11758/30000 | Total reward = 31.48
2022-01-26 14:17:22.090 | DEBUG    | __main__:trials:24 - Trial = 11759/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.091 | DEBUG    | __main__:trials:29 - Trial = 11759/30000 | Total reward = 50.78
2022-01-26 14:17:22.095 | DEBUG    | __main__:trials:24 - Trial = 11760/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.097 | DEBUG    | __main__:trials:29 - Trial = 11760/30000 | Total reward = 35.38
2022-01-26 14:17:22.100 | DEBUG    | __main__:trials:24 - Trial = 11761/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.102 | DEBUG    | __main__:trials:29 - Trial = 11761/30000 | Total reward = 45.74
2022-01-26 14:17:22.105 | DEBUG    | __main__:trials:24 - Trial = 11762/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.107 | DEBUG    | __main__:trials:29 - Trial = 11762/30000 | Total reward = 35.84
2022-01-26 14:17:22.111 | DEBUG    | __main__:trials:24 - Trial = 11763/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.112 | DEBUG    | __main__:trials:29 - Trial = 11763/30000 | Total reward = 37.27
2022-01-26 14:17:22.116 | DEBUG    | __main__:trials:26 - Trial = 11764/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.118 | DEBUG    | __main__:trials:29 - Trial = 11764/30000 | Total reward = 39.32
2022-01-26 14:17:22.121 | DEBUG    | __main__:trials:24 - Trial = 11765/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.122 | DEBUG    | __main__:trials:29 - Trial = 11765/30000 | Total reward = 46.65
2022-01-26 14:17:22.127 | DEBUG    | __main__:trials:24 - Trial = 11766/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.128 | DEBUG    | __main__:trials:29 - Trial = 11766/30000 | Total reward = 47.69
2022-01-26 14:17:22.132 | DEBUG    | __main__:trials:24 - Trial = 11767/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.133 | DEBUG    | __main__:trials:29 - Trial = 11767/30000 | Total reward = 47.09
2022-01-26 14:17:22.136 | DEBUG    | __main__:trials:24 - Trial = 11768/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.138 | DEBUG    | __main__:trials:29 - Trial = 11768/30000 | Total reward = 47.84
2022-01-26 14:17:22.142 | DEBUG    | __main__:trials:24 - Trial = 11769/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.143 | DEBUG    | __main__:trials:29 - Trial = 11769/30000 | Total reward = 31.19
2022-01-26 14:17:22.147 | DEBUG    | __main__:trials:24 - Trial = 11770/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.149 | DEBUG    | __main__:trials:29 - Trial = 11770/30000 | Total reward = 51.97
2022-01-26 14:17:22.152 | DEBUG    | __main__:trials:24 - Trial = 11771/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.154 | DEBUG    | __main__:trials:29 - Trial = 11771/30000 | Total reward = 45.74
2022-01-26 14:17:22.157 | DEBUG    | __main__:trials:24 - Trial = 11772/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.158 | DEBUG    | __main__:trials:29 - Trial = 11772/30000 | Total reward = 32.03
2022-01-26 14:17:22.162 | DEBUG    | __main__:trials:24 - Trial = 11773/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.163 | DEBUG    | __main__:trials:29 - Trial = 11773/30000 | Total reward = 31.12
2022-01-26 14:17:22.167 | DEBUG    | __main__:trials:24 - Trial = 11774/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.169 | DEBUG    | __main__:trials:29 - Trial = 11774/30000 | Total reward = 56.19
2022-01-26 14:17:22.172 | DEBUG    | __main__:trials:24 - Trial = 11775/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.174 | DEBUG    | __main__:trials:29 - Trial = 11775/30000 | Total reward = 48.42
2022-01-26 14:17:22.177 | DEBUG    | __main__:trials:26 - Trial = 11776/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.179 | DEBUG    | __main__:trials:29 - Trial = 11776/30000 | Total reward = 16.32
2022-01-26 14:17:22.182 | DEBUG    | __main__:trials:24 - Trial = 11777/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.184 | DEBUG    | __main__:trials:29 - Trial = 11777/30000 | Total reward = 46.88
2022-01-26 14:17:22.187 | DEBUG    | __main__:trials:24 - Trial = 11778/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.189 | DEBUG    | __main__:trials:29 - Trial = 11778/30000 | Total reward = 16.42
2022-01-26 14:17:22.192 | DEBUG    | __main__:trials:24 - Trial = 11779/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.194 | DEBUG    | __main__:trials:29 - Trial = 11779/30000 | Total reward = 41.28
2022-01-26 14:17:22.198 | DEBUG    | __main__:trials:24 - Trial = 11780/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.198 | DEBUG    | __main__:trials:29 - Trial = 11780/30000 | Total reward = 44.12
2022-01-26 14:17:22.202 | DEBUG    | __main__:trials:24 - Trial = 11781/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.204 | DEBUG    | __main__:trials:29 - Trial = 11781/30000 | Total reward = 40.93
2022-01-26 14:17:22.208 | DEBUG    | __main__:trials:24 - Trial = 11782/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.209 | DEBUG    | __main__:trials:29 - Trial = 11782/30000 | Total reward = 62.61
2022-01-26 14:17:22.213 | DEBUG    | __main__:trials:24 - Trial = 11783/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.214 | DEBUG    | __main__:trials:29 - Trial = 11783/30000 | Total reward = 42.41
2022-01-26 14:17:22.218 | DEBUG    | __main__:trials:24 - Trial = 11784/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.219 | DEBUG    | __main__:trials:29 - Trial = 11784/30000 | Total reward = 40.48
2022-01-26 14:17:22.223 | DEBUG    | __main__:trials:24 - Trial = 11785/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.224 | DEBUG    | __main__:trials:29 - Trial = 11785/30000 | Total reward = 56.37
2022-01-26 14:17:22.228 | DEBUG    | __main__:trials:24 - Trial = 11786/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.230 | DEBUG    | __main__:trials:29 - Trial = 11786/30000 | Total reward = 40.82
2022-01-26 14:17:22.233 | DEBUG    | __main__:trials:24 - Trial = 11787/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.235 | DEBUG    | __main__:trials:29 - Trial = 11787/30000 | Total reward = 33.82
2022-01-26 14:17:22.238 | DEBUG    | __main__:trials:24 - Trial = 11788/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.240 | DEBUG    | __main__:trials:29 - Trial = 11788/30000 | Total reward = 53.51
2022-01-26 14:17:22.243 | DEBUG    | __main__:trials:24 - Trial = 11789/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.245 | DEBUG    | __main__:trials:29 - Trial = 11789/30000 | Total reward = 47.83
2022-01-26 14:17:22.248 | DEBUG    | __main__:trials:24 - Trial = 11790/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.250 | DEBUG    | __main__:trials:29 - Trial = 11790/30000 | Total reward = 38.82
2022-01-26 14:17:22.253 | DEBUG    | __main__:trials:24 - Trial = 11791/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.254 | DEBUG    | __main__:trials:29 - Trial = 11791/30000 | Total reward = 53.53
2022-01-26 14:17:22.257 | DEBUG    | __main__:trials:24 - Trial = 11792/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.259 | DEBUG    | __main__:trials:29 - Trial = 11792/30000 | Total reward = 32.57
2022-01-26 14:17:22.262 | DEBUG    | __main__:trials:24 - Trial = 11793/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.264 | DEBUG    | __main__:trials:29 - Trial = 11793/30000 | Total reward = 32.75
2022-01-26 14:17:22.268 | DEBUG    | __main__:trials:24 - Trial = 11794/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.269 | DEBUG    | __main__:trials:29 - Trial = 11794/30000 | Total reward = 49.63
2022-01-26 14:17:22.273 | DEBUG    | __main__:trials:24 - Trial = 11795/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.273 | DEBUG    | __main__:trials:29 - Trial = 11795/30000 | Total reward = 58.58
2022-01-26 14:17:22.277 | DEBUG    | __main__:trials:24 - Trial = 11796/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.278 | DEBUG    | __main__:trials:29 - Trial = 11796/30000 | Total reward = 61.08
2022-01-26 14:17:22.281 | DEBUG    | __main__:trials:24 - Trial = 11797/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.283 | DEBUG    | __main__:trials:29 - Trial = 11797/30000 | Total reward = 40.94
2022-01-26 14:17:22.287 | DEBUG    | __main__:trials:24 - Trial = 11798/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.289 | DEBUG    | __main__:trials:29 - Trial = 11798/30000 | Total reward = 40.23
2022-01-26 14:17:22.292 | DEBUG    | __main__:trials:24 - Trial = 11799/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.293 | DEBUG    | __main__:trials:29 - Trial = 11799/30000 | Total reward = 32.06
2022-01-26 14:17:22.297 | DEBUG    | __main__:trials:24 - Trial = 11800/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.298 | DEBUG    | __main__:trials:29 - Trial = 11800/30000 | Total reward = 49.15
2022-01-26 14:17:22.302 | DEBUG    | __main__:trials:26 - Trial = 11801/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.304 | DEBUG    | __main__:trials:29 - Trial = 11801/30000 | Total reward = 19.44
2022-01-26 14:17:22.307 | DEBUG    | __main__:trials:24 - Trial = 11802/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.309 | DEBUG    | __main__:trials:29 - Trial = 11802/30000 | Total reward = 39.85
2022-01-26 14:17:22.312 | DEBUG    | __main__:trials:24 - Trial = 11803/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.314 | DEBUG    | __main__:trials:29 - Trial = 11803/30000 | Total reward = 38.36
2022-01-26 14:17:22.317 | DEBUG    | __main__:trials:24 - Trial = 11804/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.318 | DEBUG    | __main__:trials:29 - Trial = 11804/30000 | Total reward = 25.12
2022-01-26 14:17:22.322 | DEBUG    | __main__:trials:24 - Trial = 11805/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.323 | DEBUG    | __main__:trials:29 - Trial = 11805/30000 | Total reward = 39.75
2022-01-26 14:17:22.327 | DEBUG    | __main__:trials:24 - Trial = 11806/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.329 | DEBUG    | __main__:trials:29 - Trial = 11806/30000 | Total reward = 46.16
2022-01-26 14:17:22.333 | DEBUG    | __main__:trials:24 - Trial = 11807/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.334 | DEBUG    | __main__:trials:29 - Trial = 11807/30000 | Total reward = 37.14
2022-01-26 14:17:22.338 | DEBUG    | __main__:trials:24 - Trial = 11808/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.339 | DEBUG    | __main__:trials:29 - Trial = 11808/30000 | Total reward = 25.12
2022-01-26 14:17:22.342 | DEBUG    | __main__:trials:24 - Trial = 11809/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.344 | DEBUG    | __main__:trials:29 - Trial = 11809/30000 | Total reward = 20.47
2022-01-26 14:17:22.347 | DEBUG    | __main__:trials:24 - Trial = 11810/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.349 | DEBUG    | __main__:trials:29 - Trial = 11810/30000 | Total reward = 44.85
2022-01-26 14:17:22.352 | DEBUG    | __main__:trials:24 - Trial = 11811/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.353 | DEBUG    | __main__:trials:29 - Trial = 11811/30000 | Total reward = 26.70
2022-01-26 14:17:22.356 | DEBUG    | __main__:trials:24 - Trial = 11812/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.357 | DEBUG    | __main__:trials:29 - Trial = 11812/30000 | Total reward = 25.03
2022-01-26 14:17:22.360 | DEBUG    | __main__:trials:24 - Trial = 11813/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.362 | DEBUG    | __main__:trials:29 - Trial = 11813/30000 | Total reward = 41.39
2022-01-26 14:17:22.365 | DEBUG    | __main__:trials:24 - Trial = 11814/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.366 | DEBUG    | __main__:trials:29 - Trial = 11814/30000 | Total reward = 40.14
2022-01-26 14:17:22.370 | DEBUG    | __main__:trials:24 - Trial = 11815/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.372 | DEBUG    | __main__:trials:29 - Trial = 11815/30000 | Total reward = 47.16
2022-01-26 14:17:22.376 | DEBUG    | __main__:trials:24 - Trial = 11816/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.377 | DEBUG    | __main__:trials:29 - Trial = 11816/30000 | Total reward = 28.37
2022-01-26 14:17:22.380 | DEBUG    | __main__:trials:24 - Trial = 11817/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.382 | DEBUG    | __main__:trials:29 - Trial = 11817/30000 | Total reward = 38.23
2022-01-26 14:17:22.386 | DEBUG    | __main__:trials:24 - Trial = 11818/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.386 | DEBUG    | __main__:trials:29 - Trial = 11818/30000 | Total reward = 31.26
2022-01-26 14:17:22.390 | DEBUG    | __main__:trials:24 - Trial = 11819/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.392 | DEBUG    | __main__:trials:29 - Trial = 11819/30000 | Total reward = 45.88
2022-01-26 14:17:22.395 | DEBUG    | __main__:trials:24 - Trial = 11820/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.397 | DEBUG    | __main__:trials:29 - Trial = 11820/30000 | Total reward = 44.61
2022-01-26 14:17:22.400 | DEBUG    | __main__:trials:24 - Trial = 11821/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.402 | DEBUG    | __main__:trials:29 - Trial = 11821/30000 | Total reward = 33.65
2022-01-26 14:17:22.406 | DEBUG    | __main__:trials:24 - Trial = 11822/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.407 | DEBUG    | __main__:trials:29 - Trial = 11822/30000 | Total reward = 44.62
2022-01-26 14:17:22.411 | DEBUG    | __main__:trials:26 - Trial = 11823/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.412 | DEBUG    | __main__:trials:29 - Trial = 11823/30000 | Total reward = 32.56
2022-01-26 14:17:22.415 | DEBUG    | __main__:trials:24 - Trial = 11824/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.417 | DEBUG    | __main__:trials:29 - Trial = 11824/30000 | Total reward = 30.04
2022-01-26 14:17:22.421 | DEBUG    | __main__:trials:24 - Trial = 11825/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.422 | DEBUG    | __main__:trials:29 - Trial = 11825/30000 | Total reward = 42.52
2022-01-26 14:17:22.425 | DEBUG    | __main__:trials:24 - Trial = 11826/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.427 | DEBUG    | __main__:trials:29 - Trial = 11826/30000 | Total reward = 41.67
2022-01-26 14:17:22.430 | DEBUG    | __main__:trials:26 - Trial = 11827/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.432 | DEBUG    | __main__:trials:29 - Trial = 11827/30000 | Total reward = 19.64
2022-01-26 14:17:22.435 | DEBUG    | __main__:trials:24 - Trial = 11828/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.437 | DEBUG    | __main__:trials:29 - Trial = 11828/30000 | Total reward = 47.16
2022-01-26 14:17:22.440 | DEBUG    | __main__:trials:24 - Trial = 11829/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.442 | DEBUG    | __main__:trials:29 - Trial = 11829/30000 | Total reward = 45.55
2022-01-26 14:17:22.446 | DEBUG    | __main__:trials:24 - Trial = 11830/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.447 | DEBUG    | __main__:trials:29 - Trial = 11830/30000 | Total reward = 31.87
2022-01-26 14:17:22.451 | DEBUG    | __main__:trials:24 - Trial = 11831/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.452 | DEBUG    | __main__:trials:29 - Trial = 11831/30000 | Total reward = 41.14
2022-01-26 14:17:22.456 | DEBUG    | __main__:trials:24 - Trial = 11832/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.457 | DEBUG    | __main__:trials:29 - Trial = 11832/30000 | Total reward = 39.81
2022-01-26 14:17:22.461 | DEBUG    | __main__:trials:24 - Trial = 11833/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.463 | DEBUG    | __main__:trials:29 - Trial = 11833/30000 | Total reward = 29.38
2022-01-26 14:17:22.466 | DEBUG    | __main__:trials:24 - Trial = 11834/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.468 | DEBUG    | __main__:trials:29 - Trial = 11834/30000 | Total reward = 45.33
2022-01-26 14:17:22.472 | DEBUG    | __main__:trials:24 - Trial = 11835/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.473 | DEBUG    | __main__:trials:29 - Trial = 11835/30000 | Total reward = 30.27
2022-01-26 14:17:22.476 | DEBUG    | __main__:trials:24 - Trial = 11836/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.478 | DEBUG    | __main__:trials:29 - Trial = 11836/30000 | Total reward = 49.47
2022-01-26 14:17:22.482 | DEBUG    | __main__:trials:24 - Trial = 11837/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.483 | DEBUG    | __main__:trials:29 - Trial = 11837/30000 | Total reward = 35.89
2022-01-26 14:17:22.487 | DEBUG    | __main__:trials:24 - Trial = 11838/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.488 | DEBUG    | __main__:trials:29 - Trial = 11838/30000 | Total reward = 47.03
2022-01-26 14:17:22.492 | DEBUG    | __main__:trials:24 - Trial = 11839/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.493 | DEBUG    | __main__:trials:29 - Trial = 11839/30000 | Total reward = 55.90
2022-01-26 14:17:22.497 | DEBUG    | __main__:trials:24 - Trial = 11840/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.498 | DEBUG    | __main__:trials:29 - Trial = 11840/30000 | Total reward = 42.33
2022-01-26 14:17:22.502 | DEBUG    | __main__:trials:24 - Trial = 11841/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.503 | DEBUG    | __main__:trials:29 - Trial = 11841/30000 | Total reward = 31.40
2022-01-26 14:17:22.507 | DEBUG    | __main__:trials:24 - Trial = 11842/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.508 | DEBUG    | __main__:trials:29 - Trial = 11842/30000 | Total reward = 30.38
2022-01-26 14:17:22.512 | DEBUG    | __main__:trials:24 - Trial = 11843/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.514 | DEBUG    | __main__:trials:29 - Trial = 11843/30000 | Total reward = 57.65
2022-01-26 14:17:22.517 | DEBUG    | __main__:trials:24 - Trial = 11844/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.519 | DEBUG    | __main__:trials:29 - Trial = 11844/30000 | Total reward = 43.31
2022-01-26 14:17:22.523 | DEBUG    | __main__:trials:24 - Trial = 11845/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.524 | DEBUG    | __main__:trials:29 - Trial = 11845/30000 | Total reward = 49.29
2022-01-26 14:17:22.528 | DEBUG    | __main__:trials:24 - Trial = 11846/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.530 | DEBUG    | __main__:trials:29 - Trial = 11846/30000 | Total reward = 43.89
2022-01-26 14:17:22.533 | DEBUG    | __main__:trials:24 - Trial = 11847/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.535 | DEBUG    | __main__:trials:29 - Trial = 11847/30000 | Total reward = 47.72
2022-01-26 14:17:22.538 | DEBUG    | __main__:trials:24 - Trial = 11848/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.540 | DEBUG    | __main__:trials:29 - Trial = 11848/30000 | Total reward = 45.44
2022-01-26 14:17:22.543 | DEBUG    | __main__:trials:24 - Trial = 11849/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.544 | DEBUG    | __main__:trials:29 - Trial = 11849/30000 | Total reward = 44.50
2022-01-26 14:17:22.547 | DEBUG    | __main__:trials:26 - Trial = 11850/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.549 | DEBUG    | __main__:trials:29 - Trial = 11850/30000 | Total reward = 33.20
2022-01-26 14:17:22.553 | DEBUG    | __main__:trials:24 - Trial = 11851/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.554 | DEBUG    | __main__:trials:29 - Trial = 11851/30000 | Total reward = 57.19
2022-01-26 14:17:22.557 | DEBUG    | __main__:trials:24 - Trial = 11852/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.558 | DEBUG    | __main__:trials:29 - Trial = 11852/30000 | Total reward = 35.19
2022-01-26 14:17:22.563 | DEBUG    | __main__:trials:24 - Trial = 11853/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.565 | DEBUG    | __main__:trials:29 - Trial = 11853/30000 | Total reward = 42.23
2022-01-26 14:17:22.568 | DEBUG    | __main__:trials:24 - Trial = 11854/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.570 | DEBUG    | __main__:trials:29 - Trial = 11854/30000 | Total reward = 41.99
2022-01-26 14:17:22.573 | DEBUG    | __main__:trials:24 - Trial = 11855/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.574 | DEBUG    | __main__:trials:29 - Trial = 11855/30000 | Total reward = 36.76
2022-01-26 14:17:22.579 | DEBUG    | __main__:trials:24 - Trial = 11856/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.580 | DEBUG    | __main__:trials:29 - Trial = 11856/30000 | Total reward = 33.89
2022-01-26 14:17:22.584 | DEBUG    | __main__:trials:24 - Trial = 11857/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.585 | DEBUG    | __main__:trials:29 - Trial = 11857/30000 | Total reward = 41.36
2022-01-26 14:17:22.589 | DEBUG    | __main__:trials:24 - Trial = 11858/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.591 | DEBUG    | __main__:trials:29 - Trial = 11858/30000 | Total reward = 62.68
2022-01-26 14:17:22.594 | DEBUG    | __main__:trials:24 - Trial = 11859/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.596 | DEBUG    | __main__:trials:29 - Trial = 11859/30000 | Total reward = 48.89
2022-01-26 14:17:22.600 | DEBUG    | __main__:trials:24 - Trial = 11860/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.601 | DEBUG    | __main__:trials:29 - Trial = 11860/30000 | Total reward = 47.58
2022-01-26 14:17:22.604 | DEBUG    | __main__:trials:24 - Trial = 11861/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.606 | DEBUG    | __main__:trials:29 - Trial = 11861/30000 | Total reward = 34.94
2022-01-26 14:17:22.610 | DEBUG    | __main__:trials:24 - Trial = 11862/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.611 | DEBUG    | __main__:trials:29 - Trial = 11862/30000 | Total reward = 34.58
2022-01-26 14:17:22.615 | DEBUG    | __main__:trials:24 - Trial = 11863/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.616 | DEBUG    | __main__:trials:29 - Trial = 11863/30000 | Total reward = 39.78
2022-01-26 14:17:22.620 | DEBUG    | __main__:trials:24 - Trial = 11864/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.621 | DEBUG    | __main__:trials:29 - Trial = 11864/30000 | Total reward = 66.99
2022-01-26 14:17:22.625 | DEBUG    | __main__:trials:24 - Trial = 11865/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.626 | DEBUG    | __main__:trials:29 - Trial = 11865/30000 | Total reward = 44.81
2022-01-26 14:17:22.630 | DEBUG    | __main__:trials:24 - Trial = 11866/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.632 | DEBUG    | __main__:trials:29 - Trial = 11866/30000 | Total reward = 67.43
2022-01-26 14:17:22.635 | DEBUG    | __main__:trials:24 - Trial = 11867/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.637 | DEBUG    | __main__:trials:29 - Trial = 11867/30000 | Total reward = 41.59
2022-01-26 14:17:22.640 | DEBUG    | __main__:trials:24 - Trial = 11868/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.642 | DEBUG    | __main__:trials:29 - Trial = 11868/30000 | Total reward = 36.87
2022-01-26 14:17:22.645 | DEBUG    | __main__:trials:24 - Trial = 11869/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.647 | DEBUG    | __main__:trials:29 - Trial = 11869/30000 | Total reward = 54.53
2022-01-26 14:17:22.651 | DEBUG    | __main__:trials:24 - Trial = 11870/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.652 | DEBUG    | __main__:trials:29 - Trial = 11870/30000 | Total reward = 43.98
2022-01-26 14:17:22.655 | DEBUG    | __main__:trials:24 - Trial = 11871/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.657 | DEBUG    | __main__:trials:29 - Trial = 11871/30000 | Total reward = 20.58
2022-01-26 14:17:22.661 | DEBUG    | __main__:trials:26 - Trial = 11872/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.661 | DEBUG    | __main__:trials:29 - Trial = 11872/30000 | Total reward = 26.34
2022-01-26 14:17:22.664 | DEBUG    | __main__:trials:24 - Trial = 11873/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.666 | DEBUG    | __main__:trials:29 - Trial = 11873/30000 | Total reward = 42.48
2022-01-26 14:17:22.670 | DEBUG    | __main__:trials:24 - Trial = 11874/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.671 | DEBUG    | __main__:trials:29 - Trial = 11874/30000 | Total reward = 37.99
2022-01-26 14:17:22.675 | DEBUG    | __main__:trials:24 - Trial = 11875/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.677 | DEBUG    | __main__:trials:29 - Trial = 11875/30000 | Total reward = 25.59
2022-01-26 14:17:22.681 | DEBUG    | __main__:trials:24 - Trial = 11876/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.681 | DEBUG    | __main__:trials:29 - Trial = 11876/30000 | Total reward = 58.64
2022-01-26 14:17:22.685 | DEBUG    | __main__:trials:24 - Trial = 11877/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.686 | DEBUG    | __main__:trials:29 - Trial = 11877/30000 | Total reward = 43.19
2022-01-26 14:17:22.690 | DEBUG    | __main__:trials:26 - Trial = 11878/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.690 | DEBUG    | __main__:trials:29 - Trial = 11878/30000 | Total reward = 20.66
2022-01-26 14:17:22.694 | DEBUG    | __main__:trials:24 - Trial = 11879/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.696 | DEBUG    | __main__:trials:29 - Trial = 11879/30000 | Total reward = 50.51
2022-01-26 14:17:22.699 | DEBUG    | __main__:trials:24 - Trial = 11880/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.701 | DEBUG    | __main__:trials:29 - Trial = 11880/30000 | Total reward = 43.33
2022-01-26 14:17:22.704 | DEBUG    | __main__:trials:24 - Trial = 11881/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.706 | DEBUG    | __main__:trials:29 - Trial = 11881/30000 | Total reward = 39.66
2022-01-26 14:17:22.710 | DEBUG    | __main__:trials:24 - Trial = 11882/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.711 | DEBUG    | __main__:trials:29 - Trial = 11882/30000 | Total reward = 65.88
2022-01-26 14:17:22.714 | DEBUG    | __main__:trials:24 - Trial = 11883/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.716 | DEBUG    | __main__:trials:29 - Trial = 11883/30000 | Total reward = 41.51
2022-01-26 14:17:22.719 | DEBUG    | __main__:trials:24 - Trial = 11884/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.721 | DEBUG    | __main__:trials:29 - Trial = 11884/30000 | Total reward = 58.54
2022-01-26 14:17:22.724 | DEBUG    | __main__:trials:24 - Trial = 11885/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.726 | DEBUG    | __main__:trials:29 - Trial = 11885/30000 | Total reward = 44.02
2022-01-26 14:17:22.730 | DEBUG    | __main__:trials:24 - Trial = 11886/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.731 | DEBUG    | __main__:trials:29 - Trial = 11886/30000 | Total reward = 25.69
2022-01-26 14:17:22.735 | DEBUG    | __main__:trials:24 - Trial = 11887/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.737 | DEBUG    | __main__:trials:29 - Trial = 11887/30000 | Total reward = 56.72
2022-01-26 14:17:22.740 | DEBUG    | __main__:trials:24 - Trial = 11888/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.742 | DEBUG    | __main__:trials:29 - Trial = 11888/30000 | Total reward = 44.99
2022-01-26 14:17:22.747 | DEBUG    | __main__:trials:24 - Trial = 11889/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.748 | DEBUG    | __main__:trials:29 - Trial = 11889/30000 | Total reward = 40.22
2022-01-26 14:17:22.752 | DEBUG    | __main__:trials:24 - Trial = 11890/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.753 | DEBUG    | __main__:trials:29 - Trial = 11890/30000 | Total reward = 66.87
2022-01-26 14:17:22.757 | DEBUG    | __main__:trials:24 - Trial = 11891/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.758 | DEBUG    | __main__:trials:29 - Trial = 11891/30000 | Total reward = 38.73
2022-01-26 14:17:22.762 | DEBUG    | __main__:trials:24 - Trial = 11892/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.763 | DEBUG    | __main__:trials:29 - Trial = 11892/30000 | Total reward = 38.49
2022-01-26 14:17:22.767 | DEBUG    | __main__:trials:24 - Trial = 11893/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.769 | DEBUG    | __main__:trials:29 - Trial = 11893/30000 | Total reward = 40.99
2022-01-26 14:17:22.772 | DEBUG    | __main__:trials:24 - Trial = 11894/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.774 | DEBUG    | __main__:trials:29 - Trial = 11894/30000 | Total reward = 49.05
2022-01-26 14:17:22.777 | DEBUG    | __main__:trials:24 - Trial = 11895/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.779 | DEBUG    | __main__:trials:29 - Trial = 11895/30000 | Total reward = 60.57
2022-01-26 14:17:22.783 | DEBUG    | __main__:trials:24 - Trial = 11896/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.784 | DEBUG    | __main__:trials:29 - Trial = 11896/30000 | Total reward = 40.55
2022-01-26 14:17:22.787 | DEBUG    | __main__:trials:24 - Trial = 11897/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.789 | DEBUG    | __main__:trials:29 - Trial = 11897/30000 | Total reward = 45.96
2022-01-26 14:17:22.792 | DEBUG    | __main__:trials:24 - Trial = 11898/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.793 | DEBUG    | __main__:trials:29 - Trial = 11898/30000 | Total reward = 42.45
2022-01-26 14:17:22.796 | DEBUG    | __main__:trials:24 - Trial = 11899/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.797 | DEBUG    | __main__:trials:29 - Trial = 11899/30000 | Total reward = 60.73
2022-01-26 14:17:22.801 | DEBUG    | __main__:trials:26 - Trial = 11900/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.802 | DEBUG    | __main__:trials:29 - Trial = 11900/30000 | Total reward = 42.01
2022-01-26 14:17:22.806 | DEBUG    | __main__:trials:24 - Trial = 11901/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.807 | DEBUG    | __main__:trials:29 - Trial = 11901/30000 | Total reward = 60.03
2022-01-26 14:17:22.811 | DEBUG    | __main__:trials:26 - Trial = 11902/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.812 | DEBUG    | __main__:trials:29 - Trial = 11902/30000 | Total reward = 19.80
2022-01-26 14:17:22.815 | DEBUG    | __main__:trials:24 - Trial = 11903/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.817 | DEBUG    | __main__:trials:29 - Trial = 11903/30000 | Total reward = 34.50
2022-01-26 14:17:22.820 | DEBUG    | __main__:trials:24 - Trial = 11904/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.821 | DEBUG    | __main__:trials:29 - Trial = 11904/30000 | Total reward = 66.66
2022-01-26 14:17:22.825 | DEBUG    | __main__:trials:24 - Trial = 11905/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.827 | DEBUG    | __main__:trials:29 - Trial = 11905/30000 | Total reward = 45.11
2022-01-26 14:17:22.830 | DEBUG    | __main__:trials:24 - Trial = 11906/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.832 | DEBUG    | __main__:trials:29 - Trial = 11906/30000 | Total reward = 47.62
2022-01-26 14:17:22.835 | DEBUG    | __main__:trials:24 - Trial = 11907/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.837 | DEBUG    | __main__:trials:29 - Trial = 11907/30000 | Total reward = 46.02
2022-01-26 14:17:22.839 | DEBUG    | __main__:trials:26 - Trial = 11908/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.840 | DEBUG    | __main__:trials:29 - Trial = 11908/30000 | Total reward = 14.93
2022-01-26 14:17:22.844 | DEBUG    | __main__:trials:24 - Trial = 11909/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.845 | DEBUG    | __main__:trials:29 - Trial = 11909/30000 | Total reward = 61.03
2022-01-26 14:17:22.849 | DEBUG    | __main__:trials:24 - Trial = 11910/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.850 | DEBUG    | __main__:trials:29 - Trial = 11910/30000 | Total reward = 46.52
2022-01-26 14:17:22.853 | DEBUG    | __main__:trials:24 - Trial = 11911/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.854 | DEBUG    | __main__:trials:29 - Trial = 11911/30000 | Total reward = 47.03
2022-01-26 14:17:22.857 | DEBUG    | __main__:trials:24 - Trial = 11912/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.859 | DEBUG    | __main__:trials:29 - Trial = 11912/30000 | Total reward = 34.18
2022-01-26 14:17:22.862 | DEBUG    | __main__:trials:24 - Trial = 11913/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.863 | DEBUG    | __main__:trials:29 - Trial = 11913/30000 | Total reward = 47.03
2022-01-26 14:17:22.865 | DEBUG    | __main__:trials:26 - Trial = 11914/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:22.866 | DEBUG    | __main__:trials:29 - Trial = 11914/30000 | Total reward = 9.53
2022-01-26 14:17:22.869 | DEBUG    | __main__:trials:24 - Trial = 11915/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.870 | DEBUG    | __main__:trials:29 - Trial = 11915/30000 | Total reward = 63.21
2022-01-26 14:17:22.873 | DEBUG    | __main__:trials:24 - Trial = 11916/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.876 | DEBUG    | __main__:trials:29 - Trial = 11916/30000 | Total reward = 47.03
2022-01-26 14:17:22.878 | DEBUG    | __main__:trials:24 - Trial = 11917/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.880 | DEBUG    | __main__:trials:29 - Trial = 11917/30000 | Total reward = 48.05
2022-01-26 14:17:22.883 | DEBUG    | __main__:trials:24 - Trial = 11918/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.885 | DEBUG    | __main__:trials:29 - Trial = 11918/30000 | Total reward = 59.00
2022-01-26 14:17:22.889 | DEBUG    | __main__:trials:24 - Trial = 11919/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.890 | DEBUG    | __main__:trials:29 - Trial = 11919/30000 | Total reward = 48.71
2022-01-26 14:17:22.893 | DEBUG    | __main__:trials:24 - Trial = 11920/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.895 | DEBUG    | __main__:trials:29 - Trial = 11920/30000 | Total reward = 46.05
2022-01-26 14:17:22.898 | DEBUG    | __main__:trials:24 - Trial = 11921/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.900 | DEBUG    | __main__:trials:29 - Trial = 11921/30000 | Total reward = 48.24
2022-01-26 14:17:22.903 | DEBUG    | __main__:trials:24 - Trial = 11922/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.905 | DEBUG    | __main__:trials:29 - Trial = 11922/30000 | Total reward = 40.40
2022-01-26 14:17:22.909 | DEBUG    | __main__:trials:24 - Trial = 11923/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.909 | DEBUG    | __main__:trials:29 - Trial = 11923/30000 | Total reward = 50.31
2022-01-26 14:17:22.913 | DEBUG    | __main__:trials:24 - Trial = 11924/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.913 | DEBUG    | __main__:trials:29 - Trial = 11924/30000 | Total reward = 32.75
2022-01-26 14:17:22.918 | DEBUG    | __main__:trials:24 - Trial = 11925/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.919 | DEBUG    | __main__:trials:29 - Trial = 11925/30000 | Total reward = 52.89
2022-01-26 14:17:22.923 | DEBUG    | __main__:trials:24 - Trial = 11926/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.924 | DEBUG    | __main__:trials:29 - Trial = 11926/30000 | Total reward = 50.45
2022-01-26 14:17:22.927 | DEBUG    | __main__:trials:24 - Trial = 11927/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.929 | DEBUG    | __main__:trials:29 - Trial = 11927/30000 | Total reward = 46.79
2022-01-26 14:17:22.933 | DEBUG    | __main__:trials:24 - Trial = 11928/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.934 | DEBUG    | __main__:trials:29 - Trial = 11928/30000 | Total reward = 40.66
2022-01-26 14:17:22.937 | DEBUG    | __main__:trials:24 - Trial = 11929/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.938 | DEBUG    | __main__:trials:29 - Trial = 11929/30000 | Total reward = 61.87
2022-01-26 14:17:22.941 | DEBUG    | __main__:trials:24 - Trial = 11930/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.942 | DEBUG    | __main__:trials:29 - Trial = 11930/30000 | Total reward = 38.97
2022-01-26 14:17:22.945 | DEBUG    | __main__:trials:24 - Trial = 11931/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.947 | DEBUG    | __main__:trials:29 - Trial = 11931/30000 | Total reward = 43.91
2022-01-26 14:17:22.951 | DEBUG    | __main__:trials:24 - Trial = 11932/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.952 | DEBUG    | __main__:trials:29 - Trial = 11932/30000 | Total reward = 46.07
2022-01-26 14:17:22.956 | DEBUG    | __main__:trials:24 - Trial = 11933/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.958 | DEBUG    | __main__:trials:29 - Trial = 11933/30000 | Total reward = 61.97
2022-01-26 14:17:22.961 | DEBUG    | __main__:trials:24 - Trial = 11934/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.963 | DEBUG    | __main__:trials:29 - Trial = 11934/30000 | Total reward = 40.35
2022-01-26 14:17:22.966 | DEBUG    | __main__:trials:24 - Trial = 11935/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.968 | DEBUG    | __main__:trials:29 - Trial = 11935/30000 | Total reward = 34.13
2022-01-26 14:17:22.972 | DEBUG    | __main__:trials:24 - Trial = 11936/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.973 | DEBUG    | __main__:trials:29 - Trial = 11936/30000 | Total reward = 66.54
2022-01-26 14:17:22.976 | DEBUG    | __main__:trials:24 - Trial = 11937/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.978 | DEBUG    | __main__:trials:29 - Trial = 11937/30000 | Total reward = 47.00
2022-01-26 14:17:22.982 | DEBUG    | __main__:trials:24 - Trial = 11938/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.982 | DEBUG    | __main__:trials:29 - Trial = 11938/30000 | Total reward = 46.53
2022-01-26 14:17:22.986 | DEBUG    | __main__:trials:24 - Trial = 11939/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.988 | DEBUG    | __main__:trials:29 - Trial = 11939/30000 | Total reward = 41.65
2022-01-26 14:17:22.992 | DEBUG    | __main__:trials:24 - Trial = 11940/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.993 | DEBUG    | __main__:trials:29 - Trial = 11940/30000 | Total reward = 41.40
2022-01-26 14:17:22.997 | DEBUG    | __main__:trials:24 - Trial = 11941/30000 | Max number of steps (20) reached
2022-01-26 14:17:22.997 | DEBUG    | __main__:trials:29 - Trial = 11941/30000 | Total reward = 52.41
2022-01-26 14:17:23.001 | DEBUG    | __main__:trials:24 - Trial = 11942/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.001 | DEBUG    | __main__:trials:29 - Trial = 11942/30000 | Total reward = 41.29
2022-01-26 14:17:23.005 | DEBUG    | __main__:trials:24 - Trial = 11943/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.005 | DEBUG    | __main__:trials:29 - Trial = 11943/30000 | Total reward = 42.76
2022-01-26 14:17:23.009 | DEBUG    | __main__:trials:24 - Trial = 11944/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.009 | DEBUG    | __main__:trials:29 - Trial = 11944/30000 | Total reward = 63.76
2022-01-26 14:17:23.013 | DEBUG    | __main__:trials:24 - Trial = 11945/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.014 | DEBUG    | __main__:trials:29 - Trial = 11945/30000 | Total reward = 30.23
2022-01-26 14:17:23.018 | DEBUG    | __main__:trials:24 - Trial = 11946/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.019 | DEBUG    | __main__:trials:29 - Trial = 11946/30000 | Total reward = 49.51
2022-01-26 14:17:23.023 | DEBUG    | __main__:trials:24 - Trial = 11947/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.025 | DEBUG    | __main__:trials:29 - Trial = 11947/30000 | Total reward = 57.44
2022-01-26 14:17:23.028 | DEBUG    | __main__:trials:24 - Trial = 11948/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.030 | DEBUG    | __main__:trials:29 - Trial = 11948/30000 | Total reward = 51.54
2022-01-26 14:17:23.033 | DEBUG    | __main__:trials:24 - Trial = 11949/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.035 | DEBUG    | __main__:trials:29 - Trial = 11949/30000 | Total reward = 44.46
2022-01-26 14:17:23.039 | DEBUG    | __main__:trials:24 - Trial = 11950/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.039 | DEBUG    | __main__:trials:29 - Trial = 11950/30000 | Total reward = 42.60
2022-01-26 14:17:23.043 | DEBUG    | __main__:trials:24 - Trial = 11951/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.045 | DEBUG    | __main__:trials:29 - Trial = 11951/30000 | Total reward = 49.18
2022-01-26 14:17:23.047 | DEBUG    | __main__:trials:26 - Trial = 11952/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.049 | DEBUG    | __main__:trials:29 - Trial = 11952/30000 | Total reward = 18.54
2022-01-26 14:17:23.053 | DEBUG    | __main__:trials:24 - Trial = 11953/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.054 | DEBUG    | __main__:trials:29 - Trial = 11953/30000 | Total reward = 37.96
2022-01-26 14:17:23.058 | DEBUG    | __main__:trials:24 - Trial = 11954/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.059 | DEBUG    | __main__:trials:29 - Trial = 11954/30000 | Total reward = 33.30
2022-01-26 14:17:23.063 | DEBUG    | __main__:trials:24 - Trial = 11955/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.063 | DEBUG    | __main__:trials:29 - Trial = 11955/30000 | Total reward = 47.62
2022-01-26 14:17:23.068 | DEBUG    | __main__:trials:24 - Trial = 11956/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.069 | DEBUG    | __main__:trials:29 - Trial = 11956/30000 | Total reward = 40.69
2022-01-26 14:17:23.072 | DEBUG    | __main__:trials:24 - Trial = 11957/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.074 | DEBUG    | __main__:trials:29 - Trial = 11957/30000 | Total reward = 57.58
2022-01-26 14:17:23.078 | DEBUG    | __main__:trials:24 - Trial = 11958/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.079 | DEBUG    | __main__:trials:29 - Trial = 11958/30000 | Total reward = 54.42
2022-01-26 14:17:23.083 | DEBUG    | __main__:trials:24 - Trial = 11959/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.084 | DEBUG    | __main__:trials:29 - Trial = 11959/30000 | Total reward = 60.17
2022-01-26 14:17:23.088 | DEBUG    | __main__:trials:24 - Trial = 11960/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.090 | DEBUG    | __main__:trials:29 - Trial = 11960/30000 | Total reward = 38.83
2022-01-26 14:17:23.093 | DEBUG    | __main__:trials:24 - Trial = 11961/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.095 | DEBUG    | __main__:trials:29 - Trial = 11961/30000 | Total reward = 47.03
2022-01-26 14:17:23.098 | DEBUG    | __main__:trials:24 - Trial = 11962/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.100 | DEBUG    | __main__:trials:29 - Trial = 11962/30000 | Total reward = 35.16
2022-01-26 14:17:23.104 | DEBUG    | __main__:trials:24 - Trial = 11963/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.106 | DEBUG    | __main__:trials:29 - Trial = 11963/30000 | Total reward = 36.00
2022-01-26 14:17:23.109 | DEBUG    | __main__:trials:24 - Trial = 11964/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.111 | DEBUG    | __main__:trials:29 - Trial = 11964/30000 | Total reward = 42.70
2022-01-26 14:17:23.115 | DEBUG    | __main__:trials:24 - Trial = 11965/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.116 | DEBUG    | __main__:trials:29 - Trial = 11965/30000 | Total reward = 36.51
2022-01-26 14:17:23.120 | DEBUG    | __main__:trials:24 - Trial = 11966/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.121 | DEBUG    | __main__:trials:29 - Trial = 11966/30000 | Total reward = 41.59
2022-01-26 14:17:23.124 | DEBUG    | __main__:trials:24 - Trial = 11967/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.126 | DEBUG    | __main__:trials:29 - Trial = 11967/30000 | Total reward = 58.21
2022-01-26 14:17:23.130 | DEBUG    | __main__:trials:24 - Trial = 11968/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.131 | DEBUG    | __main__:trials:29 - Trial = 11968/30000 | Total reward = 36.88
2022-01-26 14:17:23.134 | DEBUG    | __main__:trials:24 - Trial = 11969/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.136 | DEBUG    | __main__:trials:29 - Trial = 11969/30000 | Total reward = 42.86
2022-01-26 14:17:23.139 | DEBUG    | __main__:trials:24 - Trial = 11970/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.141 | DEBUG    | __main__:trials:29 - Trial = 11970/30000 | Total reward = 49.76
2022-01-26 14:17:23.144 | DEBUG    | __main__:trials:24 - Trial = 11971/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.146 | DEBUG    | __main__:trials:29 - Trial = 11971/30000 | Total reward = 47.62
2022-01-26 14:17:23.149 | DEBUG    | __main__:trials:24 - Trial = 11972/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.151 | DEBUG    | __main__:trials:29 - Trial = 11972/30000 | Total reward = 41.00
2022-01-26 14:17:23.154 | DEBUG    | __main__:trials:24 - Trial = 11973/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.156 | DEBUG    | __main__:trials:29 - Trial = 11973/30000 | Total reward = 39.80
2022-01-26 14:17:23.159 | DEBUG    | __main__:trials:24 - Trial = 11974/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.161 | DEBUG    | __main__:trials:29 - Trial = 11974/30000 | Total reward = 46.63
2022-01-26 14:17:23.164 | DEBUG    | __main__:trials:24 - Trial = 11975/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.165 | DEBUG    | __main__:trials:29 - Trial = 11975/30000 | Total reward = 41.29
2022-01-26 14:17:23.169 | DEBUG    | __main__:trials:24 - Trial = 11976/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.171 | DEBUG    | __main__:trials:29 - Trial = 11976/30000 | Total reward = 48.30
2022-01-26 14:17:23.174 | DEBUG    | __main__:trials:24 - Trial = 11977/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.176 | DEBUG    | __main__:trials:29 - Trial = 11977/30000 | Total reward = 41.89
2022-01-26 14:17:23.180 | DEBUG    | __main__:trials:24 - Trial = 11978/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.180 | DEBUG    | __main__:trials:29 - Trial = 11978/30000 | Total reward = 49.44
2022-01-26 14:17:23.184 | DEBUG    | __main__:trials:24 - Trial = 11979/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.186 | DEBUG    | __main__:trials:29 - Trial = 11979/30000 | Total reward = 59.67
2022-01-26 14:17:23.189 | DEBUG    | __main__:trials:24 - Trial = 11980/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.191 | DEBUG    | __main__:trials:29 - Trial = 11980/30000 | Total reward = 61.07
2022-01-26 14:17:23.195 | DEBUG    | __main__:trials:24 - Trial = 11981/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.196 | DEBUG    | __main__:trials:29 - Trial = 11981/30000 | Total reward = 56.75
2022-01-26 14:17:23.200 | DEBUG    | __main__:trials:24 - Trial = 11982/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.201 | DEBUG    | __main__:trials:29 - Trial = 11982/30000 | Total reward = 54.83
2022-01-26 14:17:23.205 | DEBUG    | __main__:trials:24 - Trial = 11983/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.206 | DEBUG    | __main__:trials:29 - Trial = 11983/30000 | Total reward = 36.15
2022-01-26 14:17:23.210 | DEBUG    | __main__:trials:24 - Trial = 11984/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.211 | DEBUG    | __main__:trials:29 - Trial = 11984/30000 | Total reward = 42.03
2022-01-26 14:17:23.214 | DEBUG    | __main__:trials:24 - Trial = 11985/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.216 | DEBUG    | __main__:trials:29 - Trial = 11985/30000 | Total reward = 39.24
2022-01-26 14:17:23.219 | DEBUG    | __main__:trials:24 - Trial = 11986/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.221 | DEBUG    | __main__:trials:29 - Trial = 11986/30000 | Total reward = 47.62
2022-01-26 14:17:23.225 | DEBUG    | __main__:trials:24 - Trial = 11987/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.226 | DEBUG    | __main__:trials:29 - Trial = 11987/30000 | Total reward = 32.26
2022-01-26 14:17:23.230 | DEBUG    | __main__:trials:24 - Trial = 11988/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.231 | DEBUG    | __main__:trials:29 - Trial = 11988/30000 | Total reward = 37.24
2022-01-26 14:17:23.235 | DEBUG    | __main__:trials:24 - Trial = 11989/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.236 | DEBUG    | __main__:trials:29 - Trial = 11989/30000 | Total reward = 28.66
2022-01-26 14:17:23.240 | DEBUG    | __main__:trials:24 - Trial = 11990/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.242 | DEBUG    | __main__:trials:29 - Trial = 11990/30000 | Total reward = 45.89
2022-01-26 14:17:23.245 | DEBUG    | __main__:trials:24 - Trial = 11991/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.247 | DEBUG    | __main__:trials:29 - Trial = 11991/30000 | Total reward = 61.08
2022-01-26 14:17:23.251 | DEBUG    | __main__:trials:24 - Trial = 11992/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.252 | DEBUG    | __main__:trials:29 - Trial = 11992/30000 | Total reward = 52.93
2022-01-26 14:17:23.256 | DEBUG    | __main__:trials:24 - Trial = 11993/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.257 | DEBUG    | __main__:trials:29 - Trial = 11993/30000 | Total reward = 44.27
2022-01-26 14:17:23.260 | DEBUG    | __main__:trials:24 - Trial = 11994/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.261 | DEBUG    | __main__:trials:29 - Trial = 11994/30000 | Total reward = 42.35
2022-01-26 14:17:23.265 | DEBUG    | __main__:trials:24 - Trial = 11995/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.267 | DEBUG    | __main__:trials:29 - Trial = 11995/30000 | Total reward = 37.02
2022-01-26 14:17:23.271 | DEBUG    | __main__:trials:24 - Trial = 11996/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.272 | DEBUG    | __main__:trials:29 - Trial = 11996/30000 | Total reward = 41.93
2022-01-26 14:17:23.276 | DEBUG    | __main__:trials:24 - Trial = 11997/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.278 | DEBUG    | __main__:trials:29 - Trial = 11997/30000 | Total reward = 61.89
2022-01-26 14:17:23.281 | DEBUG    | __main__:trials:24 - Trial = 11998/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.282 | DEBUG    | __main__:trials:29 - Trial = 11998/30000 | Total reward = 47.03
2022-01-26 14:17:23.285 | DEBUG    | __main__:trials:24 - Trial = 11999/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.286 | DEBUG    | __main__:trials:29 - Trial = 11999/30000 | Total reward = 46.39
2022-01-26 14:17:23.289 | DEBUG    | __main__:trials:24 - Trial = 12000/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.291 | DEBUG    | __main__:trials:29 - Trial = 12000/30000 | Total reward = 43.83
2022-01-26 14:17:23.294 | DEBUG    | __main__:trials:24 - Trial = 12001/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.296 | DEBUG    | __main__:trials:29 - Trial = 12001/30000 | Total reward = 41.92
2022-01-26 14:17:23.300 | DEBUG    | __main__:trials:24 - Trial = 12002/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.301 | DEBUG    | __main__:trials:29 - Trial = 12002/30000 | Total reward = 36.52
2022-01-26 14:17:23.305 | DEBUG    | __main__:trials:24 - Trial = 12003/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.306 | DEBUG    | __main__:trials:29 - Trial = 12003/30000 | Total reward = 38.79
2022-01-26 14:17:23.310 | DEBUG    | __main__:trials:24 - Trial = 12004/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.311 | DEBUG    | __main__:trials:29 - Trial = 12004/30000 | Total reward = 43.32
2022-01-26 14:17:23.315 | DEBUG    | __main__:trials:24 - Trial = 12005/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.316 | DEBUG    | __main__:trials:29 - Trial = 12005/30000 | Total reward = 32.03
2022-01-26 14:17:23.320 | DEBUG    | __main__:trials:24 - Trial = 12006/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.322 | DEBUG    | __main__:trials:29 - Trial = 12006/30000 | Total reward = 55.13
2022-01-26 14:17:23.325 | DEBUG    | __main__:trials:24 - Trial = 12007/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.327 | DEBUG    | __main__:trials:29 - Trial = 12007/30000 | Total reward = 59.54
2022-01-26 14:17:23.330 | DEBUG    | __main__:trials:24 - Trial = 12008/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.332 | DEBUG    | __main__:trials:29 - Trial = 12008/30000 | Total reward = 44.63
2022-01-26 14:17:23.336 | DEBUG    | __main__:trials:24 - Trial = 12009/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.337 | DEBUG    | __main__:trials:29 - Trial = 12009/30000 | Total reward = 57.52
2022-01-26 14:17:23.341 | DEBUG    | __main__:trials:24 - Trial = 12010/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.343 | DEBUG    | __main__:trials:29 - Trial = 12010/30000 | Total reward = 59.05
2022-01-26 14:17:23.345 | DEBUG    | __main__:trials:26 - Trial = 12011/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.347 | DEBUG    | __main__:trials:29 - Trial = 12011/30000 | Total reward = 31.45
2022-01-26 14:17:23.351 | DEBUG    | __main__:trials:24 - Trial = 12012/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.352 | DEBUG    | __main__:trials:29 - Trial = 12012/30000 | Total reward = 41.56
2022-01-26 14:17:23.356 | DEBUG    | __main__:trials:24 - Trial = 12013/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.357 | DEBUG    | __main__:trials:29 - Trial = 12013/30000 | Total reward = 51.01
2022-01-26 14:17:23.361 | DEBUG    | __main__:trials:24 - Trial = 12014/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.362 | DEBUG    | __main__:trials:29 - Trial = 12014/30000 | Total reward = 64.25
2022-01-26 14:17:23.364 | DEBUG    | __main__:trials:26 - Trial = 12015/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.366 | DEBUG    | __main__:trials:29 - Trial = 12015/30000 | Total reward = 14.95
2022-01-26 14:17:23.369 | DEBUG    | __main__:trials:24 - Trial = 12016/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.371 | DEBUG    | __main__:trials:29 - Trial = 12016/30000 | Total reward = 33.88
2022-01-26 14:17:23.374 | DEBUG    | __main__:trials:24 - Trial = 12017/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.376 | DEBUG    | __main__:trials:29 - Trial = 12017/30000 | Total reward = 57.39
2022-01-26 14:17:23.379 | DEBUG    | __main__:trials:24 - Trial = 12018/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.381 | DEBUG    | __main__:trials:29 - Trial = 12018/30000 | Total reward = 48.21
2022-01-26 14:17:23.384 | DEBUG    | __main__:trials:24 - Trial = 12019/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.386 | DEBUG    | __main__:trials:29 - Trial = 12019/30000 | Total reward = 34.99
2022-01-26 14:17:23.389 | DEBUG    | __main__:trials:24 - Trial = 12020/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.390 | DEBUG    | __main__:trials:29 - Trial = 12020/30000 | Total reward = 56.35
2022-01-26 14:17:23.394 | DEBUG    | __main__:trials:24 - Trial = 12021/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.395 | DEBUG    | __main__:trials:29 - Trial = 12021/30000 | Total reward = 52.82
2022-01-26 14:17:23.399 | DEBUG    | __main__:trials:24 - Trial = 12022/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.401 | DEBUG    | __main__:trials:29 - Trial = 12022/30000 | Total reward = 47.21
2022-01-26 14:17:23.403 | DEBUG    | __main__:trials:24 - Trial = 12023/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.405 | DEBUG    | __main__:trials:29 - Trial = 12023/30000 | Total reward = 53.48
2022-01-26 14:17:23.409 | DEBUG    | __main__:trials:24 - Trial = 12024/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.411 | DEBUG    | __main__:trials:29 - Trial = 12024/30000 | Total reward = 57.57
2022-01-26 14:17:23.414 | DEBUG    | __main__:trials:24 - Trial = 12025/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.416 | DEBUG    | __main__:trials:29 - Trial = 12025/30000 | Total reward = 29.99
2022-01-26 14:17:23.420 | DEBUG    | __main__:trials:24 - Trial = 12026/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.422 | DEBUG    | __main__:trials:29 - Trial = 12026/30000 | Total reward = 38.04
2022-01-26 14:17:23.425 | DEBUG    | __main__:trials:24 - Trial = 12027/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.427 | DEBUG    | __main__:trials:29 - Trial = 12027/30000 | Total reward = 41.98
2022-01-26 14:17:23.431 | DEBUG    | __main__:trials:24 - Trial = 12028/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.433 | DEBUG    | __main__:trials:29 - Trial = 12028/30000 | Total reward = 41.19
2022-01-26 14:17:23.436 | DEBUG    | __main__:trials:24 - Trial = 12029/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.438 | DEBUG    | __main__:trials:29 - Trial = 12029/30000 | Total reward = 57.96
2022-01-26 14:17:23.441 | DEBUG    | __main__:trials:24 - Trial = 12030/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.442 | DEBUG    | __main__:trials:29 - Trial = 12030/30000 | Total reward = 59.27
2022-01-26 14:17:23.445 | DEBUG    | __main__:trials:24 - Trial = 12031/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.446 | DEBUG    | __main__:trials:29 - Trial = 12031/30000 | Total reward = 40.63
2022-01-26 14:17:23.449 | DEBUG    | __main__:trials:24 - Trial = 12032/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.451 | DEBUG    | __main__:trials:29 - Trial = 12032/30000 | Total reward = 43.19
2022-01-26 14:17:23.454 | DEBUG    | __main__:trials:24 - Trial = 12033/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.455 | DEBUG    | __main__:trials:29 - Trial = 12033/30000 | Total reward = 45.76
2022-01-26 14:17:23.458 | DEBUG    | __main__:trials:24 - Trial = 12034/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.459 | DEBUG    | __main__:trials:29 - Trial = 12034/30000 | Total reward = 51.52
2022-01-26 14:17:23.462 | DEBUG    | __main__:trials:24 - Trial = 12035/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.463 | DEBUG    | __main__:trials:29 - Trial = 12035/30000 | Total reward = 60.92
2022-01-26 14:17:23.466 | DEBUG    | __main__:trials:24 - Trial = 12036/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.467 | DEBUG    | __main__:trials:29 - Trial = 12036/30000 | Total reward = 38.73
2022-01-26 14:17:23.470 | DEBUG    | __main__:trials:24 - Trial = 12037/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.472 | DEBUG    | __main__:trials:29 - Trial = 12037/30000 | Total reward = 38.78
2022-01-26 14:17:23.476 | DEBUG    | __main__:trials:24 - Trial = 12038/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.477 | DEBUG    | __main__:trials:29 - Trial = 12038/30000 | Total reward = 40.93
2022-01-26 14:17:23.480 | DEBUG    | __main__:trials:24 - Trial = 12039/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.482 | DEBUG    | __main__:trials:29 - Trial = 12039/30000 | Total reward = 48.75
2022-01-26 14:17:23.485 | DEBUG    | __main__:trials:24 - Trial = 12040/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.487 | DEBUG    | __main__:trials:29 - Trial = 12040/30000 | Total reward = 41.06
2022-01-26 14:17:23.490 | DEBUG    | __main__:trials:24 - Trial = 12041/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.490 | DEBUG    | __main__:trials:29 - Trial = 12041/30000 | Total reward = 50.85
2022-01-26 14:17:23.494 | DEBUG    | __main__:trials:24 - Trial = 12042/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.496 | DEBUG    | __main__:trials:29 - Trial = 12042/30000 | Total reward = 49.80
2022-01-26 14:17:23.498 | DEBUG    | __main__:trials:24 - Trial = 12043/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.500 | DEBUG    | __main__:trials:29 - Trial = 12043/30000 | Total reward = 45.38
2022-01-26 14:17:23.503 | DEBUG    | __main__:trials:24 - Trial = 12044/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.505 | DEBUG    | __main__:trials:29 - Trial = 12044/30000 | Total reward = 47.03
2022-01-26 14:17:23.508 | DEBUG    | __main__:trials:24 - Trial = 12045/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.509 | DEBUG    | __main__:trials:29 - Trial = 12045/30000 | Total reward = 31.06
2022-01-26 14:17:23.513 | DEBUG    | __main__:trials:24 - Trial = 12046/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.513 | DEBUG    | __main__:trials:29 - Trial = 12046/30000 | Total reward = 38.31
2022-01-26 14:17:23.517 | DEBUG    | __main__:trials:24 - Trial = 12047/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.518 | DEBUG    | __main__:trials:29 - Trial = 12047/30000 | Total reward = 53.94
2022-01-26 14:17:23.521 | DEBUG    | __main__:trials:24 - Trial = 12048/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.522 | DEBUG    | __main__:trials:29 - Trial = 12048/30000 | Total reward = 42.70
2022-01-26 14:17:23.525 | DEBUG    | __main__:trials:24 - Trial = 12049/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.527 | DEBUG    | __main__:trials:29 - Trial = 12049/30000 | Total reward = 45.69
2022-01-26 14:17:23.531 | DEBUG    | __main__:trials:24 - Trial = 12050/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.532 | DEBUG    | __main__:trials:29 - Trial = 12050/30000 | Total reward = 38.30
2022-01-26 14:17:23.535 | DEBUG    | __main__:trials:26 - Trial = 12051/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.536 | DEBUG    | __main__:trials:29 - Trial = 12051/30000 | Total reward = 38.64
2022-01-26 14:17:23.540 | DEBUG    | __main__:trials:24 - Trial = 12052/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.542 | DEBUG    | __main__:trials:29 - Trial = 12052/30000 | Total reward = 64.77
2022-01-26 14:17:23.545 | DEBUG    | __main__:trials:24 - Trial = 12053/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.546 | DEBUG    | __main__:trials:29 - Trial = 12053/30000 | Total reward = 50.33
2022-01-26 14:17:23.550 | DEBUG    | __main__:trials:24 - Trial = 12054/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.551 | DEBUG    | __main__:trials:29 - Trial = 12054/30000 | Total reward = 64.29
2022-01-26 14:17:23.555 | DEBUG    | __main__:trials:24 - Trial = 12055/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.557 | DEBUG    | __main__:trials:29 - Trial = 12055/30000 | Total reward = 47.03
2022-01-26 14:17:23.559 | DEBUG    | __main__:trials:24 - Trial = 12056/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.561 | DEBUG    | __main__:trials:29 - Trial = 12056/30000 | Total reward = 29.52
2022-01-26 14:17:23.565 | DEBUG    | __main__:trials:24 - Trial = 12057/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.566 | DEBUG    | __main__:trials:29 - Trial = 12057/30000 | Total reward = 46.52
2022-01-26 14:17:23.570 | DEBUG    | __main__:trials:24 - Trial = 12058/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.572 | DEBUG    | __main__:trials:29 - Trial = 12058/30000 | Total reward = 34.24
2022-01-26 14:17:23.575 | DEBUG    | __main__:trials:24 - Trial = 12059/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.577 | DEBUG    | __main__:trials:29 - Trial = 12059/30000 | Total reward = 54.35
2022-01-26 14:17:23.580 | DEBUG    | __main__:trials:24 - Trial = 12060/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.581 | DEBUG    | __main__:trials:29 - Trial = 12060/30000 | Total reward = 37.19
2022-01-26 14:17:23.585 | DEBUG    | __main__:trials:24 - Trial = 12061/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.586 | DEBUG    | __main__:trials:29 - Trial = 12061/30000 | Total reward = 42.25
2022-01-26 14:17:23.590 | DEBUG    | __main__:trials:24 - Trial = 12062/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.591 | DEBUG    | __main__:trials:29 - Trial = 12062/30000 | Total reward = 23.02
2022-01-26 14:17:23.595 | DEBUG    | __main__:trials:24 - Trial = 12063/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.596 | DEBUG    | __main__:trials:29 - Trial = 12063/30000 | Total reward = 31.38
2022-01-26 14:17:23.600 | DEBUG    | __main__:trials:24 - Trial = 12064/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.601 | DEBUG    | __main__:trials:29 - Trial = 12064/30000 | Total reward = 42.92
2022-01-26 14:17:23.605 | DEBUG    | __main__:trials:24 - Trial = 12065/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.607 | DEBUG    | __main__:trials:29 - Trial = 12065/30000 | Total reward = 37.89
2022-01-26 14:17:23.610 | DEBUG    | __main__:trials:24 - Trial = 12066/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.612 | DEBUG    | __main__:trials:29 - Trial = 12066/30000 | Total reward = 29.80
2022-01-26 14:17:23.615 | DEBUG    | __main__:trials:26 - Trial = 12067/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.617 | DEBUG    | __main__:trials:29 - Trial = 12067/30000 | Total reward = 31.64
2022-01-26 14:17:23.620 | DEBUG    | __main__:trials:24 - Trial = 12068/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.621 | DEBUG    | __main__:trials:29 - Trial = 12068/30000 | Total reward = 40.05
2022-01-26 14:17:23.625 | DEBUG    | __main__:trials:24 - Trial = 12069/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.627 | DEBUG    | __main__:trials:29 - Trial = 12069/30000 | Total reward = 63.20
2022-01-26 14:17:23.630 | DEBUG    | __main__:trials:24 - Trial = 12070/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.632 | DEBUG    | __main__:trials:29 - Trial = 12070/30000 | Total reward = 47.03
2022-01-26 14:17:23.636 | DEBUG    | __main__:trials:24 - Trial = 12071/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.637 | DEBUG    | __main__:trials:29 - Trial = 12071/30000 | Total reward = 41.54
2022-01-26 14:17:23.640 | DEBUG    | __main__:trials:24 - Trial = 12072/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.642 | DEBUG    | __main__:trials:29 - Trial = 12072/30000 | Total reward = 40.19
2022-01-26 14:17:23.645 | DEBUG    | __main__:trials:24 - Trial = 12073/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.646 | DEBUG    | __main__:trials:29 - Trial = 12073/30000 | Total reward = 47.52
2022-01-26 14:17:23.649 | DEBUG    | __main__:trials:24 - Trial = 12074/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.650 | DEBUG    | __main__:trials:29 - Trial = 12074/30000 | Total reward = 50.30
2022-01-26 14:17:23.653 | DEBUG    | __main__:trials:24 - Trial = 12075/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.655 | DEBUG    | __main__:trials:29 - Trial = 12075/30000 | Total reward = 41.17
2022-01-26 14:17:23.659 | DEBUG    | __main__:trials:24 - Trial = 12076/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.660 | DEBUG    | __main__:trials:29 - Trial = 12076/30000 | Total reward = 40.45
2022-01-26 14:17:23.664 | DEBUG    | __main__:trials:24 - Trial = 12077/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.665 | DEBUG    | __main__:trials:29 - Trial = 12077/30000 | Total reward = 33.18
2022-01-26 14:17:23.669 | DEBUG    | __main__:trials:24 - Trial = 12078/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.671 | DEBUG    | __main__:trials:29 - Trial = 12078/30000 | Total reward = 47.41
2022-01-26 14:17:23.675 | DEBUG    | __main__:trials:24 - Trial = 12079/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.676 | DEBUG    | __main__:trials:29 - Trial = 12079/30000 | Total reward = 29.79
2022-01-26 14:17:23.680 | DEBUG    | __main__:trials:24 - Trial = 12080/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.681 | DEBUG    | __main__:trials:29 - Trial = 12080/30000 | Total reward = 45.07
2022-01-26 14:17:23.684 | DEBUG    | __main__:trials:26 - Trial = 12081/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.686 | DEBUG    | __main__:trials:29 - Trial = 12081/30000 | Total reward = 30.48
2022-01-26 14:17:23.690 | DEBUG    | __main__:trials:24 - Trial = 12082/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.691 | DEBUG    | __main__:trials:29 - Trial = 12082/30000 | Total reward = 39.20
2022-01-26 14:17:23.694 | DEBUG    | __main__:trials:24 - Trial = 12083/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.696 | DEBUG    | __main__:trials:29 - Trial = 12083/30000 | Total reward = 24.61
2022-01-26 14:17:23.700 | DEBUG    | __main__:trials:24 - Trial = 12084/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.701 | DEBUG    | __main__:trials:29 - Trial = 12084/30000 | Total reward = 32.82
2022-01-26 14:17:23.704 | DEBUG    | __main__:trials:24 - Trial = 12085/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.705 | DEBUG    | __main__:trials:29 - Trial = 12085/30000 | Total reward = 60.39
2022-01-26 14:17:23.708 | DEBUG    | __main__:trials:26 - Trial = 12086/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.709 | DEBUG    | __main__:trials:29 - Trial = 12086/30000 | Total reward = 14.21
2022-01-26 14:17:23.712 | DEBUG    | __main__:trials:24 - Trial = 12087/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.714 | DEBUG    | __main__:trials:29 - Trial = 12087/30000 | Total reward = 38.53
2022-01-26 14:17:23.718 | DEBUG    | __main__:trials:24 - Trial = 12088/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.720 | DEBUG    | __main__:trials:29 - Trial = 12088/30000 | Total reward = 23.54
2022-01-26 14:17:23.723 | DEBUG    | __main__:trials:24 - Trial = 12089/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.725 | DEBUG    | __main__:trials:29 - Trial = 12089/30000 | Total reward = 53.53
2022-01-26 14:17:23.729 | DEBUG    | __main__:trials:24 - Trial = 12090/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.730 | DEBUG    | __main__:trials:29 - Trial = 12090/30000 | Total reward = 47.41
2022-01-26 14:17:23.734 | DEBUG    | __main__:trials:24 - Trial = 12091/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.734 | DEBUG    | __main__:trials:29 - Trial = 12091/30000 | Total reward = 66.25
2022-01-26 14:17:23.739 | DEBUG    | __main__:trials:24 - Trial = 12092/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.739 | DEBUG    | __main__:trials:29 - Trial = 12092/30000 | Total reward = 35.99
2022-01-26 14:17:23.744 | DEBUG    | __main__:trials:26 - Trial = 12093/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.747 | DEBUG    | __main__:trials:29 - Trial = 12093/30000 | Total reward = 25.56
2022-01-26 14:17:23.750 | DEBUG    | __main__:trials:24 - Trial = 12094/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.752 | DEBUG    | __main__:trials:29 - Trial = 12094/30000 | Total reward = 60.09
2022-01-26 14:17:23.756 | DEBUG    | __main__:trials:24 - Trial = 12095/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.757 | DEBUG    | __main__:trials:29 - Trial = 12095/30000 | Total reward = 37.40
2022-01-26 14:17:23.761 | DEBUG    | __main__:trials:24 - Trial = 12096/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.761 | DEBUG    | __main__:trials:29 - Trial = 12096/30000 | Total reward = 47.03
2022-01-26 14:17:23.764 | DEBUG    | __main__:trials:24 - Trial = 12097/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.766 | DEBUG    | __main__:trials:29 - Trial = 12097/30000 | Total reward = 47.83
2022-01-26 14:17:23.769 | DEBUG    | __main__:trials:24 - Trial = 12098/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.770 | DEBUG    | __main__:trials:29 - Trial = 12098/30000 | Total reward = 57.31
2022-01-26 14:17:23.774 | DEBUG    | __main__:trials:24 - Trial = 12099/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.776 | DEBUG    | __main__:trials:29 - Trial = 12099/30000 | Total reward = 47.03
2022-01-26 14:17:23.778 | DEBUG    | __main__:trials:26 - Trial = 12100/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.779 | DEBUG    | __main__:trials:29 - Trial = 12100/30000 | Total reward = 23.95
2022-01-26 14:17:23.782 | DEBUG    | __main__:trials:26 - Trial = 12101/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.782 | DEBUG    | __main__:trials:29 - Trial = 12101/30000 | Total reward = 26.65
2022-01-26 14:17:23.786 | DEBUG    | __main__:trials:24 - Trial = 12102/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.787 | DEBUG    | __main__:trials:29 - Trial = 12102/30000 | Total reward = 23.58
2022-01-26 14:17:23.790 | DEBUG    | __main__:trials:24 - Trial = 12103/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.791 | DEBUG    | __main__:trials:29 - Trial = 12103/30000 | Total reward = 29.80
2022-01-26 14:17:23.794 | DEBUG    | __main__:trials:24 - Trial = 12104/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.796 | DEBUG    | __main__:trials:29 - Trial = 12104/30000 | Total reward = 30.96
2022-01-26 14:17:23.799 | DEBUG    | __main__:trials:24 - Trial = 12105/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.801 | DEBUG    | __main__:trials:29 - Trial = 12105/30000 | Total reward = 30.27
2022-01-26 14:17:23.804 | DEBUG    | __main__:trials:24 - Trial = 12106/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.805 | DEBUG    | __main__:trials:29 - Trial = 12106/30000 | Total reward = 24.80
2022-01-26 14:17:23.809 | DEBUG    | __main__:trials:24 - Trial = 12107/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.809 | DEBUG    | __main__:trials:29 - Trial = 12107/30000 | Total reward = 41.20
2022-01-26 14:17:23.813 | DEBUG    | __main__:trials:24 - Trial = 12108/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.814 | DEBUG    | __main__:trials:29 - Trial = 12108/30000 | Total reward = 29.22
2022-01-26 14:17:23.817 | DEBUG    | __main__:trials:24 - Trial = 12109/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.819 | DEBUG    | __main__:trials:29 - Trial = 12109/30000 | Total reward = 31.57
2022-01-26 14:17:23.822 | DEBUG    | __main__:trials:24 - Trial = 12110/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.824 | DEBUG    | __main__:trials:29 - Trial = 12110/30000 | Total reward = 31.66
2022-01-26 14:17:23.827 | DEBUG    | __main__:trials:24 - Trial = 12111/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.828 | DEBUG    | __main__:trials:29 - Trial = 12111/30000 | Total reward = 30.59
2022-01-26 14:17:23.832 | DEBUG    | __main__:trials:24 - Trial = 12112/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.834 | DEBUG    | __main__:trials:29 - Trial = 12112/30000 | Total reward = 41.48
2022-01-26 14:17:23.838 | DEBUG    | __main__:trials:24 - Trial = 12113/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.839 | DEBUG    | __main__:trials:29 - Trial = 12113/30000 | Total reward = 30.08
2022-01-26 14:17:23.842 | DEBUG    | __main__:trials:24 - Trial = 12114/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.843 | DEBUG    | __main__:trials:29 - Trial = 12114/30000 | Total reward = 27.98
2022-01-26 14:17:23.846 | DEBUG    | __main__:trials:24 - Trial = 12115/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.848 | DEBUG    | __main__:trials:29 - Trial = 12115/30000 | Total reward = 21.26
2022-01-26 14:17:23.852 | DEBUG    | __main__:trials:24 - Trial = 12116/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.852 | DEBUG    | __main__:trials:29 - Trial = 12116/30000 | Total reward = 28.37
2022-01-26 14:17:23.856 | DEBUG    | __main__:trials:24 - Trial = 12117/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.858 | DEBUG    | __main__:trials:29 - Trial = 12117/30000 | Total reward = 34.36
2022-01-26 14:17:23.862 | DEBUG    | __main__:trials:24 - Trial = 12118/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.863 | DEBUG    | __main__:trials:29 - Trial = 12118/30000 | Total reward = 31.11
2022-01-26 14:17:23.866 | DEBUG    | __main__:trials:24 - Trial = 12119/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.868 | DEBUG    | __main__:trials:29 - Trial = 12119/30000 | Total reward = 35.72
2022-01-26 14:17:23.871 | DEBUG    | __main__:trials:24 - Trial = 12120/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.873 | DEBUG    | __main__:trials:29 - Trial = 12120/30000 | Total reward = 34.07
2022-01-26 14:17:23.876 | DEBUG    | __main__:trials:24 - Trial = 12121/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.878 | DEBUG    | __main__:trials:29 - Trial = 12121/30000 | Total reward = 31.64
2022-01-26 14:17:23.881 | DEBUG    | __main__:trials:24 - Trial = 12122/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.882 | DEBUG    | __main__:trials:29 - Trial = 12122/30000 | Total reward = 42.90
2022-01-26 14:17:23.885 | DEBUG    | __main__:trials:24 - Trial = 12123/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.887 | DEBUG    | __main__:trials:29 - Trial = 12123/30000 | Total reward = 40.18
2022-01-26 14:17:23.891 | DEBUG    | __main__:trials:24 - Trial = 12124/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.892 | DEBUG    | __main__:trials:29 - Trial = 12124/30000 | Total reward = 40.26
2022-01-26 14:17:23.895 | DEBUG    | __main__:trials:24 - Trial = 12125/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.897 | DEBUG    | __main__:trials:29 - Trial = 12125/30000 | Total reward = 29.80
2022-01-26 14:17:23.901 | DEBUG    | __main__:trials:24 - Trial = 12126/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.902 | DEBUG    | __main__:trials:29 - Trial = 12126/30000 | Total reward = 39.81
2022-01-26 14:17:23.906 | DEBUG    | __main__:trials:24 - Trial = 12127/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.907 | DEBUG    | __main__:trials:29 - Trial = 12127/30000 | Total reward = 29.81
2022-01-26 14:17:23.910 | DEBUG    | __main__:trials:24 - Trial = 12128/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.912 | DEBUG    | __main__:trials:29 - Trial = 12128/30000 | Total reward = 31.71
2022-01-26 14:17:23.915 | DEBUG    | __main__:trials:24 - Trial = 12129/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.917 | DEBUG    | __main__:trials:29 - Trial = 12129/30000 | Total reward = 31.71
2022-01-26 14:17:23.920 | DEBUG    | __main__:trials:26 - Trial = 12130/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.922 | DEBUG    | __main__:trials:29 - Trial = 12130/30000 | Total reward = 18.92
2022-01-26 14:17:23.925 | DEBUG    | __main__:trials:26 - Trial = 12131/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.927 | DEBUG    | __main__:trials:29 - Trial = 12131/30000 | Total reward = 21.14
2022-01-26 14:17:23.930 | DEBUG    | __main__:trials:24 - Trial = 12132/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.931 | DEBUG    | __main__:trials:29 - Trial = 12132/30000 | Total reward = 34.34
2022-01-26 14:17:23.934 | DEBUG    | __main__:trials:24 - Trial = 12133/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.936 | DEBUG    | __main__:trials:29 - Trial = 12133/30000 | Total reward = 41.73
2022-01-26 14:17:23.940 | DEBUG    | __main__:trials:24 - Trial = 12134/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.941 | DEBUG    | __main__:trials:29 - Trial = 12134/30000 | Total reward = 32.81
2022-01-26 14:17:23.945 | DEBUG    | __main__:trials:26 - Trial = 12135/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.946 | DEBUG    | __main__:trials:29 - Trial = 12135/30000 | Total reward = 23.08
2022-01-26 14:17:23.950 | DEBUG    | __main__:trials:24 - Trial = 12136/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.951 | DEBUG    | __main__:trials:29 - Trial = 12136/30000 | Total reward = 31.14
2022-01-26 14:17:23.955 | DEBUG    | __main__:trials:24 - Trial = 12137/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.957 | DEBUG    | __main__:trials:29 - Trial = 12137/30000 | Total reward = 23.38
2022-01-26 14:17:23.959 | DEBUG    | __main__:trials:24 - Trial = 12138/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.961 | DEBUG    | __main__:trials:29 - Trial = 12138/30000 | Total reward = 44.13
2022-01-26 14:17:23.965 | DEBUG    | __main__:trials:24 - Trial = 12139/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.967 | DEBUG    | __main__:trials:29 - Trial = 12139/30000 | Total reward = 29.91
2022-01-26 14:17:23.969 | DEBUG    | __main__:trials:24 - Trial = 12140/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.971 | DEBUG    | __main__:trials:29 - Trial = 12140/30000 | Total reward = 31.90
2022-01-26 14:17:23.975 | DEBUG    | __main__:trials:26 - Trial = 12141/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.976 | DEBUG    | __main__:trials:29 - Trial = 12141/30000 | Total reward = 14.83
2022-01-26 14:17:23.980 | DEBUG    | __main__:trials:24 - Trial = 12142/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.981 | DEBUG    | __main__:trials:29 - Trial = 12142/30000 | Total reward = 34.34
2022-01-26 14:17:23.985 | DEBUG    | __main__:trials:24 - Trial = 12143/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.986 | DEBUG    | __main__:trials:29 - Trial = 12143/30000 | Total reward = 31.36
2022-01-26 14:17:23.990 | DEBUG    | __main__:trials:24 - Trial = 12144/30000 | Max number of steps (20) reached
2022-01-26 14:17:23.991 | DEBUG    | __main__:trials:29 - Trial = 12144/30000 | Total reward = 34.76
2022-01-26 14:17:23.995 | DEBUG    | __main__:trials:26 - Trial = 12145/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:23.995 | DEBUG    | __main__:trials:29 - Trial = 12145/30000 | Total reward = 15.76
2022-01-26 14:17:24.000 | DEBUG    | __main__:trials:24 - Trial = 12146/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.000 | DEBUG    | __main__:trials:29 - Trial = 12146/30000 | Total reward = 29.91
2022-01-26 14:17:24.005 | DEBUG    | __main__:trials:24 - Trial = 12147/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.005 | DEBUG    | __main__:trials:29 - Trial = 12147/30000 | Total reward = 30.60
2022-01-26 14:17:24.011 | DEBUG    | __main__:trials:24 - Trial = 12148/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.012 | DEBUG    | __main__:trials:29 - Trial = 12148/30000 | Total reward = 31.76
2022-01-26 14:17:24.015 | DEBUG    | __main__:trials:24 - Trial = 12149/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.016 | DEBUG    | __main__:trials:29 - Trial = 12149/30000 | Total reward = 34.71
2022-01-26 14:17:24.020 | DEBUG    | __main__:trials:24 - Trial = 12150/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.022 | DEBUG    | __main__:trials:29 - Trial = 12150/30000 | Total reward = 31.75
2022-01-26 14:17:24.025 | DEBUG    | __main__:trials:24 - Trial = 12151/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.026 | DEBUG    | __main__:trials:29 - Trial = 12151/30000 | Total reward = 31.79
2022-01-26 14:17:24.031 | DEBUG    | __main__:trials:24 - Trial = 12152/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.032 | DEBUG    | __main__:trials:29 - Trial = 12152/30000 | Total reward = 30.61
2022-01-26 14:17:24.036 | DEBUG    | __main__:trials:24 - Trial = 12153/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.037 | DEBUG    | __main__:trials:29 - Trial = 12153/30000 | Total reward = 27.33
2022-01-26 14:17:24.041 | DEBUG    | __main__:trials:24 - Trial = 12154/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.043 | DEBUG    | __main__:trials:29 - Trial = 12154/30000 | Total reward = 29.23
2022-01-26 14:17:24.045 | DEBUG    | __main__:trials:24 - Trial = 12155/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.047 | DEBUG    | __main__:trials:29 - Trial = 12155/30000 | Total reward = 53.54
2022-01-26 14:17:24.051 | DEBUG    | __main__:trials:24 - Trial = 12156/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.052 | DEBUG    | __main__:trials:29 - Trial = 12156/30000 | Total reward = 43.06
2022-01-26 14:17:24.056 | DEBUG    | __main__:trials:26 - Trial = 12157/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.057 | DEBUG    | __main__:trials:29 - Trial = 12157/30000 | Total reward = 28.93
2022-01-26 14:17:24.061 | DEBUG    | __main__:trials:24 - Trial = 12158/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.062 | DEBUG    | __main__:trials:29 - Trial = 12158/30000 | Total reward = 24.67
2022-01-26 14:17:24.066 | DEBUG    | __main__:trials:24 - Trial = 12159/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.068 | DEBUG    | __main__:trials:29 - Trial = 12159/30000 | Total reward = 29.30
2022-01-26 14:17:24.071 | DEBUG    | __main__:trials:24 - Trial = 12160/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.072 | DEBUG    | __main__:trials:29 - Trial = 12160/30000 | Total reward = 40.33
2022-01-26 14:17:24.076 | DEBUG    | __main__:trials:24 - Trial = 12161/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.078 | DEBUG    | __main__:trials:29 - Trial = 12161/30000 | Total reward = 37.25
2022-01-26 14:17:24.082 | DEBUG    | __main__:trials:24 - Trial = 12162/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.083 | DEBUG    | __main__:trials:29 - Trial = 12162/30000 | Total reward = 22.07
2022-01-26 14:17:24.087 | DEBUG    | __main__:trials:24 - Trial = 12163/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.089 | DEBUG    | __main__:trials:29 - Trial = 12163/30000 | Total reward = 45.40
2022-01-26 14:17:24.094 | DEBUG    | __main__:trials:24 - Trial = 12164/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.095 | DEBUG    | __main__:trials:29 - Trial = 12164/30000 | Total reward = 37.30
2022-01-26 14:17:24.099 | DEBUG    | __main__:trials:24 - Trial = 12165/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.100 | DEBUG    | __main__:trials:29 - Trial = 12165/30000 | Total reward = 56.05
2022-01-26 14:17:24.104 | DEBUG    | __main__:trials:24 - Trial = 12166/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.106 | DEBUG    | __main__:trials:29 - Trial = 12166/30000 | Total reward = 49.55
2022-01-26 14:17:24.109 | DEBUG    | __main__:trials:24 - Trial = 12167/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.111 | DEBUG    | __main__:trials:29 - Trial = 12167/30000 | Total reward = 47.03
2022-01-26 14:17:24.115 | DEBUG    | __main__:trials:24 - Trial = 12168/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.116 | DEBUG    | __main__:trials:29 - Trial = 12168/30000 | Total reward = 51.53
2022-01-26 14:17:24.120 | DEBUG    | __main__:trials:24 - Trial = 12169/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.121 | DEBUG    | __main__:trials:29 - Trial = 12169/30000 | Total reward = 39.32
2022-01-26 14:17:24.125 | DEBUG    | __main__:trials:24 - Trial = 12170/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.127 | DEBUG    | __main__:trials:29 - Trial = 12170/30000 | Total reward = 45.17
2022-01-26 14:17:24.131 | DEBUG    | __main__:trials:24 - Trial = 12171/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.131 | DEBUG    | __main__:trials:29 - Trial = 12171/30000 | Total reward = 39.58
2022-01-26 14:17:24.135 | DEBUG    | __main__:trials:24 - Trial = 12172/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.137 | DEBUG    | __main__:trials:29 - Trial = 12172/30000 | Total reward = 49.25
2022-01-26 14:17:24.140 | DEBUG    | __main__:trials:24 - Trial = 12173/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.141 | DEBUG    | __main__:trials:29 - Trial = 12173/30000 | Total reward = 54.76
2022-01-26 14:17:24.145 | DEBUG    | __main__:trials:24 - Trial = 12174/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.146 | DEBUG    | __main__:trials:29 - Trial = 12174/30000 | Total reward = 43.19
2022-01-26 14:17:24.150 | DEBUG    | __main__:trials:24 - Trial = 12175/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.151 | DEBUG    | __main__:trials:29 - Trial = 12175/30000 | Total reward = 51.24
2022-01-26 14:17:24.154 | DEBUG    | __main__:trials:24 - Trial = 12176/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.156 | DEBUG    | __main__:trials:29 - Trial = 12176/30000 | Total reward = 30.23
2022-01-26 14:17:24.159 | DEBUG    | __main__:trials:24 - Trial = 12177/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.161 | DEBUG    | __main__:trials:29 - Trial = 12177/30000 | Total reward = 42.57
2022-01-26 14:17:24.164 | DEBUG    | __main__:trials:24 - Trial = 12178/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.165 | DEBUG    | __main__:trials:29 - Trial = 12178/30000 | Total reward = 41.51
2022-01-26 14:17:24.168 | DEBUG    | __main__:trials:24 - Trial = 12179/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.170 | DEBUG    | __main__:trials:29 - Trial = 12179/30000 | Total reward = 32.75
2022-01-26 14:17:24.174 | DEBUG    | __main__:trials:24 - Trial = 12180/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.175 | DEBUG    | __main__:trials:29 - Trial = 12180/30000 | Total reward = 53.69
2022-01-26 14:17:24.179 | DEBUG    | __main__:trials:24 - Trial = 12181/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.181 | DEBUG    | __main__:trials:29 - Trial = 12181/30000 | Total reward = 33.17
2022-01-26 14:17:24.184 | DEBUG    | __main__:trials:24 - Trial = 12182/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.186 | DEBUG    | __main__:trials:29 - Trial = 12182/30000 | Total reward = 49.62
2022-01-26 14:17:24.189 | DEBUG    | __main__:trials:24 - Trial = 12183/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.190 | DEBUG    | __main__:trials:29 - Trial = 12183/30000 | Total reward = 41.59
2022-01-26 14:17:24.194 | DEBUG    | __main__:trials:24 - Trial = 12184/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.196 | DEBUG    | __main__:trials:29 - Trial = 12184/30000 | Total reward = 57.12
2022-01-26 14:17:24.199 | DEBUG    | __main__:trials:24 - Trial = 12185/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.201 | DEBUG    | __main__:trials:29 - Trial = 12185/30000 | Total reward = 61.09
2022-01-26 14:17:24.204 | DEBUG    | __main__:trials:24 - Trial = 12186/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.205 | DEBUG    | __main__:trials:29 - Trial = 12186/30000 | Total reward = 36.76
2022-01-26 14:17:24.208 | DEBUG    | __main__:trials:24 - Trial = 12187/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.209 | DEBUG    | __main__:trials:29 - Trial = 12187/30000 | Total reward = 38.15
2022-01-26 14:17:24.213 | DEBUG    | __main__:trials:24 - Trial = 12188/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.213 | DEBUG    | __main__:trials:29 - Trial = 12188/30000 | Total reward = 45.44
2022-01-26 14:17:24.218 | DEBUG    | __main__:trials:24 - Trial = 12189/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.218 | DEBUG    | __main__:trials:29 - Trial = 12189/30000 | Total reward = 47.03
2022-01-26 14:17:24.223 | DEBUG    | __main__:trials:24 - Trial = 12190/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.224 | DEBUG    | __main__:trials:29 - Trial = 12190/30000 | Total reward = 50.69
2022-01-26 14:17:24.228 | DEBUG    | __main__:trials:24 - Trial = 12191/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.229 | DEBUG    | __main__:trials:29 - Trial = 12191/30000 | Total reward = 51.52
2022-01-26 14:17:24.234 | DEBUG    | __main__:trials:24 - Trial = 12192/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.234 | DEBUG    | __main__:trials:29 - Trial = 12192/30000 | Total reward = 41.65
2022-01-26 14:17:24.238 | DEBUG    | __main__:trials:24 - Trial = 12193/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.240 | DEBUG    | __main__:trials:29 - Trial = 12193/30000 | Total reward = 48.21
2022-01-26 14:17:24.243 | DEBUG    | __main__:trials:24 - Trial = 12194/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.244 | DEBUG    | __main__:trials:29 - Trial = 12194/30000 | Total reward = 45.37
2022-01-26 14:17:24.248 | DEBUG    | __main__:trials:24 - Trial = 12195/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.249 | DEBUG    | __main__:trials:29 - Trial = 12195/30000 | Total reward = 58.28
2022-01-26 14:17:24.252 | DEBUG    | __main__:trials:24 - Trial = 12196/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.254 | DEBUG    | __main__:trials:29 - Trial = 12196/30000 | Total reward = 57.77
2022-01-26 14:17:24.257 | DEBUG    | __main__:trials:24 - Trial = 12197/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.259 | DEBUG    | __main__:trials:29 - Trial = 12197/30000 | Total reward = 47.21
2022-01-26 14:17:24.262 | DEBUG    | __main__:trials:24 - Trial = 12198/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.263 | DEBUG    | __main__:trials:29 - Trial = 12198/30000 | Total reward = 38.14
2022-01-26 14:17:24.267 | DEBUG    | __main__:trials:24 - Trial = 12199/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.267 | DEBUG    | __main__:trials:29 - Trial = 12199/30000 | Total reward = 47.62
2022-01-26 14:17:24.271 | DEBUG    | __main__:trials:24 - Trial = 12200/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.272 | DEBUG    | __main__:trials:29 - Trial = 12200/30000 | Total reward = 66.34
2022-01-26 14:17:24.275 | DEBUG    | __main__:trials:24 - Trial = 12201/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.277 | DEBUG    | __main__:trials:29 - Trial = 12201/30000 | Total reward = 36.91
2022-01-26 14:17:24.281 | DEBUG    | __main__:trials:24 - Trial = 12202/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.282 | DEBUG    | __main__:trials:29 - Trial = 12202/30000 | Total reward = 51.88
2022-01-26 14:17:24.286 | DEBUG    | __main__:trials:24 - Trial = 12203/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.288 | DEBUG    | __main__:trials:29 - Trial = 12203/30000 | Total reward = 30.08
2022-01-26 14:17:24.291 | DEBUG    | __main__:trials:24 - Trial = 12204/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.292 | DEBUG    | __main__:trials:29 - Trial = 12204/30000 | Total reward = 37.08
2022-01-26 14:17:24.295 | DEBUG    | __main__:trials:24 - Trial = 12205/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.297 | DEBUG    | __main__:trials:29 - Trial = 12205/30000 | Total reward = 56.45
2022-01-26 14:17:24.301 | DEBUG    | __main__:trials:24 - Trial = 12206/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.302 | DEBUG    | __main__:trials:29 - Trial = 12206/30000 | Total reward = 31.01
2022-01-26 14:17:24.305 | DEBUG    | __main__:trials:24 - Trial = 12207/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.306 | DEBUG    | __main__:trials:29 - Trial = 12207/30000 | Total reward = 34.87
2022-01-26 14:17:24.309 | DEBUG    | __main__:trials:24 - Trial = 12208/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.311 | DEBUG    | __main__:trials:29 - Trial = 12208/30000 | Total reward = 16.14
2022-01-26 14:17:24.314 | DEBUG    | __main__:trials:26 - Trial = 12209/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.315 | DEBUG    | __main__:trials:29 - Trial = 12209/30000 | Total reward = 25.86
2022-01-26 14:17:24.318 | DEBUG    | __main__:trials:24 - Trial = 12210/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.320 | DEBUG    | __main__:trials:29 - Trial = 12210/30000 | Total reward = 43.19
2022-01-26 14:17:24.323 | DEBUG    | __main__:trials:24 - Trial = 12211/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.324 | DEBUG    | __main__:trials:29 - Trial = 12211/30000 | Total reward = 30.04
2022-01-26 14:17:24.327 | DEBUG    | __main__:trials:24 - Trial = 12212/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.329 | DEBUG    | __main__:trials:29 - Trial = 12212/30000 | Total reward = 43.52
2022-01-26 14:17:24.332 | DEBUG    | __main__:trials:24 - Trial = 12213/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.333 | DEBUG    | __main__:trials:29 - Trial = 12213/30000 | Total reward = 29.68
2022-01-26 14:17:24.337 | DEBUG    | __main__:trials:24 - Trial = 12214/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.338 | DEBUG    | __main__:trials:29 - Trial = 12214/30000 | Total reward = 26.72
2022-01-26 14:17:24.343 | DEBUG    | __main__:trials:24 - Trial = 12215/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.344 | DEBUG    | __main__:trials:29 - Trial = 12215/30000 | Total reward = 33.75
2022-01-26 14:17:24.348 | DEBUG    | __main__:trials:24 - Trial = 12216/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.349 | DEBUG    | __main__:trials:29 - Trial = 12216/30000 | Total reward = 32.38
2022-01-26 14:17:24.354 | DEBUG    | __main__:trials:24 - Trial = 12217/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.354 | DEBUG    | __main__:trials:29 - Trial = 12217/30000 | Total reward = 36.26
2022-01-26 14:17:24.359 | DEBUG    | __main__:trials:24 - Trial = 12218/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.360 | DEBUG    | __main__:trials:29 - Trial = 12218/30000 | Total reward = 29.85
2022-01-26 14:17:24.364 | DEBUG    | __main__:trials:24 - Trial = 12219/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.366 | DEBUG    | __main__:trials:29 - Trial = 12219/30000 | Total reward = 29.37
2022-01-26 14:17:24.369 | DEBUG    | __main__:trials:24 - Trial = 12220/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.370 | DEBUG    | __main__:trials:29 - Trial = 12220/30000 | Total reward = 30.54
2022-01-26 14:17:24.374 | DEBUG    | __main__:trials:24 - Trial = 12221/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.375 | DEBUG    | __main__:trials:29 - Trial = 12221/30000 | Total reward = 27.21
2022-01-26 14:17:24.378 | DEBUG    | __main__:trials:24 - Trial = 12222/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.379 | DEBUG    | __main__:trials:29 - Trial = 12222/30000 | Total reward = 20.65
2022-01-26 14:17:24.382 | DEBUG    | __main__:trials:24 - Trial = 12223/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.384 | DEBUG    | __main__:trials:29 - Trial = 12223/30000 | Total reward = 26.25
2022-01-26 14:17:24.388 | DEBUG    | __main__:trials:24 - Trial = 12224/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.389 | DEBUG    | __main__:trials:29 - Trial = 12224/30000 | Total reward = 30.91
2022-01-26 14:17:24.393 | DEBUG    | __main__:trials:24 - Trial = 12225/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.395 | DEBUG    | __main__:trials:29 - Trial = 12225/30000 | Total reward = 57.75
2022-01-26 14:17:24.399 | DEBUG    | __main__:trials:24 - Trial = 12226/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.400 | DEBUG    | __main__:trials:29 - Trial = 12226/30000 | Total reward = 30.14
2022-01-26 14:17:24.404 | DEBUG    | __main__:trials:24 - Trial = 12227/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.405 | DEBUG    | __main__:trials:29 - Trial = 12227/30000 | Total reward = 38.94
2022-01-26 14:17:24.409 | DEBUG    | __main__:trials:24 - Trial = 12228/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.410 | DEBUG    | __main__:trials:29 - Trial = 12228/30000 | Total reward = 33.81
2022-01-26 14:17:24.414 | DEBUG    | __main__:trials:24 - Trial = 12229/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.416 | DEBUG    | __main__:trials:29 - Trial = 12229/30000 | Total reward = 37.41
2022-01-26 14:17:24.420 | DEBUG    | __main__:trials:24 - Trial = 12230/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.421 | DEBUG    | __main__:trials:29 - Trial = 12230/30000 | Total reward = 34.69
2022-01-26 14:17:24.425 | DEBUG    | __main__:trials:24 - Trial = 12231/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.427 | DEBUG    | __main__:trials:29 - Trial = 12231/30000 | Total reward = 38.12
2022-01-26 14:17:24.431 | DEBUG    | __main__:trials:24 - Trial = 12232/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.431 | DEBUG    | __main__:trials:29 - Trial = 12232/30000 | Total reward = 29.91
2022-01-26 14:17:24.436 | DEBUG    | __main__:trials:24 - Trial = 12233/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.436 | DEBUG    | __main__:trials:29 - Trial = 12233/30000 | Total reward = 35.48
2022-01-26 14:17:24.440 | DEBUG    | __main__:trials:24 - Trial = 12234/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.442 | DEBUG    | __main__:trials:29 - Trial = 12234/30000 | Total reward = 31.82
2022-01-26 14:17:24.446 | DEBUG    | __main__:trials:24 - Trial = 12235/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.446 | DEBUG    | __main__:trials:29 - Trial = 12235/30000 | Total reward = 26.20
2022-01-26 14:17:24.449 | DEBUG    | __main__:trials:26 - Trial = 12236/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.451 | DEBUG    | __main__:trials:29 - Trial = 12236/30000 | Total reward = 16.42
2022-01-26 14:17:24.454 | DEBUG    | __main__:trials:24 - Trial = 12237/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.455 | DEBUG    | __main__:trials:29 - Trial = 12237/30000 | Total reward = 25.21
2022-01-26 14:17:24.458 | DEBUG    | __main__:trials:26 - Trial = 12238/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.460 | DEBUG    | __main__:trials:29 - Trial = 12238/30000 | Total reward = 13.20
2022-01-26 14:17:24.463 | DEBUG    | __main__:trials:24 - Trial = 12239/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.465 | DEBUG    | __main__:trials:29 - Trial = 12239/30000 | Total reward = 29.14
2022-01-26 14:17:24.468 | DEBUG    | __main__:trials:24 - Trial = 12240/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.470 | DEBUG    | __main__:trials:29 - Trial = 12240/30000 | Total reward = 32.01
2022-01-26 14:17:24.473 | DEBUG    | __main__:trials:24 - Trial = 12241/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.473 | DEBUG    | __main__:trials:29 - Trial = 12241/30000 | Total reward = 25.87
2022-01-26 14:17:24.478 | DEBUG    | __main__:trials:24 - Trial = 12242/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.478 | DEBUG    | __main__:trials:29 - Trial = 12242/30000 | Total reward = 26.58
2022-01-26 14:17:24.483 | DEBUG    | __main__:trials:24 - Trial = 12243/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.483 | DEBUG    | __main__:trials:29 - Trial = 12243/30000 | Total reward = 36.76
2022-01-26 14:17:24.488 | DEBUG    | __main__:trials:24 - Trial = 12244/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.490 | DEBUG    | __main__:trials:29 - Trial = 12244/30000 | Total reward = 31.82
2022-01-26 14:17:24.493 | DEBUG    | __main__:trials:24 - Trial = 12245/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.495 | DEBUG    | __main__:trials:29 - Trial = 12245/30000 | Total reward = 27.68
2022-01-26 14:17:24.498 | DEBUG    | __main__:trials:24 - Trial = 12246/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.500 | DEBUG    | __main__:trials:29 - Trial = 12246/30000 | Total reward = 44.81
2022-01-26 14:17:24.503 | DEBUG    | __main__:trials:24 - Trial = 12247/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.505 | DEBUG    | __main__:trials:29 - Trial = 12247/30000 | Total reward = 34.03
2022-01-26 14:17:24.508 | DEBUG    | __main__:trials:24 - Trial = 12248/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.509 | DEBUG    | __main__:trials:29 - Trial = 12248/30000 | Total reward = 29.91
2022-01-26 14:17:24.513 | DEBUG    | __main__:trials:24 - Trial = 12249/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.514 | DEBUG    | __main__:trials:29 - Trial = 12249/30000 | Total reward = 31.48
2022-01-26 14:17:24.518 | DEBUG    | __main__:trials:24 - Trial = 12250/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.519 | DEBUG    | __main__:trials:29 - Trial = 12250/30000 | Total reward = 39.52
2022-01-26 14:17:24.523 | DEBUG    | __main__:trials:26 - Trial = 12251/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.524 | DEBUG    | __main__:trials:29 - Trial = 12251/30000 | Total reward = 16.58
2022-01-26 14:17:24.528 | DEBUG    | __main__:trials:24 - Trial = 12252/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.529 | DEBUG    | __main__:trials:29 - Trial = 12252/30000 | Total reward = 44.52
2022-01-26 14:17:24.533 | DEBUG    | __main__:trials:24 - Trial = 12253/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.535 | DEBUG    | __main__:trials:29 - Trial = 12253/30000 | Total reward = 41.18
2022-01-26 14:17:24.539 | DEBUG    | __main__:trials:24 - Trial = 12254/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.540 | DEBUG    | __main__:trials:29 - Trial = 12254/30000 | Total reward = 41.51
2022-01-26 14:17:24.544 | DEBUG    | __main__:trials:24 - Trial = 12255/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.545 | DEBUG    | __main__:trials:29 - Trial = 12255/30000 | Total reward = 33.49
2022-01-26 14:17:24.550 | DEBUG    | __main__:trials:24 - Trial = 12256/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.550 | DEBUG    | __main__:trials:29 - Trial = 12256/30000 | Total reward = 43.77
2022-01-26 14:17:24.555 | DEBUG    | __main__:trials:24 - Trial = 12257/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.556 | DEBUG    | __main__:trials:29 - Trial = 12257/30000 | Total reward = 31.92
2022-01-26 14:17:24.560 | DEBUG    | __main__:trials:24 - Trial = 12258/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.562 | DEBUG    | __main__:trials:29 - Trial = 12258/30000 | Total reward = 28.03
2022-01-26 14:17:24.565 | DEBUG    | __main__:trials:24 - Trial = 12259/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.567 | DEBUG    | __main__:trials:29 - Trial = 12259/30000 | Total reward = 32.12
2022-01-26 14:17:24.571 | DEBUG    | __main__:trials:24 - Trial = 12260/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.572 | DEBUG    | __main__:trials:29 - Trial = 12260/30000 | Total reward = 31.46
2022-01-26 14:17:24.576 | DEBUG    | __main__:trials:24 - Trial = 12261/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.578 | DEBUG    | __main__:trials:29 - Trial = 12261/30000 | Total reward = 37.96
2022-01-26 14:17:24.580 | DEBUG    | __main__:trials:24 - Trial = 12262/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.582 | DEBUG    | __main__:trials:29 - Trial = 12262/30000 | Total reward = 34.56
2022-01-26 14:17:24.585 | DEBUG    | __main__:trials:24 - Trial = 12263/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.587 | DEBUG    | __main__:trials:29 - Trial = 12263/30000 | Total reward = 43.51
2022-01-26 14:17:24.591 | DEBUG    | __main__:trials:24 - Trial = 12264/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.592 | DEBUG    | __main__:trials:29 - Trial = 12264/30000 | Total reward = 35.70
2022-01-26 14:17:24.596 | DEBUG    | __main__:trials:24 - Trial = 12265/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.598 | DEBUG    | __main__:trials:29 - Trial = 12265/30000 | Total reward = 30.18
2022-01-26 14:17:24.601 | DEBUG    | __main__:trials:24 - Trial = 12266/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.603 | DEBUG    | __main__:trials:29 - Trial = 12266/30000 | Total reward = 33.09
2022-01-26 14:17:24.607 | DEBUG    | __main__:trials:24 - Trial = 12267/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.608 | DEBUG    | __main__:trials:29 - Trial = 12267/30000 | Total reward = 31.42
2022-01-26 14:17:24.612 | DEBUG    | __main__:trials:24 - Trial = 12268/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.613 | DEBUG    | __main__:trials:29 - Trial = 12268/30000 | Total reward = 33.67
2022-01-26 14:17:24.616 | DEBUG    | __main__:trials:24 - Trial = 12269/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.618 | DEBUG    | __main__:trials:29 - Trial = 12269/30000 | Total reward = 37.79
2022-01-26 14:17:24.622 | DEBUG    | __main__:trials:24 - Trial = 12270/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.622 | DEBUG    | __main__:trials:29 - Trial = 12270/30000 | Total reward = 32.83
2022-01-26 14:17:24.627 | DEBUG    | __main__:trials:24 - Trial = 12271/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.628 | DEBUG    | __main__:trials:29 - Trial = 12271/30000 | Total reward = 31.79
2022-01-26 14:17:24.631 | DEBUG    | __main__:trials:24 - Trial = 12272/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.633 | DEBUG    | __main__:trials:29 - Trial = 12272/30000 | Total reward = 33.37
2022-01-26 14:17:24.637 | DEBUG    | __main__:trials:24 - Trial = 12273/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.637 | DEBUG    | __main__:trials:29 - Trial = 12273/30000 | Total reward = 40.10
2022-01-26 14:17:24.641 | DEBUG    | __main__:trials:24 - Trial = 12274/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.642 | DEBUG    | __main__:trials:29 - Trial = 12274/30000 | Total reward = 29.95
2022-01-26 14:17:24.646 | DEBUG    | __main__:trials:24 - Trial = 12275/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.647 | DEBUG    | __main__:trials:29 - Trial = 12275/30000 | Total reward = 40.20
2022-01-26 14:17:24.651 | DEBUG    | __main__:trials:24 - Trial = 12276/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.653 | DEBUG    | __main__:trials:29 - Trial = 12276/30000 | Total reward = 31.29
2022-01-26 14:17:24.656 | DEBUG    | __main__:trials:26 - Trial = 12277/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.658 | DEBUG    | __main__:trials:29 - Trial = 12277/30000 | Total reward = 23.61
2022-01-26 14:17:24.662 | DEBUG    | __main__:trials:24 - Trial = 12278/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.663 | DEBUG    | __main__:trials:29 - Trial = 12278/30000 | Total reward = 26.20
2022-01-26 14:17:24.667 | DEBUG    | __main__:trials:24 - Trial = 12279/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.668 | DEBUG    | __main__:trials:29 - Trial = 12279/30000 | Total reward = 27.78
2022-01-26 14:17:24.672 | DEBUG    | __main__:trials:24 - Trial = 12280/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.674 | DEBUG    | __main__:trials:29 - Trial = 12280/30000 | Total reward = 28.61
2022-01-26 14:17:24.677 | DEBUG    | __main__:trials:24 - Trial = 12281/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.679 | DEBUG    | __main__:trials:29 - Trial = 12281/30000 | Total reward = 27.29
2022-01-26 14:17:24.681 | DEBUG    | __main__:trials:26 - Trial = 12282/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.682 | DEBUG    | __main__:trials:29 - Trial = 12282/30000 | Total reward = 8.00
2022-01-26 14:17:24.686 | DEBUG    | __main__:trials:24 - Trial = 12283/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.687 | DEBUG    | __main__:trials:29 - Trial = 12283/30000 | Total reward = 33.03
2022-01-26 14:17:24.691 | DEBUG    | __main__:trials:24 - Trial = 12284/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.693 | DEBUG    | __main__:trials:29 - Trial = 12284/30000 | Total reward = 31.38
2022-01-26 14:17:24.697 | DEBUG    | __main__:trials:24 - Trial = 12285/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.699 | DEBUG    | __main__:trials:29 - Trial = 12285/30000 | Total reward = 47.84
2022-01-26 14:17:24.703 | DEBUG    | __main__:trials:24 - Trial = 12286/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.703 | DEBUG    | __main__:trials:29 - Trial = 12286/30000 | Total reward = 31.87
2022-01-26 14:17:24.708 | DEBUG    | __main__:trials:24 - Trial = 12287/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.710 | DEBUG    | __main__:trials:29 - Trial = 12287/30000 | Total reward = 29.68
2022-01-26 14:17:24.713 | DEBUG    | __main__:trials:24 - Trial = 12288/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.714 | DEBUG    | __main__:trials:29 - Trial = 12288/30000 | Total reward = 29.97
2022-01-26 14:17:24.717 | DEBUG    | __main__:trials:24 - Trial = 12289/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.719 | DEBUG    | __main__:trials:29 - Trial = 12289/30000 | Total reward = 37.50
2022-01-26 14:17:24.722 | DEBUG    | __main__:trials:24 - Trial = 12290/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.723 | DEBUG    | __main__:trials:29 - Trial = 12290/30000 | Total reward = 30.39
2022-01-26 14:17:24.727 | DEBUG    | __main__:trials:24 - Trial = 12291/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.727 | DEBUG    | __main__:trials:29 - Trial = 12291/30000 | Total reward = 44.92
2022-01-26 14:17:24.731 | DEBUG    | __main__:trials:24 - Trial = 12292/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.732 | DEBUG    | __main__:trials:29 - Trial = 12292/30000 | Total reward = 32.19
2022-01-26 14:17:24.735 | DEBUG    | __main__:trials:24 - Trial = 12293/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.736 | DEBUG    | __main__:trials:29 - Trial = 12293/30000 | Total reward = 32.48
2022-01-26 14:17:24.739 | DEBUG    | __main__:trials:24 - Trial = 12294/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.741 | DEBUG    | __main__:trials:29 - Trial = 12294/30000 | Total reward = 55.81
2022-01-26 14:17:24.742 | DEBUG    | __main__:trials:26 - Trial = 12295/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.744 | DEBUG    | __main__:trials:29 - Trial = 12295/30000 | Total reward = 10.03
2022-01-26 14:17:24.747 | DEBUG    | __main__:trials:24 - Trial = 12296/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.748 | DEBUG    | __main__:trials:29 - Trial = 12296/30000 | Total reward = 45.57
2022-01-26 14:17:24.752 | DEBUG    | __main__:trials:24 - Trial = 12297/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.753 | DEBUG    | __main__:trials:29 - Trial = 12297/30000 | Total reward = 41.78
2022-01-26 14:17:24.757 | DEBUG    | __main__:trials:26 - Trial = 12298/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.758 | DEBUG    | __main__:trials:29 - Trial = 12298/30000 | Total reward = 18.59
2022-01-26 14:17:24.761 | DEBUG    | __main__:trials:24 - Trial = 12299/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.762 | DEBUG    | __main__:trials:29 - Trial = 12299/30000 | Total reward = 26.90
2022-01-26 14:17:24.767 | DEBUG    | __main__:trials:24 - Trial = 12300/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.769 | DEBUG    | __main__:trials:29 - Trial = 12300/30000 | Total reward = 31.92
2022-01-26 14:17:24.773 | DEBUG    | __main__:trials:24 - Trial = 12301/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.775 | DEBUG    | __main__:trials:29 - Trial = 12301/30000 | Total reward = 29.91
2022-01-26 14:17:24.779 | DEBUG    | __main__:trials:24 - Trial = 12302/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.780 | DEBUG    | __main__:trials:29 - Trial = 12302/30000 | Total reward = 26.50
2022-01-26 14:17:24.784 | DEBUG    | __main__:trials:24 - Trial = 12303/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.785 | DEBUG    | __main__:trials:29 - Trial = 12303/30000 | Total reward = 31.10
2022-01-26 14:17:24.788 | DEBUG    | __main__:trials:24 - Trial = 12304/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.790 | DEBUG    | __main__:trials:29 - Trial = 12304/30000 | Total reward = 14.74
2022-01-26 14:17:24.793 | DEBUG    | __main__:trials:26 - Trial = 12305/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.794 | DEBUG    | __main__:trials:29 - Trial = 12305/30000 | Total reward = 13.69
2022-01-26 14:17:24.798 | DEBUG    | __main__:trials:24 - Trial = 12306/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.799 | DEBUG    | __main__:trials:29 - Trial = 12306/30000 | Total reward = 30.29
2022-01-26 14:17:24.803 | DEBUG    | __main__:trials:24 - Trial = 12307/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.804 | DEBUG    | __main__:trials:29 - Trial = 12307/30000 | Total reward = 38.27
2022-01-26 14:17:24.808 | DEBUG    | __main__:trials:24 - Trial = 12308/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.809 | DEBUG    | __main__:trials:29 - Trial = 12308/30000 | Total reward = 36.76
2022-01-26 14:17:24.813 | DEBUG    | __main__:trials:24 - Trial = 12309/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.814 | DEBUG    | __main__:trials:29 - Trial = 12309/30000 | Total reward = 40.92
2022-01-26 14:17:24.818 | DEBUG    | __main__:trials:24 - Trial = 12310/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.819 | DEBUG    | __main__:trials:29 - Trial = 12310/30000 | Total reward = 32.22
2022-01-26 14:17:24.822 | DEBUG    | __main__:trials:24 - Trial = 12311/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.824 | DEBUG    | __main__:trials:29 - Trial = 12311/30000 | Total reward = 44.22
2022-01-26 14:17:24.827 | DEBUG    | __main__:trials:24 - Trial = 12312/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.828 | DEBUG    | __main__:trials:29 - Trial = 12312/30000 | Total reward = 32.14
2022-01-26 14:17:24.832 | DEBUG    | __main__:trials:24 - Trial = 12313/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.834 | DEBUG    | __main__:trials:29 - Trial = 12313/30000 | Total reward = 29.91
2022-01-26 14:17:24.837 | DEBUG    | __main__:trials:24 - Trial = 12314/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.838 | DEBUG    | __main__:trials:29 - Trial = 12314/30000 | Total reward = 30.27
2022-01-26 14:17:24.841 | DEBUG    | __main__:trials:24 - Trial = 12315/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.843 | DEBUG    | __main__:trials:29 - Trial = 12315/30000 | Total reward = 31.93
2022-01-26 14:17:24.847 | DEBUG    | __main__:trials:24 - Trial = 12316/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.848 | DEBUG    | __main__:trials:29 - Trial = 12316/30000 | Total reward = 34.65
2022-01-26 14:17:24.852 | DEBUG    | __main__:trials:24 - Trial = 12317/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.853 | DEBUG    | __main__:trials:29 - Trial = 12317/30000 | Total reward = 41.78
2022-01-26 14:17:24.857 | DEBUG    | __main__:trials:24 - Trial = 12318/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.859 | DEBUG    | __main__:trials:29 - Trial = 12318/30000 | Total reward = 18.76
2022-01-26 14:17:24.863 | DEBUG    | __main__:trials:24 - Trial = 12319/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.864 | DEBUG    | __main__:trials:29 - Trial = 12319/30000 | Total reward = 35.70
2022-01-26 14:17:24.868 | DEBUG    | __main__:trials:24 - Trial = 12320/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.869 | DEBUG    | __main__:trials:29 - Trial = 12320/30000 | Total reward = 38.89
2022-01-26 14:17:24.872 | DEBUG    | __main__:trials:24 - Trial = 12321/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.874 | DEBUG    | __main__:trials:29 - Trial = 12321/30000 | Total reward = 54.59
2022-01-26 14:17:24.878 | DEBUG    | __main__:trials:24 - Trial = 12322/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.879 | DEBUG    | __main__:trials:29 - Trial = 12322/30000 | Total reward = 42.63
2022-01-26 14:17:24.883 | DEBUG    | __main__:trials:24 - Trial = 12323/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.884 | DEBUG    | __main__:trials:29 - Trial = 12323/30000 | Total reward = 42.99
2022-01-26 14:17:24.888 | DEBUG    | __main__:trials:24 - Trial = 12324/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.889 | DEBUG    | __main__:trials:29 - Trial = 12324/30000 | Total reward = 41.34
2022-01-26 14:17:24.893 | DEBUG    | __main__:trials:24 - Trial = 12325/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.894 | DEBUG    | __main__:trials:29 - Trial = 12325/30000 | Total reward = 29.91
2022-01-26 14:17:24.898 | DEBUG    | __main__:trials:24 - Trial = 12326/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.900 | DEBUG    | __main__:trials:29 - Trial = 12326/30000 | Total reward = 41.10
2022-01-26 14:17:24.904 | DEBUG    | __main__:trials:24 - Trial = 12327/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.904 | DEBUG    | __main__:trials:29 - Trial = 12327/30000 | Total reward = 32.36
2022-01-26 14:17:24.908 | DEBUG    | __main__:trials:24 - Trial = 12328/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.910 | DEBUG    | __main__:trials:29 - Trial = 12328/30000 | Total reward = 50.23
2022-01-26 14:17:24.914 | DEBUG    | __main__:trials:24 - Trial = 12329/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.915 | DEBUG    | __main__:trials:29 - Trial = 12329/30000 | Total reward = 29.89
2022-01-26 14:17:24.918 | DEBUG    | __main__:trials:24 - Trial = 12330/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.920 | DEBUG    | __main__:trials:29 - Trial = 12330/30000 | Total reward = 28.87
2022-01-26 14:17:24.924 | DEBUG    | __main__:trials:26 - Trial = 12331/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.925 | DEBUG    | __main__:trials:29 - Trial = 12331/30000 | Total reward = 21.94
2022-01-26 14:17:24.928 | DEBUG    | __main__:trials:26 - Trial = 12332/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:24.930 | DEBUG    | __main__:trials:29 - Trial = 12332/30000 | Total reward = 16.08
2022-01-26 14:17:24.933 | DEBUG    | __main__:trials:24 - Trial = 12333/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.935 | DEBUG    | __main__:trials:29 - Trial = 12333/30000 | Total reward = 32.55
2022-01-26 14:17:24.939 | DEBUG    | __main__:trials:24 - Trial = 12334/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.940 | DEBUG    | __main__:trials:29 - Trial = 12334/30000 | Total reward = 47.03
2022-01-26 14:17:24.944 | DEBUG    | __main__:trials:24 - Trial = 12335/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.945 | DEBUG    | __main__:trials:29 - Trial = 12335/30000 | Total reward = 29.79
2022-01-26 14:17:24.948 | DEBUG    | __main__:trials:24 - Trial = 12336/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.950 | DEBUG    | __main__:trials:29 - Trial = 12336/30000 | Total reward = 29.95
2022-01-26 14:17:24.953 | DEBUG    | __main__:trials:24 - Trial = 12337/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.955 | DEBUG    | __main__:trials:29 - Trial = 12337/30000 | Total reward = 35.87
2022-01-26 14:17:24.957 | DEBUG    | __main__:trials:24 - Trial = 12338/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.958 | DEBUG    | __main__:trials:29 - Trial = 12338/30000 | Total reward = 34.16
2022-01-26 14:17:24.962 | DEBUG    | __main__:trials:24 - Trial = 12339/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.963 | DEBUG    | __main__:trials:29 - Trial = 12339/30000 | Total reward = 31.10
2022-01-26 14:17:24.967 | DEBUG    | __main__:trials:24 - Trial = 12340/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.969 | DEBUG    | __main__:trials:29 - Trial = 12340/30000 | Total reward = 43.29
2022-01-26 14:17:24.972 | DEBUG    | __main__:trials:24 - Trial = 12341/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.974 | DEBUG    | __main__:trials:29 - Trial = 12341/30000 | Total reward = 35.06
2022-01-26 14:17:24.977 | DEBUG    | __main__:trials:24 - Trial = 12342/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.978 | DEBUG    | __main__:trials:29 - Trial = 12342/30000 | Total reward = 26.87
2022-01-26 14:17:24.982 | DEBUG    | __main__:trials:24 - Trial = 12343/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.983 | DEBUG    | __main__:trials:29 - Trial = 12343/30000 | Total reward = 45.22
2022-01-26 14:17:24.987 | DEBUG    | __main__:trials:24 - Trial = 12344/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.988 | DEBUG    | __main__:trials:29 - Trial = 12344/30000 | Total reward = 25.20
2022-01-26 14:17:24.991 | DEBUG    | __main__:trials:24 - Trial = 12345/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.993 | DEBUG    | __main__:trials:29 - Trial = 12345/30000 | Total reward = 29.91
2022-01-26 14:17:24.997 | DEBUG    | __main__:trials:24 - Trial = 12346/30000 | Max number of steps (20) reached
2022-01-26 14:17:24.998 | DEBUG    | __main__:trials:29 - Trial = 12346/30000 | Total reward = 36.49
2022-01-26 14:17:25.001 | DEBUG    | __main__:trials:24 - Trial = 12347/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.003 | DEBUG    | __main__:trials:29 - Trial = 12347/30000 | Total reward = 29.50
2022-01-26 14:17:25.007 | DEBUG    | __main__:trials:24 - Trial = 12348/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.008 | DEBUG    | __main__:trials:29 - Trial = 12348/30000 | Total reward = 32.98
2022-01-26 14:17:25.011 | DEBUG    | __main__:trials:24 - Trial = 12349/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.013 | DEBUG    | __main__:trials:29 - Trial = 12349/30000 | Total reward = 29.86
2022-01-26 14:17:25.016 | DEBUG    | __main__:trials:24 - Trial = 12350/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.018 | DEBUG    | __main__:trials:29 - Trial = 12350/30000 | Total reward = 30.67
2022-01-26 14:17:25.021 | DEBUG    | __main__:trials:24 - Trial = 12351/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.023 | DEBUG    | __main__:trials:29 - Trial = 12351/30000 | Total reward = 30.44
2022-01-26 14:17:25.027 | DEBUG    | __main__:trials:24 - Trial = 12352/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.027 | DEBUG    | __main__:trials:29 - Trial = 12352/30000 | Total reward = 33.05
2022-01-26 14:17:25.031 | DEBUG    | __main__:trials:24 - Trial = 12353/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.033 | DEBUG    | __main__:trials:29 - Trial = 12353/30000 | Total reward = 32.20
2022-01-26 14:17:25.037 | DEBUG    | __main__:trials:24 - Trial = 12354/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.038 | DEBUG    | __main__:trials:29 - Trial = 12354/30000 | Total reward = 41.22
2022-01-26 14:17:25.042 | DEBUG    | __main__:trials:24 - Trial = 12355/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.042 | DEBUG    | __main__:trials:29 - Trial = 12355/30000 | Total reward = 31.17
2022-01-26 14:17:25.046 | DEBUG    | __main__:trials:24 - Trial = 12356/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.047 | DEBUG    | __main__:trials:29 - Trial = 12356/30000 | Total reward = 34.97
2022-01-26 14:17:25.051 | DEBUG    | __main__:trials:24 - Trial = 12357/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.052 | DEBUG    | __main__:trials:29 - Trial = 12357/30000 | Total reward = 30.58
2022-01-26 14:17:25.056 | DEBUG    | __main__:trials:24 - Trial = 12358/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.057 | DEBUG    | __main__:trials:29 - Trial = 12358/30000 | Total reward = 38.03
2022-01-26 14:17:25.062 | DEBUG    | __main__:trials:24 - Trial = 12359/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.062 | DEBUG    | __main__:trials:29 - Trial = 12359/30000 | Total reward = 29.41
2022-01-26 14:17:25.066 | DEBUG    | __main__:trials:24 - Trial = 12360/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.068 | DEBUG    | __main__:trials:29 - Trial = 12360/30000 | Total reward = 40.75
2022-01-26 14:17:25.071 | DEBUG    | __main__:trials:26 - Trial = 12361/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.073 | DEBUG    | __main__:trials:29 - Trial = 12361/30000 | Total reward = 12.71
2022-01-26 14:17:25.076 | DEBUG    | __main__:trials:24 - Trial = 12362/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.077 | DEBUG    | __main__:trials:29 - Trial = 12362/30000 | Total reward = 34.51
2022-01-26 14:17:25.081 | DEBUG    | __main__:trials:24 - Trial = 12363/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.082 | DEBUG    | __main__:trials:29 - Trial = 12363/30000 | Total reward = 29.15
2022-01-26 14:17:25.085 | DEBUG    | __main__:trials:24 - Trial = 12364/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.086 | DEBUG    | __main__:trials:29 - Trial = 12364/30000 | Total reward = 36.34
2022-01-26 14:17:25.089 | DEBUG    | __main__:trials:24 - Trial = 12365/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.091 | DEBUG    | __main__:trials:29 - Trial = 12365/30000 | Total reward = 41.14
2022-01-26 14:17:25.093 | DEBUG    | __main__:trials:26 - Trial = 12366/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.095 | DEBUG    | __main__:trials:29 - Trial = 12366/30000 | Total reward = 18.35
2022-01-26 14:17:25.097 | DEBUG    | __main__:trials:24 - Trial = 12367/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.099 | DEBUG    | __main__:trials:29 - Trial = 12367/30000 | Total reward = 36.70
2022-01-26 14:17:25.102 | DEBUG    | __main__:trials:24 - Trial = 12368/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.104 | DEBUG    | __main__:trials:29 - Trial = 12368/30000 | Total reward = 25.58
2022-01-26 14:17:25.107 | DEBUG    | __main__:trials:24 - Trial = 12369/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.108 | DEBUG    | __main__:trials:29 - Trial = 12369/30000 | Total reward = 30.85
2022-01-26 14:17:25.111 | DEBUG    | __main__:trials:24 - Trial = 12370/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.113 | DEBUG    | __main__:trials:29 - Trial = 12370/30000 | Total reward = 30.50
2022-01-26 14:17:25.117 | DEBUG    | __main__:trials:24 - Trial = 12371/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.118 | DEBUG    | __main__:trials:29 - Trial = 12371/30000 | Total reward = 51.20
2022-01-26 14:17:25.122 | DEBUG    | __main__:trials:24 - Trial = 12372/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.123 | DEBUG    | __main__:trials:29 - Trial = 12372/30000 | Total reward = 30.10
2022-01-26 14:17:25.127 | DEBUG    | __main__:trials:24 - Trial = 12373/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.129 | DEBUG    | __main__:trials:29 - Trial = 12373/30000 | Total reward = 33.91
2022-01-26 14:17:25.132 | DEBUG    | __main__:trials:24 - Trial = 12374/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.134 | DEBUG    | __main__:trials:29 - Trial = 12374/30000 | Total reward = 47.62
2022-01-26 14:17:25.137 | DEBUG    | __main__:trials:24 - Trial = 12375/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.138 | DEBUG    | __main__:trials:29 - Trial = 12375/30000 | Total reward = 59.44
2022-01-26 14:17:25.143 | DEBUG    | __main__:trials:24 - Trial = 12376/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.144 | DEBUG    | __main__:trials:29 - Trial = 12376/30000 | Total reward = 13.55
2022-01-26 14:17:25.148 | DEBUG    | __main__:trials:24 - Trial = 12377/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.149 | DEBUG    | __main__:trials:29 - Trial = 12377/30000 | Total reward = 57.96
2022-01-26 14:17:25.152 | DEBUG    | __main__:trials:24 - Trial = 12378/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.154 | DEBUG    | __main__:trials:29 - Trial = 12378/30000 | Total reward = 47.03
2022-01-26 14:17:25.157 | DEBUG    | __main__:trials:24 - Trial = 12379/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.158 | DEBUG    | __main__:trials:29 - Trial = 12379/30000 | Total reward = 38.93
2022-01-26 14:17:25.161 | DEBUG    | __main__:trials:24 - Trial = 12380/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.162 | DEBUG    | __main__:trials:29 - Trial = 12380/30000 | Total reward = 44.92
2022-01-26 14:17:25.166 | DEBUG    | __main__:trials:24 - Trial = 12381/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.166 | DEBUG    | __main__:trials:29 - Trial = 12381/30000 | Total reward = 36.78
2022-01-26 14:17:25.170 | DEBUG    | __main__:trials:24 - Trial = 12382/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.172 | DEBUG    | __main__:trials:29 - Trial = 12382/30000 | Total reward = 43.91
2022-01-26 14:17:25.176 | DEBUG    | __main__:trials:24 - Trial = 12383/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.177 | DEBUG    | __main__:trials:29 - Trial = 12383/30000 | Total reward = 35.19
2022-01-26 14:17:25.181 | DEBUG    | __main__:trials:24 - Trial = 12384/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.181 | DEBUG    | __main__:trials:29 - Trial = 12384/30000 | Total reward = 41.54
2022-01-26 14:17:25.186 | DEBUG    | __main__:trials:24 - Trial = 12385/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.187 | DEBUG    | __main__:trials:29 - Trial = 12385/30000 | Total reward = 51.87
2022-01-26 14:17:25.190 | DEBUG    | __main__:trials:24 - Trial = 12386/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.192 | DEBUG    | __main__:trials:29 - Trial = 12386/30000 | Total reward = 53.03
2022-01-26 14:17:25.196 | DEBUG    | __main__:trials:24 - Trial = 12387/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.197 | DEBUG    | __main__:trials:29 - Trial = 12387/30000 | Total reward = 51.76
2022-01-26 14:17:25.201 | DEBUG    | __main__:trials:24 - Trial = 12388/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.203 | DEBUG    | __main__:trials:29 - Trial = 12388/30000 | Total reward = 47.03
2022-01-26 14:17:25.206 | DEBUG    | __main__:trials:24 - Trial = 12389/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.207 | DEBUG    | __main__:trials:29 - Trial = 12389/30000 | Total reward = 33.47
2022-01-26 14:17:25.212 | DEBUG    | __main__:trials:24 - Trial = 12390/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.212 | DEBUG    | __main__:trials:29 - Trial = 12390/30000 | Total reward = 42.05
2022-01-26 14:17:25.216 | DEBUG    | __main__:trials:24 - Trial = 12391/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.217 | DEBUG    | __main__:trials:29 - Trial = 12391/30000 | Total reward = 36.85
2022-01-26 14:17:25.221 | DEBUG    | __main__:trials:26 - Trial = 12392/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.222 | DEBUG    | __main__:trials:29 - Trial = 12392/30000 | Total reward = 34.23
2022-01-26 14:17:25.226 | DEBUG    | __main__:trials:24 - Trial = 12393/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.227 | DEBUG    | __main__:trials:29 - Trial = 12393/30000 | Total reward = 47.62
2022-01-26 14:17:25.231 | DEBUG    | __main__:trials:24 - Trial = 12394/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.231 | DEBUG    | __main__:trials:29 - Trial = 12394/30000 | Total reward = 40.91
2022-01-26 14:17:25.235 | DEBUG    | __main__:trials:24 - Trial = 12395/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.237 | DEBUG    | __main__:trials:29 - Trial = 12395/30000 | Total reward = 48.03
2022-01-26 14:17:25.241 | DEBUG    | __main__:trials:24 - Trial = 12396/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.242 | DEBUG    | __main__:trials:29 - Trial = 12396/30000 | Total reward = 37.44
2022-01-26 14:17:25.246 | DEBUG    | __main__:trials:24 - Trial = 12397/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.248 | DEBUG    | __main__:trials:29 - Trial = 12397/30000 | Total reward = 46.07
2022-01-26 14:17:25.252 | DEBUG    | __main__:trials:24 - Trial = 12398/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.253 | DEBUG    | __main__:trials:29 - Trial = 12398/30000 | Total reward = 51.53
2022-01-26 14:17:25.257 | DEBUG    | __main__:trials:24 - Trial = 12399/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.258 | DEBUG    | __main__:trials:29 - Trial = 12399/30000 | Total reward = 25.33
2022-01-26 14:17:25.261 | DEBUG    | __main__:trials:24 - Trial = 12400/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.263 | DEBUG    | __main__:trials:29 - Trial = 12400/30000 | Total reward = 56.86
2022-01-26 14:17:25.265 | DEBUG    | __main__:trials:24 - Trial = 12401/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.267 | DEBUG    | __main__:trials:29 - Trial = 12401/30000 | Total reward = 31.29
2022-01-26 14:17:25.271 | DEBUG    | __main__:trials:24 - Trial = 12402/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.273 | DEBUG    | __main__:trials:29 - Trial = 12402/30000 | Total reward = 36.82
2022-01-26 14:17:25.276 | DEBUG    | __main__:trials:24 - Trial = 12403/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.278 | DEBUG    | __main__:trials:29 - Trial = 12403/30000 | Total reward = 44.38
2022-01-26 14:17:25.282 | DEBUG    | __main__:trials:24 - Trial = 12404/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.284 | DEBUG    | __main__:trials:29 - Trial = 12404/30000 | Total reward = 62.18
2022-01-26 14:17:25.288 | DEBUG    | __main__:trials:24 - Trial = 12405/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.289 | DEBUG    | __main__:trials:29 - Trial = 12405/30000 | Total reward = 42.06
2022-01-26 14:17:25.293 | DEBUG    | __main__:trials:24 - Trial = 12406/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.294 | DEBUG    | __main__:trials:29 - Trial = 12406/30000 | Total reward = 47.93
2022-01-26 14:17:25.298 | DEBUG    | __main__:trials:24 - Trial = 12407/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.300 | DEBUG    | __main__:trials:29 - Trial = 12407/30000 | Total reward = 48.21
2022-01-26 14:17:25.304 | DEBUG    | __main__:trials:24 - Trial = 12408/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.306 | DEBUG    | __main__:trials:29 - Trial = 12408/30000 | Total reward = 63.52
2022-01-26 14:17:25.310 | DEBUG    | __main__:trials:24 - Trial = 12409/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.312 | DEBUG    | __main__:trials:29 - Trial = 12409/30000 | Total reward = 25.68
2022-01-26 14:17:25.316 | DEBUG    | __main__:trials:26 - Trial = 12410/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.318 | DEBUG    | __main__:trials:29 - Trial = 12410/30000 | Total reward = 22.56
2022-01-26 14:17:25.321 | DEBUG    | __main__:trials:24 - Trial = 12411/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.323 | DEBUG    | __main__:trials:29 - Trial = 12411/30000 | Total reward = 47.03
2022-01-26 14:17:25.327 | DEBUG    | __main__:trials:24 - Trial = 12412/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.328 | DEBUG    | __main__:trials:29 - Trial = 12412/30000 | Total reward = 58.65
2022-01-26 14:17:25.332 | DEBUG    | __main__:trials:24 - Trial = 12413/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.334 | DEBUG    | __main__:trials:29 - Trial = 12413/30000 | Total reward = 39.20
2022-01-26 14:17:25.337 | DEBUG    | __main__:trials:24 - Trial = 12414/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.339 | DEBUG    | __main__:trials:29 - Trial = 12414/30000 | Total reward = 61.94
2022-01-26 14:17:25.343 | DEBUG    | __main__:trials:24 - Trial = 12415/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.344 | DEBUG    | __main__:trials:29 - Trial = 12415/30000 | Total reward = 42.62
2022-01-26 14:17:25.348 | DEBUG    | __main__:trials:24 - Trial = 12416/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.350 | DEBUG    | __main__:trials:29 - Trial = 12416/30000 | Total reward = 44.27
2022-01-26 14:17:25.353 | DEBUG    | __main__:trials:24 - Trial = 12417/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.354 | DEBUG    | __main__:trials:29 - Trial = 12417/30000 | Total reward = 34.22
2022-01-26 14:17:25.359 | DEBUG    | __main__:trials:24 - Trial = 12418/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.361 | DEBUG    | __main__:trials:29 - Trial = 12418/30000 | Total reward = 34.50
2022-01-26 14:17:25.364 | DEBUG    | __main__:trials:24 - Trial = 12419/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.366 | DEBUG    | __main__:trials:29 - Trial = 12419/30000 | Total reward = 37.51
2022-01-26 14:17:25.368 | DEBUG    | __main__:trials:26 - Trial = 12420/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.370 | DEBUG    | __main__:trials:29 - Trial = 12420/30000 | Total reward = 15.93
2022-01-26 14:17:25.372 | DEBUG    | __main__:trials:26 - Trial = 12421/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.373 | DEBUG    | __main__:trials:29 - Trial = 12421/30000 | Total reward = 23.33
2022-01-26 14:17:25.376 | DEBUG    | __main__:trials:24 - Trial = 12422/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.377 | DEBUG    | __main__:trials:29 - Trial = 12422/30000 | Total reward = 46.80
2022-01-26 14:17:25.381 | DEBUG    | __main__:trials:24 - Trial = 12423/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.383 | DEBUG    | __main__:trials:29 - Trial = 12423/30000 | Total reward = 51.98
2022-01-26 14:17:25.386 | DEBUG    | __main__:trials:24 - Trial = 12424/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.388 | DEBUG    | __main__:trials:29 - Trial = 12424/30000 | Total reward = 41.93
2022-01-26 14:17:25.392 | DEBUG    | __main__:trials:24 - Trial = 12425/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.393 | DEBUG    | __main__:trials:29 - Trial = 12425/30000 | Total reward = 46.95
2022-01-26 14:17:25.397 | DEBUG    | __main__:trials:24 - Trial = 12426/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.398 | DEBUG    | __main__:trials:29 - Trial = 12426/30000 | Total reward = 46.66
2022-01-26 14:17:25.402 | DEBUG    | __main__:trials:24 - Trial = 12427/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.404 | DEBUG    | __main__:trials:29 - Trial = 12427/30000 | Total reward = 51.03
2022-01-26 14:17:25.407 | DEBUG    | __main__:trials:24 - Trial = 12428/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.409 | DEBUG    | __main__:trials:29 - Trial = 12428/30000 | Total reward = 40.33
2022-01-26 14:17:25.413 | DEBUG    | __main__:trials:24 - Trial = 12429/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.413 | DEBUG    | __main__:trials:29 - Trial = 12429/30000 | Total reward = 39.93
2022-01-26 14:17:25.417 | DEBUG    | __main__:trials:24 - Trial = 12430/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.417 | DEBUG    | __main__:trials:29 - Trial = 12430/30000 | Total reward = 39.85
2022-01-26 14:17:25.422 | DEBUG    | __main__:trials:24 - Trial = 12431/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.423 | DEBUG    | __main__:trials:29 - Trial = 12431/30000 | Total reward = 39.22
2022-01-26 14:17:25.427 | DEBUG    | __main__:trials:24 - Trial = 12432/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.428 | DEBUG    | __main__:trials:29 - Trial = 12432/30000 | Total reward = 42.76
2022-01-26 14:17:25.432 | DEBUG    | __main__:trials:24 - Trial = 12433/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.433 | DEBUG    | __main__:trials:29 - Trial = 12433/30000 | Total reward = 47.21
2022-01-26 14:17:25.437 | DEBUG    | __main__:trials:24 - Trial = 12434/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.438 | DEBUG    | __main__:trials:29 - Trial = 12434/30000 | Total reward = 33.32
2022-01-26 14:17:25.442 | DEBUG    | __main__:trials:24 - Trial = 12435/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.444 | DEBUG    | __main__:trials:29 - Trial = 12435/30000 | Total reward = 43.01
2022-01-26 14:17:25.446 | DEBUG    | __main__:trials:24 - Trial = 12436/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.448 | DEBUG    | __main__:trials:29 - Trial = 12436/30000 | Total reward = 54.62
2022-01-26 14:17:25.452 | DEBUG    | __main__:trials:24 - Trial = 12437/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.454 | DEBUG    | __main__:trials:29 - Trial = 12437/30000 | Total reward = 42.62
2022-01-26 14:17:25.457 | DEBUG    | __main__:trials:24 - Trial = 12438/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.459 | DEBUG    | __main__:trials:29 - Trial = 12438/30000 | Total reward = 47.38
2022-01-26 14:17:25.462 | DEBUG    | __main__:trials:24 - Trial = 12439/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.464 | DEBUG    | __main__:trials:29 - Trial = 12439/30000 | Total reward = 46.05
2022-01-26 14:17:25.468 | DEBUG    | __main__:trials:24 - Trial = 12440/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.470 | DEBUG    | __main__:trials:29 - Trial = 12440/30000 | Total reward = 45.75
2022-01-26 14:17:25.474 | DEBUG    | __main__:trials:24 - Trial = 12441/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.475 | DEBUG    | __main__:trials:29 - Trial = 12441/30000 | Total reward = 35.89
2022-01-26 14:17:25.479 | DEBUG    | __main__:trials:24 - Trial = 12442/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.481 | DEBUG    | __main__:trials:29 - Trial = 12442/30000 | Total reward = 66.93
2022-01-26 14:17:25.482 | DEBUG    | __main__:trials:26 - Trial = 12443/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.484 | DEBUG    | __main__:trials:29 - Trial = 12443/30000 | Total reward = 11.17
2022-01-26 14:17:25.488 | DEBUG    | __main__:trials:24 - Trial = 12444/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.489 | DEBUG    | __main__:trials:29 - Trial = 12444/30000 | Total reward = 33.82
2022-01-26 14:17:25.493 | DEBUG    | __main__:trials:24 - Trial = 12445/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.495 | DEBUG    | __main__:trials:29 - Trial = 12445/30000 | Total reward = 47.93
2022-01-26 14:17:25.498 | DEBUG    | __main__:trials:24 - Trial = 12446/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.500 | DEBUG    | __main__:trials:29 - Trial = 12446/30000 | Total reward = 28.44
2022-01-26 14:17:25.504 | DEBUG    | __main__:trials:24 - Trial = 12447/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.504 | DEBUG    | __main__:trials:29 - Trial = 12447/30000 | Total reward = 47.60
2022-01-26 14:17:25.508 | DEBUG    | __main__:trials:26 - Trial = 12448/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.509 | DEBUG    | __main__:trials:29 - Trial = 12448/30000 | Total reward = 36.36
2022-01-26 14:17:25.513 | DEBUG    | __main__:trials:24 - Trial = 12449/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.514 | DEBUG    | __main__:trials:29 - Trial = 12449/30000 | Total reward = 59.56
2022-01-26 14:17:25.518 | DEBUG    | __main__:trials:24 - Trial = 12450/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.520 | DEBUG    | __main__:trials:29 - Trial = 12450/30000 | Total reward = 47.09
2022-01-26 14:17:25.523 | DEBUG    | __main__:trials:24 - Trial = 12451/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.525 | DEBUG    | __main__:trials:29 - Trial = 12451/30000 | Total reward = 43.01
2022-01-26 14:17:25.528 | DEBUG    | __main__:trials:24 - Trial = 12452/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.530 | DEBUG    | __main__:trials:29 - Trial = 12452/30000 | Total reward = 47.03
2022-01-26 14:17:25.533 | DEBUG    | __main__:trials:24 - Trial = 12453/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.535 | DEBUG    | __main__:trials:29 - Trial = 12453/30000 | Total reward = 33.35
2022-01-26 14:17:25.538 | DEBUG    | __main__:trials:24 - Trial = 12454/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.540 | DEBUG    | __main__:trials:29 - Trial = 12454/30000 | Total reward = 52.40
2022-01-26 14:17:25.543 | DEBUG    | __main__:trials:24 - Trial = 12455/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.545 | DEBUG    | __main__:trials:29 - Trial = 12455/30000 | Total reward = 55.28
2022-01-26 14:17:25.548 | DEBUG    | __main__:trials:24 - Trial = 12456/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.549 | DEBUG    | __main__:trials:29 - Trial = 12456/30000 | Total reward = 36.02
2022-01-26 14:17:25.552 | DEBUG    | __main__:trials:24 - Trial = 12457/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.554 | DEBUG    | __main__:trials:29 - Trial = 12457/30000 | Total reward = 45.45
2022-01-26 14:17:25.557 | DEBUG    | __main__:trials:24 - Trial = 12458/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.558 | DEBUG    | __main__:trials:29 - Trial = 12458/30000 | Total reward = 49.09
2022-01-26 14:17:25.561 | DEBUG    | __main__:trials:24 - Trial = 12459/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.562 | DEBUG    | __main__:trials:29 - Trial = 12459/30000 | Total reward = 35.19
2022-01-26 14:17:25.565 | DEBUG    | __main__:trials:24 - Trial = 12460/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.566 | DEBUG    | __main__:trials:29 - Trial = 12460/30000 | Total reward = 27.19
2022-01-26 14:17:25.569 | DEBUG    | __main__:trials:24 - Trial = 12461/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.570 | DEBUG    | __main__:trials:29 - Trial = 12461/30000 | Total reward = 39.77
2022-01-26 14:17:25.573 | DEBUG    | __main__:trials:24 - Trial = 12462/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.575 | DEBUG    | __main__:trials:29 - Trial = 12462/30000 | Total reward = 43.30
2022-01-26 14:17:25.578 | DEBUG    | __main__:trials:24 - Trial = 12463/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.580 | DEBUG    | __main__:trials:29 - Trial = 12463/30000 | Total reward = 50.51
2022-01-26 14:17:25.583 | DEBUG    | __main__:trials:24 - Trial = 12464/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.585 | DEBUG    | __main__:trials:29 - Trial = 12464/30000 | Total reward = 34.30
2022-01-26 14:17:25.588 | DEBUG    | __main__:trials:24 - Trial = 12465/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.590 | DEBUG    | __main__:trials:29 - Trial = 12465/30000 | Total reward = 32.70
2022-01-26 14:17:25.593 | DEBUG    | __main__:trials:26 - Trial = 12466/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.594 | DEBUG    | __main__:trials:29 - Trial = 12466/30000 | Total reward = 15.82
2022-01-26 14:17:25.598 | DEBUG    | __main__:trials:24 - Trial = 12467/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.600 | DEBUG    | __main__:trials:29 - Trial = 12467/30000 | Total reward = 40.38
2022-01-26 14:17:25.603 | DEBUG    | __main__:trials:24 - Trial = 12468/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.605 | DEBUG    | __main__:trials:29 - Trial = 12468/30000 | Total reward = 43.31
2022-01-26 14:17:25.608 | DEBUG    | __main__:trials:24 - Trial = 12469/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.610 | DEBUG    | __main__:trials:29 - Trial = 12469/30000 | Total reward = 34.94
2022-01-26 14:17:25.613 | DEBUG    | __main__:trials:24 - Trial = 12470/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.615 | DEBUG    | __main__:trials:29 - Trial = 12470/30000 | Total reward = 50.48
2022-01-26 14:17:25.618 | DEBUG    | __main__:trials:24 - Trial = 12471/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.619 | DEBUG    | __main__:trials:29 - Trial = 12471/30000 | Total reward = 59.93
2022-01-26 14:17:25.623 | DEBUG    | __main__:trials:26 - Trial = 12472/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.623 | DEBUG    | __main__:trials:29 - Trial = 12472/30000 | Total reward = 31.88
2022-01-26 14:17:25.627 | DEBUG    | __main__:trials:24 - Trial = 12473/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.629 | DEBUG    | __main__:trials:29 - Trial = 12473/30000 | Total reward = 58.33
2022-01-26 14:17:25.632 | DEBUG    | __main__:trials:24 - Trial = 12474/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.633 | DEBUG    | __main__:trials:29 - Trial = 12474/30000 | Total reward = 59.95
2022-01-26 14:17:25.636 | DEBUG    | __main__:trials:26 - Trial = 12475/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.638 | DEBUG    | __main__:trials:29 - Trial = 12475/30000 | Total reward = 23.22
2022-01-26 14:17:25.642 | DEBUG    | __main__:trials:24 - Trial = 12476/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.643 | DEBUG    | __main__:trials:29 - Trial = 12476/30000 | Total reward = 47.64
2022-01-26 14:17:25.646 | DEBUG    | __main__:trials:24 - Trial = 12477/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.648 | DEBUG    | __main__:trials:29 - Trial = 12477/30000 | Total reward = 49.05
2022-01-26 14:17:25.652 | DEBUG    | __main__:trials:24 - Trial = 12478/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.653 | DEBUG    | __main__:trials:29 - Trial = 12478/30000 | Total reward = 30.23
2022-01-26 14:17:25.656 | DEBUG    | __main__:trials:26 - Trial = 12479/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.658 | DEBUG    | __main__:trials:29 - Trial = 12479/30000 | Total reward = 20.88
2022-01-26 14:17:25.662 | DEBUG    | __main__:trials:24 - Trial = 12480/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.662 | DEBUG    | __main__:trials:29 - Trial = 12480/30000 | Total reward = 36.84
2022-01-26 14:17:25.666 | DEBUG    | __main__:trials:24 - Trial = 12481/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.668 | DEBUG    | __main__:trials:29 - Trial = 12481/30000 | Total reward = 48.66
2022-01-26 14:17:25.671 | DEBUG    | __main__:trials:24 - Trial = 12482/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.673 | DEBUG    | __main__:trials:29 - Trial = 12482/30000 | Total reward = 47.03
2022-01-26 14:17:25.675 | DEBUG    | __main__:trials:26 - Trial = 12483/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.677 | DEBUG    | __main__:trials:29 - Trial = 12483/30000 | Total reward = 18.35
2022-01-26 14:17:25.680 | DEBUG    | __main__:trials:24 - Trial = 12484/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.681 | DEBUG    | __main__:trials:29 - Trial = 12484/30000 | Total reward = 60.54
2022-01-26 14:17:25.685 | DEBUG    | __main__:trials:24 - Trial = 12485/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.687 | DEBUG    | __main__:trials:29 - Trial = 12485/30000 | Total reward = 34.27
2022-01-26 14:17:25.690 | DEBUG    | __main__:trials:26 - Trial = 12486/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.691 | DEBUG    | __main__:trials:29 - Trial = 12486/30000 | Total reward = 18.42
2022-01-26 14:17:25.694 | DEBUG    | __main__:trials:26 - Trial = 12487/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.696 | DEBUG    | __main__:trials:29 - Trial = 12487/30000 | Total reward = 23.64
2022-01-26 14:17:25.700 | DEBUG    | __main__:trials:24 - Trial = 12488/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.702 | DEBUG    | __main__:trials:29 - Trial = 12488/30000 | Total reward = 58.58
2022-01-26 14:17:25.705 | DEBUG    | __main__:trials:24 - Trial = 12489/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.706 | DEBUG    | __main__:trials:29 - Trial = 12489/30000 | Total reward = 47.52
2022-01-26 14:17:25.709 | DEBUG    | __main__:trials:24 - Trial = 12490/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.711 | DEBUG    | __main__:trials:29 - Trial = 12490/30000 | Total reward = 34.67
2022-01-26 14:17:25.713 | DEBUG    | __main__:trials:24 - Trial = 12491/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.715 | DEBUG    | __main__:trials:29 - Trial = 12491/30000 | Total reward = 39.42
2022-01-26 14:17:25.719 | DEBUG    | __main__:trials:24 - Trial = 12492/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.721 | DEBUG    | __main__:trials:29 - Trial = 12492/30000 | Total reward = 47.03
2022-01-26 14:17:25.724 | DEBUG    | __main__:trials:24 - Trial = 12493/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.726 | DEBUG    | __main__:trials:29 - Trial = 12493/30000 | Total reward = 48.42
2022-01-26 14:17:25.729 | DEBUG    | __main__:trials:24 - Trial = 12494/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.731 | DEBUG    | __main__:trials:29 - Trial = 12494/30000 | Total reward = 59.78
2022-01-26 14:17:25.735 | DEBUG    | __main__:trials:24 - Trial = 12495/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.737 | DEBUG    | __main__:trials:29 - Trial = 12495/30000 | Total reward = 45.42
2022-01-26 14:17:25.740 | DEBUG    | __main__:trials:24 - Trial = 12496/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.742 | DEBUG    | __main__:trials:29 - Trial = 12496/30000 | Total reward = 42.30
2022-01-26 14:17:25.746 | DEBUG    | __main__:trials:24 - Trial = 12497/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.747 | DEBUG    | __main__:trials:29 - Trial = 12497/30000 | Total reward = 41.28
2022-01-26 14:17:25.750 | DEBUG    | __main__:trials:24 - Trial = 12498/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.753 | DEBUG    | __main__:trials:29 - Trial = 12498/30000 | Total reward = 40.12
2022-01-26 14:17:25.757 | DEBUG    | __main__:trials:24 - Trial = 12499/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.758 | DEBUG    | __main__:trials:29 - Trial = 12499/30000 | Total reward = 35.50
2022-01-26 14:17:25.762 | DEBUG    | __main__:trials:24 - Trial = 12500/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.763 | DEBUG    | __main__:trials:29 - Trial = 12500/30000 | Total reward = 29.85
2022-01-26 14:17:25.766 | DEBUG    | __main__:trials:24 - Trial = 12501/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.768 | DEBUG    | __main__:trials:29 - Trial = 12501/30000 | Total reward = 43.63
2022-01-26 14:17:25.771 | DEBUG    | __main__:trials:26 - Trial = 12502/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.773 | DEBUG    | __main__:trials:29 - Trial = 12502/30000 | Total reward = 26.88
2022-01-26 14:17:25.777 | DEBUG    | __main__:trials:24 - Trial = 12503/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.779 | DEBUG    | __main__:trials:29 - Trial = 12503/30000 | Total reward = 48.87
2022-01-26 14:17:25.782 | DEBUG    | __main__:trials:24 - Trial = 12504/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.784 | DEBUG    | __main__:trials:29 - Trial = 12504/30000 | Total reward = 40.81
2022-01-26 14:17:25.787 | DEBUG    | __main__:trials:24 - Trial = 12505/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.789 | DEBUG    | __main__:trials:29 - Trial = 12505/30000 | Total reward = 41.96
2022-01-26 14:17:25.792 | DEBUG    | __main__:trials:24 - Trial = 12506/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.794 | DEBUG    | __main__:trials:29 - Trial = 12506/30000 | Total reward = 41.44
2022-01-26 14:17:25.797 | DEBUG    | __main__:trials:24 - Trial = 12507/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.798 | DEBUG    | __main__:trials:29 - Trial = 12507/30000 | Total reward = 47.92
2022-01-26 14:17:25.801 | DEBUG    | __main__:trials:24 - Trial = 12508/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.803 | DEBUG    | __main__:trials:29 - Trial = 12508/30000 | Total reward = 47.03
2022-01-26 14:17:25.806 | DEBUG    | __main__:trials:24 - Trial = 12509/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.807 | DEBUG    | __main__:trials:29 - Trial = 12509/30000 | Total reward = 41.79
2022-01-26 14:17:25.811 | DEBUG    | __main__:trials:24 - Trial = 12510/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.813 | DEBUG    | __main__:trials:29 - Trial = 12510/30000 | Total reward = 34.65
2022-01-26 14:17:25.817 | DEBUG    | __main__:trials:24 - Trial = 12511/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.818 | DEBUG    | __main__:trials:29 - Trial = 12511/30000 | Total reward = 41.02
2022-01-26 14:17:25.822 | DEBUG    | __main__:trials:24 - Trial = 12512/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.823 | DEBUG    | __main__:trials:29 - Trial = 12512/30000 | Total reward = 36.14
2022-01-26 14:17:25.827 | DEBUG    | __main__:trials:24 - Trial = 12513/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.829 | DEBUG    | __main__:trials:29 - Trial = 12513/30000 | Total reward = 47.05
2022-01-26 14:17:25.832 | DEBUG    | __main__:trials:24 - Trial = 12514/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.833 | DEBUG    | __main__:trials:29 - Trial = 12514/30000 | Total reward = 47.94
2022-01-26 14:17:25.837 | DEBUG    | __main__:trials:24 - Trial = 12515/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.837 | DEBUG    | __main__:trials:29 - Trial = 12515/30000 | Total reward = 35.73
2022-01-26 14:17:25.842 | DEBUG    | __main__:trials:24 - Trial = 12516/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.843 | DEBUG    | __main__:trials:29 - Trial = 12516/30000 | Total reward = 40.30
2022-01-26 14:17:25.847 | DEBUG    | __main__:trials:24 - Trial = 12517/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.849 | DEBUG    | __main__:trials:29 - Trial = 12517/30000 | Total reward = 38.90
2022-01-26 14:17:25.851 | DEBUG    | __main__:trials:26 - Trial = 12518/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.852 | DEBUG    | __main__:trials:29 - Trial = 12518/30000 | Total reward = 23.19
2022-01-26 14:17:25.856 | DEBUG    | __main__:trials:24 - Trial = 12519/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.858 | DEBUG    | __main__:trials:29 - Trial = 12519/30000 | Total reward = 47.27
2022-01-26 14:17:25.861 | DEBUG    | __main__:trials:24 - Trial = 12520/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.863 | DEBUG    | __main__:trials:29 - Trial = 12520/30000 | Total reward = 42.78
2022-01-26 14:17:25.866 | DEBUG    | __main__:trials:24 - Trial = 12521/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.868 | DEBUG    | __main__:trials:29 - Trial = 12521/30000 | Total reward = 50.00
2022-01-26 14:17:25.871 | DEBUG    | __main__:trials:24 - Trial = 12522/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.873 | DEBUG    | __main__:trials:29 - Trial = 12522/30000 | Total reward = 57.09
2022-01-26 14:17:25.876 | DEBUG    | __main__:trials:24 - Trial = 12523/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.878 | DEBUG    | __main__:trials:29 - Trial = 12523/30000 | Total reward = 33.72
2022-01-26 14:17:25.882 | DEBUG    | __main__:trials:24 - Trial = 12524/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.884 | DEBUG    | __main__:trials:29 - Trial = 12524/30000 | Total reward = 38.12
2022-01-26 14:17:25.887 | DEBUG    | __main__:trials:24 - Trial = 12525/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.888 | DEBUG    | __main__:trials:29 - Trial = 12525/30000 | Total reward = 43.03
2022-01-26 14:17:25.892 | DEBUG    | __main__:trials:24 - Trial = 12526/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.894 | DEBUG    | __main__:trials:29 - Trial = 12526/30000 | Total reward = 52.43
2022-01-26 14:17:25.897 | DEBUG    | __main__:trials:24 - Trial = 12527/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.899 | DEBUG    | __main__:trials:29 - Trial = 12527/30000 | Total reward = 37.49
2022-01-26 14:17:25.903 | DEBUG    | __main__:trials:24 - Trial = 12528/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.904 | DEBUG    | __main__:trials:29 - Trial = 12528/30000 | Total reward = 44.99
2022-01-26 14:17:25.907 | DEBUG    | __main__:trials:24 - Trial = 12529/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.909 | DEBUG    | __main__:trials:29 - Trial = 12529/30000 | Total reward = 49.66
2022-01-26 14:17:25.913 | DEBUG    | __main__:trials:24 - Trial = 12530/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.915 | DEBUG    | __main__:trials:29 - Trial = 12530/30000 | Total reward = 48.18
2022-01-26 14:17:25.918 | DEBUG    | __main__:trials:24 - Trial = 12531/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.920 | DEBUG    | __main__:trials:29 - Trial = 12531/30000 | Total reward = 41.77
2022-01-26 14:17:25.923 | DEBUG    | __main__:trials:24 - Trial = 12532/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.925 | DEBUG    | __main__:trials:29 - Trial = 12532/30000 | Total reward = 34.59
2022-01-26 14:17:25.928 | DEBUG    | __main__:trials:24 - Trial = 12533/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.930 | DEBUG    | __main__:trials:29 - Trial = 12533/30000 | Total reward = 40.66
2022-01-26 14:17:25.934 | DEBUG    | __main__:trials:24 - Trial = 12534/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.935 | DEBUG    | __main__:trials:29 - Trial = 12534/30000 | Total reward = 46.02
2022-01-26 14:17:25.939 | DEBUG    | __main__:trials:24 - Trial = 12535/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.941 | DEBUG    | __main__:trials:29 - Trial = 12535/30000 | Total reward = 27.77
2022-01-26 14:17:25.943 | DEBUG    | __main__:trials:24 - Trial = 12536/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.946 | DEBUG    | __main__:trials:29 - Trial = 12536/30000 | Total reward = 20.88
2022-01-26 14:17:25.950 | DEBUG    | __main__:trials:24 - Trial = 12537/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.951 | DEBUG    | __main__:trials:29 - Trial = 12537/30000 | Total reward = 36.33
2022-01-26 14:17:25.955 | DEBUG    | __main__:trials:24 - Trial = 12538/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.956 | DEBUG    | __main__:trials:29 - Trial = 12538/30000 | Total reward = 37.65
2022-01-26 14:17:25.959 | DEBUG    | __main__:trials:24 - Trial = 12539/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.961 | DEBUG    | __main__:trials:29 - Trial = 12539/30000 | Total reward = 42.74
2022-01-26 14:17:25.965 | DEBUG    | __main__:trials:26 - Trial = 12540/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.967 | DEBUG    | __main__:trials:29 - Trial = 12540/30000 | Total reward = 34.14
2022-01-26 14:17:25.970 | DEBUG    | __main__:trials:26 - Trial = 12541/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:25.971 | DEBUG    | __main__:trials:29 - Trial = 12541/30000 | Total reward = 17.36
2022-01-26 14:17:25.975 | DEBUG    | __main__:trials:24 - Trial = 12542/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.976 | DEBUG    | __main__:trials:29 - Trial = 12542/30000 | Total reward = 44.61
2022-01-26 14:17:25.980 | DEBUG    | __main__:trials:24 - Trial = 12543/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.982 | DEBUG    | __main__:trials:29 - Trial = 12543/30000 | Total reward = 46.26
2022-01-26 14:17:25.985 | DEBUG    | __main__:trials:24 - Trial = 12544/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.986 | DEBUG    | __main__:trials:29 - Trial = 12544/30000 | Total reward = 47.87
2022-01-26 14:17:25.989 | DEBUG    | __main__:trials:24 - Trial = 12545/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.991 | DEBUG    | __main__:trials:29 - Trial = 12545/30000 | Total reward = 47.49
2022-01-26 14:17:25.995 | DEBUG    | __main__:trials:24 - Trial = 12546/30000 | Max number of steps (20) reached
2022-01-26 14:17:25.996 | DEBUG    | __main__:trials:29 - Trial = 12546/30000 | Total reward = 39.88
2022-01-26 14:17:26.000 | DEBUG    | __main__:trials:24 - Trial = 12547/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.002 | DEBUG    | __main__:trials:29 - Trial = 12547/30000 | Total reward = 30.25
2022-01-26 14:17:26.004 | DEBUG    | __main__:trials:24 - Trial = 12548/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.006 | DEBUG    | __main__:trials:29 - Trial = 12548/30000 | Total reward = 40.14
2022-01-26 14:17:26.010 | DEBUG    | __main__:trials:24 - Trial = 12549/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.012 | DEBUG    | __main__:trials:29 - Trial = 12549/30000 | Total reward = 44.83
2022-01-26 14:17:26.016 | DEBUG    | __main__:trials:24 - Trial = 12550/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.017 | DEBUG    | __main__:trials:29 - Trial = 12550/30000 | Total reward = 36.62
2022-01-26 14:17:26.020 | DEBUG    | __main__:trials:24 - Trial = 12551/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.022 | DEBUG    | __main__:trials:29 - Trial = 12551/30000 | Total reward = 33.92
2022-01-26 14:17:26.026 | DEBUG    | __main__:trials:24 - Trial = 12552/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.027 | DEBUG    | __main__:trials:29 - Trial = 12552/30000 | Total reward = 27.68
2022-01-26 14:17:26.031 | DEBUG    | __main__:trials:24 - Trial = 12553/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.032 | DEBUG    | __main__:trials:29 - Trial = 12553/30000 | Total reward = 48.35
2022-01-26 14:17:26.035 | DEBUG    | __main__:trials:26 - Trial = 12554/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:26.037 | DEBUG    | __main__:trials:29 - Trial = 12554/30000 | Total reward = 20.25
2022-01-26 14:17:26.040 | DEBUG    | __main__:trials:24 - Trial = 12555/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.042 | DEBUG    | __main__:trials:29 - Trial = 12555/30000 | Total reward = 30.43
2022-01-26 14:17:26.046 | DEBUG    | __main__:trials:24 - Trial = 12556/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.047 | DEBUG    | __main__:trials:29 - Trial = 12556/30000 | Total reward = 47.63
2022-01-26 14:17:26.051 | DEBUG    | __main__:trials:24 - Trial = 12557/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.053 | DEBUG    | __main__:trials:29 - Trial = 12557/30000 | Total reward = 47.03
2022-01-26 14:17:26.057 | DEBUG    | __main__:trials:24 - Trial = 12558/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.058 | DEBUG    | __main__:trials:29 - Trial = 12558/30000 | Total reward = 42.45
2022-01-26 14:17:26.062 | DEBUG    | __main__:trials:24 - Trial = 12559/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.064 | DEBUG    | __main__:trials:29 - Trial = 12559/30000 | Total reward = 40.72
2022-01-26 14:17:26.067 | DEBUG    | __main__:trials:24 - Trial = 12560/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.069 | DEBUG    | __main__:trials:29 - Trial = 12560/30000 | Total reward = 46.83
2022-01-26 14:17:26.072 | DEBUG    | __main__:trials:24 - Trial = 12561/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.074 | DEBUG    | __main__:trials:29 - Trial = 12561/30000 | Total reward = 28.07
2022-01-26 14:17:26.078 | DEBUG    | __main__:trials:24 - Trial = 12562/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.079 | DEBUG    | __main__:trials:29 - Trial = 12562/30000 | Total reward = 22.50
2022-01-26 14:17:26.083 | DEBUG    | __main__:trials:24 - Trial = 12563/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.085 | DEBUG    | __main__:trials:29 - Trial = 12563/30000 | Total reward = 35.03
2022-01-26 14:17:26.088 | DEBUG    | __main__:trials:24 - Trial = 12564/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.090 | DEBUG    | __main__:trials:29 - Trial = 12564/30000 | Total reward = 47.27
2022-01-26 14:17:26.093 | DEBUG    | __main__:trials:24 - Trial = 12565/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.095 | DEBUG    | __main__:trials:29 - Trial = 12565/30000 | Total reward = 45.52
2022-01-26 14:17:26.099 | DEBUG    | __main__:trials:24 - Trial = 12566/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.099 | DEBUG    | __main__:trials:29 - Trial = 12566/30000 | Total reward = 32.05
2022-01-26 14:17:26.103 | DEBUG    | __main__:trials:24 - Trial = 12567/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.105 | DEBUG    | __main__:trials:29 - Trial = 12567/30000 | Total reward = 44.33
2022-01-26 14:17:26.108 | DEBUG    | __main__:trials:24 - Trial = 12568/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.109 | DEBUG    | __main__:trials:29 - Trial = 12568/30000 | Total reward = 57.25
2022-01-26 14:17:26.113 | DEBUG    | __main__:trials:24 - Trial = 12569/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.115 | DEBUG    | __main__:trials:29 - Trial = 12569/30000 | Total reward = 33.04
2022-01-26 14:17:26.118 | DEBUG    | __main__:trials:24 - Trial = 12570/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.120 | DEBUG    | __main__:trials:29 - Trial = 12570/30000 | Total reward = 43.42
2022-01-26 14:17:26.123 | DEBUG    | __main__:trials:24 - Trial = 12571/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.125 | DEBUG    | __main__:trials:29 - Trial = 12571/30000 | Total reward = 48.06
2022-01-26 14:17:26.128 | DEBUG    | __main__:trials:24 - Trial = 12572/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.129 | DEBUG    | __main__:trials:29 - Trial = 12572/30000 | Total reward = 61.24
2022-01-26 14:17:26.132 | DEBUG    | __main__:trials:24 - Trial = 12573/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.133 | DEBUG    | __main__:trials:29 - Trial = 12573/30000 | Total reward = 53.55
2022-01-26 14:17:26.136 | DEBUG    | __main__:trials:24 - Trial = 12574/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.137 | DEBUG    | __main__:trials:29 - Trial = 12574/30000 | Total reward = 49.59
2022-01-26 14:17:26.140 | DEBUG    | __main__:trials:24 - Trial = 12575/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.142 | DEBUG    | __main__:trials:29 - Trial = 12575/30000 | Total reward = 52.44
2022-01-26 14:17:26.146 | DEBUG    | __main__:trials:24 - Trial = 12576/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.147 | DEBUG    | __main__:trials:29 - Trial = 12576/30000 | Total reward = 43.35
2022-01-26 14:17:26.151 | DEBUG    | __main__:trials:24 - Trial = 12577/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.152 | DEBUG    | __main__:trials:29 - Trial = 12577/30000 | Total reward = 31.35
2022-01-26 14:17:26.156 | DEBUG    | __main__:trials:24 - Trial = 12578/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.158 | DEBUG    | __main__:trials:29 - Trial = 12578/30000 | Total reward = 44.57
2022-01-26 14:17:26.161 | DEBUG    | __main__:trials:24 - Trial = 12579/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.163 | DEBUG    | __main__:trials:29 - Trial = 12579/30000 | Total reward = 53.45
2022-01-26 14:17:26.168 | DEBUG    | __main__:trials:24 - Trial = 12580/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.170 | DEBUG    | __main__:trials:29 - Trial = 12580/30000 | Total reward = 52.34
2022-01-26 14:17:26.173 | DEBUG    | __main__:trials:24 - Trial = 12581/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.175 | DEBUG    | __main__:trials:29 - Trial = 12581/30000 | Total reward = 50.08
2022-01-26 14:17:26.179 | DEBUG    | __main__:trials:24 - Trial = 12582/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.180 | DEBUG    | __main__:trials:29 - Trial = 12582/30000 | Total reward = 51.39
2022-01-26 14:17:26.184 | DEBUG    | __main__:trials:24 - Trial = 12583/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.185 | DEBUG    | __main__:trials:29 - Trial = 12583/30000 | Total reward = 52.85
2022-01-26 14:17:26.189 | DEBUG    | __main__:trials:24 - Trial = 12584/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.190 | DEBUG    | __main__:trials:29 - Trial = 12584/30000 | Total reward = 47.00
2022-01-26 14:17:26.193 | DEBUG    | __main__:trials:24 - Trial = 12585/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.195 | DEBUG    | __main__:trials:29 - Trial = 12585/30000 | Total reward = 65.18
2022-01-26 14:17:26.199 | DEBUG    | __main__:trials:24 - Trial = 12586/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.200 | DEBUG    | __main__:trials:29 - Trial = 12586/30000 | Total reward = 47.99
2022-01-26 14:17:26.203 | DEBUG    | __main__:trials:24 - Trial = 12587/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.204 | DEBUG    | __main__:trials:29 - Trial = 12587/30000 | Total reward = 37.03
2022-01-26 14:17:26.208 | DEBUG    | __main__:trials:24 - Trial = 12588/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.210 | DEBUG    | __main__:trials:29 - Trial = 12588/30000 | Total reward = 49.88
2022-01-26 14:17:26.214 | DEBUG    | __main__:trials:24 - Trial = 12589/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.215 | DEBUG    | __main__:trials:29 - Trial = 12589/30000 | Total reward = 43.78
2022-01-26 14:17:26.219 | DEBUG    | __main__:trials:24 - Trial = 12590/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.221 | DEBUG    | __main__:trials:29 - Trial = 12590/30000 | Total reward = 51.53
2022-01-26 14:17:26.225 | DEBUG    | __main__:trials:24 - Trial = 12591/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.226 | DEBUG    | __main__:trials:29 - Trial = 12591/30000 | Total reward = 52.57
2022-01-26 14:17:26.230 | DEBUG    | __main__:trials:24 - Trial = 12592/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.232 | DEBUG    | __main__:trials:29 - Trial = 12592/30000 | Total reward = 59.50
2022-01-26 14:17:26.235 | DEBUG    | __main__:trials:24 - Trial = 12593/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.237 | DEBUG    | __main__:trials:29 - Trial = 12593/30000 | Total reward = 41.87
2022-01-26 14:17:26.240 | DEBUG    | __main__:trials:24 - Trial = 12594/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.242 | DEBUG    | __main__:trials:29 - Trial = 12594/30000 | Total reward = 41.56
2022-01-26 14:17:26.246 | DEBUG    | __main__:trials:24 - Trial = 12595/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.246 | DEBUG    | __main__:trials:29 - Trial = 12595/30000 | Total reward = 53.82
2022-01-26 14:17:26.251 | DEBUG    | __main__:trials:24 - Trial = 12596/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.251 | DEBUG    | __main__:trials:29 - Trial = 12596/30000 | Total reward = 52.71
2022-01-26 14:17:26.255 | DEBUG    | __main__:trials:24 - Trial = 12597/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.256 | DEBUG    | __main__:trials:29 - Trial = 12597/30000 | Total reward = 64.74
2022-01-26 14:17:26.260 | DEBUG    | __main__:trials:24 - Trial = 12598/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.262 | DEBUG    | __main__:trials:29 - Trial = 12598/30000 | Total reward = 52.62
2022-01-26 14:17:26.265 | DEBUG    | __main__:trials:24 - Trial = 12599/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.267 | DEBUG    | __main__:trials:29 - Trial = 12599/30000 | Total reward = 35.37
2022-01-26 14:17:26.271 | DEBUG    | __main__:trials:24 - Trial = 12600/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.273 | DEBUG    | __main__:trials:29 - Trial = 12600/30000 | Total reward = 36.65
2022-01-26 14:17:26.276 | DEBUG    | __main__:trials:24 - Trial = 12601/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.278 | DEBUG    | __main__:trials:29 - Trial = 12601/30000 | Total reward = 49.47
2022-01-26 14:17:26.282 | DEBUG    | __main__:trials:24 - Trial = 12602/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.284 | DEBUG    | __main__:trials:29 - Trial = 12602/30000 | Total reward = 49.09
2022-01-26 14:17:26.287 | DEBUG    | __main__:trials:24 - Trial = 12603/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.289 | DEBUG    | __main__:trials:29 - Trial = 12603/30000 | Total reward = 49.88
2022-01-26 14:17:26.292 | DEBUG    | __main__:trials:24 - Trial = 12604/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.294 | DEBUG    | __main__:trials:29 - Trial = 12604/30000 | Total reward = 59.51
2022-01-26 14:17:26.298 | DEBUG    | __main__:trials:24 - Trial = 12605/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.299 | DEBUG    | __main__:trials:29 - Trial = 12605/30000 | Total reward = 48.51
2022-01-26 14:17:26.303 | DEBUG    | __main__:trials:24 - Trial = 12606/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.305 | DEBUG    | __main__:trials:29 - Trial = 12606/30000 | Total reward = 62.49
2022-01-26 14:17:26.308 | DEBUG    | __main__:trials:24 - Trial = 12607/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.310 | DEBUG    | __main__:trials:29 - Trial = 12607/30000 | Total reward = 59.87
2022-01-26 14:17:26.314 | DEBUG    | __main__:trials:24 - Trial = 12608/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.315 | DEBUG    | __main__:trials:29 - Trial = 12608/30000 | Total reward = 43.90
2022-01-26 14:17:26.319 | DEBUG    | __main__:trials:24 - Trial = 12609/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.320 | DEBUG    | __main__:trials:29 - Trial = 12609/30000 | Total reward = 37.90
2022-01-26 14:17:26.324 | DEBUG    | __main__:trials:24 - Trial = 12610/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.326 | DEBUG    | __main__:trials:29 - Trial = 12610/30000 | Total reward = 45.95
2022-01-26 14:17:26.328 | DEBUG    | __main__:trials:24 - Trial = 12611/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.330 | DEBUG    | __main__:trials:29 - Trial = 12611/30000 | Total reward = 35.44
2022-01-26 14:17:26.334 | DEBUG    | __main__:trials:24 - Trial = 12612/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.336 | DEBUG    | __main__:trials:29 - Trial = 12612/30000 | Total reward = 45.15
2022-01-26 14:17:26.340 | DEBUG    | __main__:trials:24 - Trial = 12613/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.341 | DEBUG    | __main__:trials:29 - Trial = 12613/30000 | Total reward = 45.24
2022-01-26 14:17:26.344 | DEBUG    | __main__:trials:24 - Trial = 12614/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.346 | DEBUG    | __main__:trials:29 - Trial = 12614/30000 | Total reward = 49.00
2022-01-26 14:17:26.350 | DEBUG    | __main__:trials:24 - Trial = 12615/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.352 | DEBUG    | __main__:trials:29 - Trial = 12615/30000 | Total reward = 62.54
2022-01-26 14:17:26.355 | DEBUG    | __main__:trials:24 - Trial = 12616/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.357 | DEBUG    | __main__:trials:29 - Trial = 12616/30000 | Total reward = 40.47
2022-01-26 14:17:26.361 | DEBUG    | __main__:trials:24 - Trial = 12617/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.362 | DEBUG    | __main__:trials:29 - Trial = 12617/30000 | Total reward = 45.76
2022-01-26 14:17:26.366 | DEBUG    | __main__:trials:24 - Trial = 12618/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.367 | DEBUG    | __main__:trials:29 - Trial = 12618/30000 | Total reward = 49.48
2022-01-26 14:17:26.371 | DEBUG    | __main__:trials:24 - Trial = 12619/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.373 | DEBUG    | __main__:trials:29 - Trial = 12619/30000 | Total reward = 37.64
2022-01-26 14:17:26.376 | DEBUG    | __main__:trials:24 - Trial = 12620/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.378 | DEBUG    | __main__:trials:29 - Trial = 12620/30000 | Total reward = 40.74
2022-01-26 14:17:26.382 | DEBUG    | __main__:trials:24 - Trial = 12621/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.383 | DEBUG    | __main__:trials:29 - Trial = 12621/30000 | Total reward = 41.05
2022-01-26 14:17:26.386 | DEBUG    | __main__:trials:24 - Trial = 12622/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.388 | DEBUG    | __main__:trials:29 - Trial = 12622/30000 | Total reward = 30.55
2022-01-26 14:17:26.392 | DEBUG    | __main__:trials:24 - Trial = 12623/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.394 | DEBUG    | __main__:trials:29 - Trial = 12623/30000 | Total reward = 36.45
2022-01-26 14:17:26.397 | DEBUG    | __main__:trials:24 - Trial = 12624/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.399 | DEBUG    | __main__:trials:29 - Trial = 12624/30000 | Total reward = 46.31
2022-01-26 14:17:26.403 | DEBUG    | __main__:trials:24 - Trial = 12625/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.403 | DEBUG    | __main__:trials:29 - Trial = 12625/30000 | Total reward = 45.64
2022-01-26 14:17:26.408 | DEBUG    | __main__:trials:24 - Trial = 12626/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.409 | DEBUG    | __main__:trials:29 - Trial = 12626/30000 | Total reward = 39.54
2022-01-26 14:17:26.412 | DEBUG    | __main__:trials:24 - Trial = 12627/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.414 | DEBUG    | __main__:trials:29 - Trial = 12627/30000 | Total reward = 34.70
2022-01-26 14:17:26.418 | DEBUG    | __main__:trials:24 - Trial = 12628/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.419 | DEBUG    | __main__:trials:29 - Trial = 12628/30000 | Total reward = 34.92
2022-01-26 14:17:26.423 | DEBUG    | __main__:trials:24 - Trial = 12629/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.425 | DEBUG    | __main__:trials:29 - Trial = 12629/30000 | Total reward = 35.20
2022-01-26 14:17:26.428 | DEBUG    | __main__:trials:24 - Trial = 12630/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.430 | DEBUG    | __main__:trials:29 - Trial = 12630/30000 | Total reward = 56.11
2022-01-26 14:17:26.433 | DEBUG    | __main__:trials:24 - Trial = 12631/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.435 | DEBUG    | __main__:trials:29 - Trial = 12631/30000 | Total reward = 51.89
2022-01-26 14:17:26.439 | DEBUG    | __main__:trials:24 - Trial = 12632/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.439 | DEBUG    | __main__:trials:29 - Trial = 12632/30000 | Total reward = 47.16
2022-01-26 14:17:26.443 | DEBUG    | __main__:trials:24 - Trial = 12633/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.444 | DEBUG    | __main__:trials:29 - Trial = 12633/30000 | Total reward = 33.61
2022-01-26 14:17:26.448 | DEBUG    | __main__:trials:24 - Trial = 12634/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.450 | DEBUG    | __main__:trials:29 - Trial = 12634/30000 | Total reward = 62.17
2022-01-26 14:17:26.453 | DEBUG    | __main__:trials:24 - Trial = 12635/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.455 | DEBUG    | __main__:trials:29 - Trial = 12635/30000 | Total reward = 47.62
2022-01-26 14:17:26.459 | DEBUG    | __main__:trials:24 - Trial = 12636/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.460 | DEBUG    | __main__:trials:29 - Trial = 12636/30000 | Total reward = 51.52
2022-01-26 14:17:26.463 | DEBUG    | __main__:trials:24 - Trial = 12637/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.465 | DEBUG    | __main__:trials:29 - Trial = 12637/30000 | Total reward = 57.90
2022-01-26 14:17:26.469 | DEBUG    | __main__:trials:24 - Trial = 12638/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.470 | DEBUG    | __main__:trials:29 - Trial = 12638/30000 | Total reward = 57.25
2022-01-26 14:17:26.474 | DEBUG    | __main__:trials:24 - Trial = 12639/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.476 | DEBUG    | __main__:trials:29 - Trial = 12639/30000 | Total reward = 47.70
2022-01-26 14:17:26.480 | DEBUG    | __main__:trials:24 - Trial = 12640/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.481 | DEBUG    | __main__:trials:29 - Trial = 12640/30000 | Total reward = 43.73
2022-01-26 14:17:26.484 | DEBUG    | __main__:trials:24 - Trial = 12641/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.485 | DEBUG    | __main__:trials:29 - Trial = 12641/30000 | Total reward = 52.73
2022-01-26 14:17:26.489 | DEBUG    | __main__:trials:24 - Trial = 12642/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.490 | DEBUG    | __main__:trials:29 - Trial = 12642/30000 | Total reward = 39.81
2022-01-26 14:17:26.494 | DEBUG    | __main__:trials:24 - Trial = 12643/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.496 | DEBUG    | __main__:trials:29 - Trial = 12643/30000 | Total reward = 44.88
2022-01-26 14:17:26.499 | DEBUG    | __main__:trials:24 - Trial = 12644/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.501 | DEBUG    | __main__:trials:29 - Trial = 12644/30000 | Total reward = 33.07
2022-01-26 14:17:26.503 | DEBUG    | __main__:trials:24 - Trial = 12645/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.505 | DEBUG    | __main__:trials:29 - Trial = 12645/30000 | Total reward = 37.57
2022-01-26 14:17:26.508 | DEBUG    | __main__:trials:24 - Trial = 12646/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.510 | DEBUG    | __main__:trials:29 - Trial = 12646/30000 | Total reward = 27.51
2022-01-26 14:17:26.514 | DEBUG    | __main__:trials:24 - Trial = 12647/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.515 | DEBUG    | __main__:trials:29 - Trial = 12647/30000 | Total reward = 54.85
2022-01-26 14:17:26.518 | DEBUG    | __main__:trials:24 - Trial = 12648/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.519 | DEBUG    | __main__:trials:29 - Trial = 12648/30000 | Total reward = 32.41
2022-01-26 14:17:26.523 | DEBUG    | __main__:trials:24 - Trial = 12649/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.524 | DEBUG    | __main__:trials:29 - Trial = 12649/30000 | Total reward = 39.31
2022-01-26 14:17:26.527 | DEBUG    | __main__:trials:24 - Trial = 12650/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.529 | DEBUG    | __main__:trials:29 - Trial = 12650/30000 | Total reward = 42.55
2022-01-26 14:17:26.532 | DEBUG    | __main__:trials:24 - Trial = 12651/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.534 | DEBUG    | __main__:trials:29 - Trial = 12651/30000 | Total reward = 45.38
2022-01-26 14:17:26.537 | DEBUG    | __main__:trials:24 - Trial = 12652/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.539 | DEBUG    | __main__:trials:29 - Trial = 12652/30000 | Total reward = 44.35
2022-01-26 14:17:26.542 | DEBUG    | __main__:trials:24 - Trial = 12653/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.542 | DEBUG    | __main__:trials:29 - Trial = 12653/30000 | Total reward = 48.07
2022-01-26 14:17:26.547 | DEBUG    | __main__:trials:24 - Trial = 12654/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.548 | DEBUG    | __main__:trials:29 - Trial = 12654/30000 | Total reward = 52.59
2022-01-26 14:17:26.551 | DEBUG    | __main__:trials:24 - Trial = 12655/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.553 | DEBUG    | __main__:trials:29 - Trial = 12655/30000 | Total reward = 43.31
2022-01-26 14:17:26.556 | DEBUG    | __main__:trials:24 - Trial = 12656/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.557 | DEBUG    | __main__:trials:29 - Trial = 12656/30000 | Total reward = 44.78
2022-01-26 14:17:26.560 | DEBUG    | __main__:trials:26 - Trial = 12657/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:26.560 | DEBUG    | __main__:trials:29 - Trial = 12657/30000 | Total reward = 18.12
2022-01-26 14:17:26.564 | DEBUG    | __main__:trials:24 - Trial = 12658/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.565 | DEBUG    | __main__:trials:29 - Trial = 12658/30000 | Total reward = 54.93
2022-01-26 14:17:26.568 | DEBUG    | __main__:trials:24 - Trial = 12659/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.570 | DEBUG    | __main__:trials:29 - Trial = 12659/30000 | Total reward = 40.82
2022-01-26 14:17:26.573 | DEBUG    | __main__:trials:24 - Trial = 12660/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.574 | DEBUG    | __main__:trials:29 - Trial = 12660/30000 | Total reward = 51.79
2022-01-26 14:17:26.578 | DEBUG    | __main__:trials:24 - Trial = 12661/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.580 | DEBUG    | __main__:trials:29 - Trial = 12661/30000 | Total reward = 50.94
2022-01-26 14:17:26.582 | DEBUG    | __main__:trials:24 - Trial = 12662/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.584 | DEBUG    | __main__:trials:29 - Trial = 12662/30000 | Total reward = 46.05
2022-01-26 14:17:26.587 | DEBUG    | __main__:trials:24 - Trial = 12663/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.588 | DEBUG    | __main__:trials:29 - Trial = 12663/30000 | Total reward = 47.38
2022-01-26 14:17:26.592 | DEBUG    | __main__:trials:24 - Trial = 12664/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.593 | DEBUG    | __main__:trials:29 - Trial = 12664/30000 | Total reward = 40.34
2022-01-26 14:17:26.596 | DEBUG    | __main__:trials:24 - Trial = 12665/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.598 | DEBUG    | __main__:trials:29 - Trial = 12665/30000 | Total reward = 41.09
2022-01-26 14:17:26.602 | DEBUG    | __main__:trials:24 - Trial = 12666/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.602 | DEBUG    | __main__:trials:29 - Trial = 12666/30000 | Total reward = 47.51
2022-01-26 14:17:26.606 | DEBUG    | __main__:trials:24 - Trial = 12667/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.607 | DEBUG    | __main__:trials:29 - Trial = 12667/30000 | Total reward = 57.89
2022-01-26 14:17:26.610 | DEBUG    | __main__:trials:24 - Trial = 12668/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.611 | DEBUG    | __main__:trials:29 - Trial = 12668/30000 | Total reward = 57.75
2022-01-26 14:17:26.614 | DEBUG    | __main__:trials:24 - Trial = 12669/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.615 | DEBUG    | __main__:trials:29 - Trial = 12669/30000 | Total reward = 47.03
2022-01-26 14:17:26.619 | DEBUG    | __main__:trials:24 - Trial = 12670/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.620 | DEBUG    | __main__:trials:29 - Trial = 12670/30000 | Total reward = 41.76
2022-01-26 14:17:26.623 | DEBUG    | __main__:trials:24 - Trial = 12671/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.625 | DEBUG    | __main__:trials:29 - Trial = 12671/30000 | Total reward = 37.21
2022-01-26 14:17:26.628 | DEBUG    | __main__:trials:24 - Trial = 12672/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.629 | DEBUG    | __main__:trials:29 - Trial = 12672/30000 | Total reward = 47.80
2022-01-26 14:17:26.633 | DEBUG    | __main__:trials:24 - Trial = 12673/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.633 | DEBUG    | __main__:trials:29 - Trial = 12673/30000 | Total reward = 47.72
2022-01-26 14:17:26.638 | DEBUG    | __main__:trials:24 - Trial = 12674/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.638 | DEBUG    | __main__:trials:29 - Trial = 12674/30000 | Total reward = 43.60
2022-01-26 14:17:26.642 | DEBUG    | __main__:trials:24 - Trial = 12675/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.643 | DEBUG    | __main__:trials:29 - Trial = 12675/30000 | Total reward = 42.25
2022-01-26 14:17:26.647 | DEBUG    | __main__:trials:24 - Trial = 12676/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.648 | DEBUG    | __main__:trials:29 - Trial = 12676/30000 | Total reward = 60.55
2022-01-26 14:17:26.651 | DEBUG    | __main__:trials:24 - Trial = 12677/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.653 | DEBUG    | __main__:trials:29 - Trial = 12677/30000 | Total reward = 56.02
2022-01-26 14:17:26.656 | DEBUG    | __main__:trials:24 - Trial = 12678/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.657 | DEBUG    | __main__:trials:29 - Trial = 12678/30000 | Total reward = 45.44
2022-01-26 14:17:26.661 | DEBUG    | __main__:trials:24 - Trial = 12679/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.662 | DEBUG    | __main__:trials:29 - Trial = 12679/30000 | Total reward = 52.48
2022-01-26 14:17:26.666 | DEBUG    | __main__:trials:24 - Trial = 12680/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.666 | DEBUG    | __main__:trials:29 - Trial = 12680/30000 | Total reward = 33.48
2022-01-26 14:17:26.671 | DEBUG    | __main__:trials:24 - Trial = 12681/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.671 | DEBUG    | __main__:trials:29 - Trial = 12681/30000 | Total reward = 52.87
2022-01-26 14:17:26.675 | DEBUG    | __main__:trials:24 - Trial = 12682/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.677 | DEBUG    | __main__:trials:29 - Trial = 12682/30000 | Total reward = 51.55
2022-01-26 14:17:26.680 | DEBUG    | __main__:trials:24 - Trial = 12683/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.681 | DEBUG    | __main__:trials:29 - Trial = 12683/30000 | Total reward = 46.37
2022-01-26 14:17:26.684 | DEBUG    | __main__:trials:24 - Trial = 12684/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.686 | DEBUG    | __main__:trials:29 - Trial = 12684/30000 | Total reward = 51.50
2022-01-26 14:17:26.689 | DEBUG    | __main__:trials:24 - Trial = 12685/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.689 | DEBUG    | __main__:trials:29 - Trial = 12685/30000 | Total reward = 23.82
2022-01-26 14:17:26.693 | DEBUG    | __main__:trials:24 - Trial = 12686/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.695 | DEBUG    | __main__:trials:29 - Trial = 12686/30000 | Total reward = 54.80
2022-01-26 14:17:26.699 | DEBUG    | __main__:trials:24 - Trial = 12687/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.700 | DEBUG    | __main__:trials:29 - Trial = 12687/30000 | Total reward = 39.97
2022-01-26 14:17:26.703 | DEBUG    | __main__:trials:24 - Trial = 12688/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.705 | DEBUG    | __main__:trials:29 - Trial = 12688/30000 | Total reward = 44.22
2022-01-26 14:17:26.708 | DEBUG    | __main__:trials:24 - Trial = 12689/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.710 | DEBUG    | __main__:trials:29 - Trial = 12689/30000 | Total reward = 52.68
2022-01-26 14:17:26.714 | DEBUG    | __main__:trials:24 - Trial = 12690/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.715 | DEBUG    | __main__:trials:29 - Trial = 12690/30000 | Total reward = 50.18
2022-01-26 14:17:26.718 | DEBUG    | __main__:trials:24 - Trial = 12691/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.720 | DEBUG    | __main__:trials:29 - Trial = 12691/30000 | Total reward = 50.75
2022-01-26 14:17:26.723 | DEBUG    | __main__:trials:24 - Trial = 12692/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.725 | DEBUG    | __main__:trials:29 - Trial = 12692/30000 | Total reward = 62.65
2022-01-26 14:17:26.728 | DEBUG    | __main__:trials:24 - Trial = 12693/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.730 | DEBUG    | __main__:trials:29 - Trial = 12693/30000 | Total reward = 41.96
2022-01-26 14:17:26.734 | DEBUG    | __main__:trials:24 - Trial = 12694/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.734 | DEBUG    | __main__:trials:29 - Trial = 12694/30000 | Total reward = 51.76
2022-01-26 14:17:26.739 | DEBUG    | __main__:trials:24 - Trial = 12695/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.740 | DEBUG    | __main__:trials:29 - Trial = 12695/30000 | Total reward = 46.18
2022-01-26 14:17:26.744 | DEBUG    | __main__:trials:24 - Trial = 12696/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.746 | DEBUG    | __main__:trials:29 - Trial = 12696/30000 | Total reward = 51.19
2022-01-26 14:17:26.749 | DEBUG    | __main__:trials:24 - Trial = 12697/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.752 | DEBUG    | __main__:trials:29 - Trial = 12697/30000 | Total reward = 46.34
2022-01-26 14:17:26.756 | DEBUG    | __main__:trials:24 - Trial = 12698/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.757 | DEBUG    | __main__:trials:29 - Trial = 12698/30000 | Total reward = 59.29
2022-01-26 14:17:26.760 | DEBUG    | __main__:trials:24 - Trial = 12699/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.762 | DEBUG    | __main__:trials:29 - Trial = 12699/30000 | Total reward = 35.26
2022-01-26 14:17:26.766 | DEBUG    | __main__:trials:24 - Trial = 12700/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.767 | DEBUG    | __main__:trials:29 - Trial = 12700/30000 | Total reward = 50.86
2022-01-26 14:17:26.771 | DEBUG    | __main__:trials:24 - Trial = 12701/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.772 | DEBUG    | __main__:trials:29 - Trial = 12701/30000 | Total reward = 49.53
2022-01-26 14:17:26.775 | DEBUG    | __main__:trials:24 - Trial = 12702/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.777 | DEBUG    | __main__:trials:29 - Trial = 12702/30000 | Total reward = 58.90
2022-01-26 14:17:26.781 | DEBUG    | __main__:trials:24 - Trial = 12703/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.782 | DEBUG    | __main__:trials:29 - Trial = 12703/30000 | Total reward = 43.02
2022-01-26 14:17:26.786 | DEBUG    | __main__:trials:24 - Trial = 12704/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.787 | DEBUG    | __main__:trials:29 - Trial = 12704/30000 | Total reward = 22.27
2022-01-26 14:17:26.791 | DEBUG    | __main__:trials:24 - Trial = 12705/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.792 | DEBUG    | __main__:trials:29 - Trial = 12705/30000 | Total reward = 47.06
2022-01-26 14:17:26.796 | DEBUG    | __main__:trials:24 - Trial = 12706/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.798 | DEBUG    | __main__:trials:29 - Trial = 12706/30000 | Total reward = 62.17
2022-01-26 14:17:26.801 | DEBUG    | __main__:trials:24 - Trial = 12707/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.802 | DEBUG    | __main__:trials:29 - Trial = 12707/30000 | Total reward = 49.21
2022-01-26 14:17:26.806 | DEBUG    | __main__:trials:24 - Trial = 12708/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.807 | DEBUG    | __main__:trials:29 - Trial = 12708/30000 | Total reward = 37.14
2022-01-26 14:17:26.812 | DEBUG    | __main__:trials:24 - Trial = 12709/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.812 | DEBUG    | __main__:trials:29 - Trial = 12709/30000 | Total reward = 49.16
2022-01-26 14:17:26.816 | DEBUG    | __main__:trials:24 - Trial = 12710/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.818 | DEBUG    | __main__:trials:29 - Trial = 12710/30000 | Total reward = 41.24
2022-01-26 14:17:26.822 | DEBUG    | __main__:trials:24 - Trial = 12711/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.822 | DEBUG    | __main__:trials:29 - Trial = 12711/30000 | Total reward = 49.21
2022-01-26 14:17:26.827 | DEBUG    | __main__:trials:24 - Trial = 12712/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.828 | DEBUG    | __main__:trials:29 - Trial = 12712/30000 | Total reward = 54.45
2022-01-26 14:17:26.831 | DEBUG    | __main__:trials:24 - Trial = 12713/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.833 | DEBUG    | __main__:trials:29 - Trial = 12713/30000 | Total reward = 61.03
2022-01-26 14:17:26.837 | DEBUG    | __main__:trials:24 - Trial = 12714/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.837 | DEBUG    | __main__:trials:29 - Trial = 12714/30000 | Total reward = 32.61
2022-01-26 14:17:26.842 | DEBUG    | __main__:trials:24 - Trial = 12715/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.843 | DEBUG    | __main__:trials:29 - Trial = 12715/30000 | Total reward = 42.78
2022-01-26 14:17:26.847 | DEBUG    | __main__:trials:24 - Trial = 12716/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.848 | DEBUG    | __main__:trials:29 - Trial = 12716/30000 | Total reward = 42.32
2022-01-26 14:17:26.852 | DEBUG    | __main__:trials:24 - Trial = 12717/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.853 | DEBUG    | __main__:trials:29 - Trial = 12717/30000 | Total reward = 62.67
2022-01-26 14:17:26.856 | DEBUG    | __main__:trials:24 - Trial = 12718/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.857 | DEBUG    | __main__:trials:29 - Trial = 12718/30000 | Total reward = 31.29
2022-01-26 14:17:26.860 | DEBUG    | __main__:trials:24 - Trial = 12719/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.862 | DEBUG    | __main__:trials:29 - Trial = 12719/30000 | Total reward = 48.76
2022-01-26 14:17:26.866 | DEBUG    | __main__:trials:24 - Trial = 12720/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.866 | DEBUG    | __main__:trials:29 - Trial = 12720/30000 | Total reward = 42.72
2022-01-26 14:17:26.871 | DEBUG    | __main__:trials:24 - Trial = 12721/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.872 | DEBUG    | __main__:trials:29 - Trial = 12721/30000 | Total reward = 22.70
2022-01-26 14:17:26.875 | DEBUG    | __main__:trials:24 - Trial = 12722/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.877 | DEBUG    | __main__:trials:29 - Trial = 12722/30000 | Total reward = 51.69
2022-01-26 14:17:26.880 | DEBUG    | __main__:trials:24 - Trial = 12723/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.881 | DEBUG    | __main__:trials:29 - Trial = 12723/30000 | Total reward = 39.02
2022-01-26 14:17:26.885 | DEBUG    | __main__:trials:24 - Trial = 12724/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.886 | DEBUG    | __main__:trials:29 - Trial = 12724/30000 | Total reward = 49.79
2022-01-26 14:17:26.891 | DEBUG    | __main__:trials:24 - Trial = 12725/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.891 | DEBUG    | __main__:trials:29 - Trial = 12725/30000 | Total reward = 36.19
2022-01-26 14:17:26.895 | DEBUG    | __main__:trials:24 - Trial = 12726/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.897 | DEBUG    | __main__:trials:29 - Trial = 12726/30000 | Total reward = 43.91
2022-01-26 14:17:26.901 | DEBUG    | __main__:trials:26 - Trial = 12727/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:26.902 | DEBUG    | __main__:trials:29 - Trial = 12727/30000 | Total reward = 32.37
2022-01-26 14:17:26.906 | DEBUG    | __main__:trials:24 - Trial = 12728/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.907 | DEBUG    | __main__:trials:29 - Trial = 12728/30000 | Total reward = 53.91
2022-01-26 14:17:26.911 | DEBUG    | __main__:trials:24 - Trial = 12729/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.913 | DEBUG    | __main__:trials:29 - Trial = 12729/30000 | Total reward = 38.07
2022-01-26 14:17:26.916 | DEBUG    | __main__:trials:24 - Trial = 12730/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.917 | DEBUG    | __main__:trials:29 - Trial = 12730/30000 | Total reward = 53.60
2022-01-26 14:17:26.921 | DEBUG    | __main__:trials:24 - Trial = 12731/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.921 | DEBUG    | __main__:trials:29 - Trial = 12731/30000 | Total reward = 47.69
2022-01-26 14:17:26.926 | DEBUG    | __main__:trials:24 - Trial = 12732/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.926 | DEBUG    | __main__:trials:29 - Trial = 12732/30000 | Total reward = 52.87
2022-01-26 14:17:26.931 | DEBUG    | __main__:trials:24 - Trial = 12733/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.931 | DEBUG    | __main__:trials:29 - Trial = 12733/30000 | Total reward = 57.31
2022-01-26 14:17:26.936 | DEBUG    | __main__:trials:24 - Trial = 12734/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.936 | DEBUG    | __main__:trials:29 - Trial = 12734/30000 | Total reward = 42.17
2022-01-26 14:17:26.940 | DEBUG    | __main__:trials:24 - Trial = 12735/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.942 | DEBUG    | __main__:trials:29 - Trial = 12735/30000 | Total reward = 53.60
2022-01-26 14:17:26.945 | DEBUG    | __main__:trials:24 - Trial = 12736/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.947 | DEBUG    | __main__:trials:29 - Trial = 12736/30000 | Total reward = 53.33
2022-01-26 14:17:26.951 | DEBUG    | __main__:trials:24 - Trial = 12737/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.951 | DEBUG    | __main__:trials:29 - Trial = 12737/30000 | Total reward = 54.72
2022-01-26 14:17:26.955 | DEBUG    | __main__:trials:24 - Trial = 12738/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.957 | DEBUG    | __main__:trials:29 - Trial = 12738/30000 | Total reward = 33.85
2022-01-26 14:17:26.960 | DEBUG    | __main__:trials:24 - Trial = 12739/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.961 | DEBUG    | __main__:trials:29 - Trial = 12739/30000 | Total reward = 48.58
2022-01-26 14:17:26.965 | DEBUG    | __main__:trials:24 - Trial = 12740/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.967 | DEBUG    | __main__:trials:29 - Trial = 12740/30000 | Total reward = 34.42
2022-01-26 14:17:26.970 | DEBUG    | __main__:trials:24 - Trial = 12741/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.972 | DEBUG    | __main__:trials:29 - Trial = 12741/30000 | Total reward = 37.96
2022-01-26 14:17:26.975 | DEBUG    | __main__:trials:24 - Trial = 12742/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.976 | DEBUG    | __main__:trials:29 - Trial = 12742/30000 | Total reward = 39.70
2022-01-26 14:17:26.981 | DEBUG    | __main__:trials:24 - Trial = 12743/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.982 | DEBUG    | __main__:trials:29 - Trial = 12743/30000 | Total reward = 64.60
2022-01-26 14:17:26.986 | DEBUG    | __main__:trials:24 - Trial = 12744/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.987 | DEBUG    | __main__:trials:29 - Trial = 12744/30000 | Total reward = 37.66
2022-01-26 14:17:26.991 | DEBUG    | __main__:trials:24 - Trial = 12745/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.992 | DEBUG    | __main__:trials:29 - Trial = 12745/30000 | Total reward = 42.47
2022-01-26 14:17:26.996 | DEBUG    | __main__:trials:24 - Trial = 12746/30000 | Max number of steps (20) reached
2022-01-26 14:17:26.997 | DEBUG    | __main__:trials:29 - Trial = 12746/30000 | Total reward = 50.44
2022-01-26 14:17:27.001 | DEBUG    | __main__:trials:24 - Trial = 12747/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.003 | DEBUG    | __main__:trials:29 - Trial = 12747/30000 | Total reward = 23.50
2022-01-26 14:17:27.006 | DEBUG    | __main__:trials:24 - Trial = 12748/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.007 | DEBUG    | __main__:trials:29 - Trial = 12748/30000 | Total reward = 37.83
2022-01-26 14:17:27.011 | DEBUG    | __main__:trials:24 - Trial = 12749/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.013 | DEBUG    | __main__:trials:29 - Trial = 12749/30000 | Total reward = 32.01
2022-01-26 14:17:27.016 | DEBUG    | __main__:trials:24 - Trial = 12750/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.018 | DEBUG    | __main__:trials:29 - Trial = 12750/30000 | Total reward = 39.20
2022-01-26 14:17:27.021 | DEBUG    | __main__:trials:24 - Trial = 12751/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.022 | DEBUG    | __main__:trials:29 - Trial = 12751/30000 | Total reward = 51.59
2022-01-26 14:17:27.027 | DEBUG    | __main__:trials:24 - Trial = 12752/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.027 | DEBUG    | __main__:trials:29 - Trial = 12752/30000 | Total reward = 57.71
2022-01-26 14:17:27.032 | DEBUG    | __main__:trials:24 - Trial = 12753/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.033 | DEBUG    | __main__:trials:29 - Trial = 12753/30000 | Total reward = 48.52
2022-01-26 14:17:27.037 | DEBUG    | __main__:trials:24 - Trial = 12754/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.038 | DEBUG    | __main__:trials:29 - Trial = 12754/30000 | Total reward = 47.73
2022-01-26 14:17:27.042 | DEBUG    | __main__:trials:24 - Trial = 12755/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.044 | DEBUG    | __main__:trials:29 - Trial = 12755/30000 | Total reward = 40.44
2022-01-26 14:17:27.048 | DEBUG    | __main__:trials:24 - Trial = 12756/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.049 | DEBUG    | __main__:trials:29 - Trial = 12756/30000 | Total reward = 37.69
2022-01-26 14:17:27.053 | DEBUG    | __main__:trials:24 - Trial = 12757/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.055 | DEBUG    | __main__:trials:29 - Trial = 12757/30000 | Total reward = 54.19
2022-01-26 14:17:27.059 | DEBUG    | __main__:trials:24 - Trial = 12758/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.060 | DEBUG    | __main__:trials:29 - Trial = 12758/30000 | Total reward = 53.14
2022-01-26 14:17:27.064 | DEBUG    | __main__:trials:24 - Trial = 12759/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.066 | DEBUG    | __main__:trials:29 - Trial = 12759/30000 | Total reward = 49.02
2022-01-26 14:17:27.070 | DEBUG    | __main__:trials:24 - Trial = 12760/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.070 | DEBUG    | __main__:trials:29 - Trial = 12760/30000 | Total reward = 48.57
2022-01-26 14:17:27.075 | DEBUG    | __main__:trials:24 - Trial = 12761/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.077 | DEBUG    | __main__:trials:29 - Trial = 12761/30000 | Total reward = 48.34
2022-01-26 14:17:27.080 | DEBUG    | __main__:trials:26 - Trial = 12762/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:27.081 | DEBUG    | __main__:trials:29 - Trial = 12762/30000 | Total reward = 32.37
2022-01-26 14:17:27.085 | DEBUG    | __main__:trials:24 - Trial = 12763/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.085 | DEBUG    | __main__:trials:29 - Trial = 12763/30000 | Total reward = 46.72
2022-01-26 14:17:27.089 | DEBUG    | __main__:trials:24 - Trial = 12764/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.090 | DEBUG    | __main__:trials:29 - Trial = 12764/30000 | Total reward = 39.51
2022-01-26 14:17:27.093 | DEBUG    | __main__:trials:24 - Trial = 12765/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.095 | DEBUG    | __main__:trials:29 - Trial = 12765/30000 | Total reward = 51.49
2022-01-26 14:17:27.098 | DEBUG    | __main__:trials:24 - Trial = 12766/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.099 | DEBUG    | __main__:trials:29 - Trial = 12766/30000 | Total reward = 48.80
2022-01-26 14:17:27.102 | DEBUG    | __main__:trials:24 - Trial = 12767/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.104 | DEBUG    | __main__:trials:29 - Trial = 12767/30000 | Total reward = 49.05
2022-01-26 14:17:27.107 | DEBUG    | __main__:trials:26 - Trial = 12768/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:27.109 | DEBUG    | __main__:trials:29 - Trial = 12768/30000 | Total reward = 24.77
2022-01-26 14:17:27.112 | DEBUG    | __main__:trials:24 - Trial = 12769/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.114 | DEBUG    | __main__:trials:29 - Trial = 12769/30000 | Total reward = 31.26
2022-01-26 14:17:27.118 | DEBUG    | __main__:trials:24 - Trial = 12770/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.119 | DEBUG    | __main__:trials:29 - Trial = 12770/30000 | Total reward = 41.03
2022-01-26 14:17:27.123 | DEBUG    | __main__:trials:24 - Trial = 12771/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.124 | DEBUG    | __main__:trials:29 - Trial = 12771/30000 | Total reward = 47.09
2022-01-26 14:17:27.128 | DEBUG    | __main__:trials:24 - Trial = 12772/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.130 | DEBUG    | __main__:trials:29 - Trial = 12772/30000 | Total reward = 46.90
2022-01-26 14:17:27.134 | DEBUG    | __main__:trials:24 - Trial = 12773/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.134 | DEBUG    | __main__:trials:29 - Trial = 12773/30000 | Total reward = 39.54
2022-01-26 14:17:27.139 | DEBUG    | __main__:trials:24 - Trial = 12774/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.140 | DEBUG    | __main__:trials:29 - Trial = 12774/30000 | Total reward = 53.66
2022-01-26 14:17:27.144 | DEBUG    | __main__:trials:24 - Trial = 12775/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.145 | DEBUG    | __main__:trials:29 - Trial = 12775/30000 | Total reward = 42.47
2022-01-26 14:17:27.149 | DEBUG    | __main__:trials:24 - Trial = 12776/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.151 | DEBUG    | __main__:trials:29 - Trial = 12776/30000 | Total reward = 56.92
2022-01-26 14:17:27.155 | DEBUG    | __main__:trials:24 - Trial = 12777/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.155 | DEBUG    | __main__:trials:29 - Trial = 12777/30000 | Total reward = 47.70
2022-01-26 14:17:27.159 | DEBUG    | __main__:trials:24 - Trial = 12778/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.161 | DEBUG    | __main__:trials:29 - Trial = 12778/30000 | Total reward = 41.88
2022-01-26 14:17:27.164 | DEBUG    | __main__:trials:24 - Trial = 12779/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.166 | DEBUG    | __main__:trials:29 - Trial = 12779/30000 | Total reward = 43.75
2022-01-26 14:17:27.169 | DEBUG    | __main__:trials:26 - Trial = 12780/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:27.170 | DEBUG    | __main__:trials:29 - Trial = 12780/30000 | Total reward = 36.84
2022-01-26 14:17:27.173 | DEBUG    | __main__:trials:24 - Trial = 12781/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.175 | DEBUG    | __main__:trials:29 - Trial = 12781/30000 | Total reward = 42.20
2022-01-26 14:17:27.179 | DEBUG    | __main__:trials:24 - Trial = 12782/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.180 | DEBUG    | __main__:trials:29 - Trial = 12782/30000 | Total reward = 40.40
2022-01-26 14:17:27.183 | DEBUG    | __main__:trials:24 - Trial = 12783/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.185 | DEBUG    | __main__:trials:29 - Trial = 12783/30000 | Total reward = 55.51
2022-01-26 14:17:27.188 | DEBUG    | __main__:trials:24 - Trial = 12784/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.190 | DEBUG    | __main__:trials:29 - Trial = 12784/30000 | Total reward = 47.36
2022-01-26 14:17:27.194 | DEBUG    | __main__:trials:24 - Trial = 12785/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.195 | DEBUG    | __main__:trials:29 - Trial = 12785/30000 | Total reward = 41.41
2022-01-26 14:17:27.198 | DEBUG    | __main__:trials:24 - Trial = 12786/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.200 | DEBUG    | __main__:trials:29 - Trial = 12786/30000 | Total reward = 60.57
2022-01-26 14:17:27.204 | DEBUG    | __main__:trials:24 - Trial = 12787/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.205 | DEBUG    | __main__:trials:29 - Trial = 12787/30000 | Total reward = 41.06
2022-01-26 14:17:27.208 | DEBUG    | __main__:trials:24 - Trial = 12788/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.210 | DEBUG    | __main__:trials:29 - Trial = 12788/30000 | Total reward = 42.51
2022-01-26 14:17:27.214 | DEBUG    | __main__:trials:24 - Trial = 12789/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.215 | DEBUG    | __main__:trials:29 - Trial = 12789/30000 | Total reward = 33.20
2022-01-26 14:17:27.219 | DEBUG    | __main__:trials:24 - Trial = 12790/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.220 | DEBUG    | __main__:trials:29 - Trial = 12790/30000 | Total reward = 45.51
2022-01-26 14:17:27.224 | DEBUG    | __main__:trials:24 - Trial = 12791/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.225 | DEBUG    | __main__:trials:29 - Trial = 12791/30000 | Total reward = 41.25
2022-01-26 14:17:27.229 | DEBUG    | __main__:trials:24 - Trial = 12792/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.230 | DEBUG    | __main__:trials:29 - Trial = 12792/30000 | Total reward = 41.91
2022-01-26 14:17:27.235 | DEBUG    | __main__:trials:24 - Trial = 12793/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.235 | DEBUG    | __main__:trials:29 - Trial = 12793/30000 | Total reward = 39.52
2022-01-26 14:17:27.239 | DEBUG    | __main__:trials:24 - Trial = 12794/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.241 | DEBUG    | __main__:trials:29 - Trial = 12794/30000 | Total reward = 38.46
2022-01-26 14:17:27.244 | DEBUG    | __main__:trials:24 - Trial = 12795/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.246 | DEBUG    | __main__:trials:29 - Trial = 12795/30000 | Total reward = 49.46
2022-01-26 14:17:27.249 | DEBUG    | __main__:trials:24 - Trial = 12796/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.250 | DEBUG    | __main__:trials:29 - Trial = 12796/30000 | Total reward = 51.51
2022-01-26 14:17:27.254 | DEBUG    | __main__:trials:24 - Trial = 12797/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.256 | DEBUG    | __main__:trials:29 - Trial = 12797/30000 | Total reward = 50.22
2022-01-26 14:17:27.259 | DEBUG    | __main__:trials:24 - Trial = 12798/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.260 | DEBUG    | __main__:trials:29 - Trial = 12798/30000 | Total reward = 47.38
2022-01-26 14:17:27.263 | DEBUG    | __main__:trials:24 - Trial = 12799/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.266 | DEBUG    | __main__:trials:29 - Trial = 12799/30000 | Total reward = 52.77
2022-01-26 14:17:27.269 | DEBUG    | __main__:trials:24 - Trial = 12800/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.270 | DEBUG    | __main__:trials:29 - Trial = 12800/30000 | Total reward = 48.11
2022-01-26 14:17:27.274 | DEBUG    | __main__:trials:24 - Trial = 12801/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.275 | DEBUG    | __main__:trials:29 - Trial = 12801/30000 | Total reward = 34.95
2022-01-26 14:17:27.280 | DEBUG    | __main__:trials:24 - Trial = 12802/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.281 | DEBUG    | __main__:trials:29 - Trial = 12802/30000 | Total reward = 52.80
2022-01-26 14:17:27.284 | DEBUG    | __main__:trials:24 - Trial = 12803/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.285 | DEBUG    | __main__:trials:29 - Trial = 12803/30000 | Total reward = 45.39
2022-01-26 14:17:27.289 | DEBUG    | __main__:trials:24 - Trial = 12804/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.298 | DEBUG    | __main__:trials:29 - Trial = 12804/30000 | Total reward = 52.34
2022-01-26 14:17:27.301 | DEBUG    | __main__:trials:24 - Trial = 12805/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.302 | DEBUG    | __main__:trials:29 - Trial = 12805/30000 | Total reward = 47.47
2022-01-26 14:17:27.306 | DEBUG    | __main__:trials:24 - Trial = 12806/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.307 | DEBUG    | __main__:trials:29 - Trial = 12806/30000 | Total reward = 43.30
2022-01-26 14:17:27.311 | DEBUG    | __main__:trials:24 - Trial = 12807/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.313 | DEBUG    | __main__:trials:29 - Trial = 12807/30000 | Total reward = 47.03
2022-01-26 14:17:27.316 | DEBUG    | __main__:trials:24 - Trial = 12808/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.317 | DEBUG    | __main__:trials:29 - Trial = 12808/30000 | Total reward = 36.85
2022-01-26 14:17:27.320 | DEBUG    | __main__:trials:24 - Trial = 12809/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.322 | DEBUG    | __main__:trials:29 - Trial = 12809/30000 | Total reward = 47.45
2022-01-26 14:17:27.325 | DEBUG    | __main__:trials:24 - Trial = 12810/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.326 | DEBUG    | __main__:trials:29 - Trial = 12810/30000 | Total reward = 46.22
2022-01-26 14:17:27.330 | DEBUG    | __main__:trials:24 - Trial = 12811/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.331 | DEBUG    | __main__:trials:29 - Trial = 12811/30000 | Total reward = 38.68
2022-01-26 14:17:27.334 | DEBUG    | __main__:trials:24 - Trial = 12812/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.336 | DEBUG    | __main__:trials:29 - Trial = 12812/30000 | Total reward = 47.51
2022-01-26 14:17:27.340 | DEBUG    | __main__:trials:24 - Trial = 12813/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.341 | DEBUG    | __main__:trials:29 - Trial = 12813/30000 | Total reward = 32.96
2022-01-26 14:17:27.344 | DEBUG    | __main__:trials:24 - Trial = 12814/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.346 | DEBUG    | __main__:trials:29 - Trial = 12814/30000 | Total reward = 49.80
2022-01-26 14:17:27.349 | DEBUG    | __main__:trials:24 - Trial = 12815/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.350 | DEBUG    | __main__:trials:29 - Trial = 12815/30000 | Total reward = 35.44
2022-01-26 14:17:27.354 | DEBUG    | __main__:trials:24 - Trial = 12816/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.356 | DEBUG    | __main__:trials:29 - Trial = 12816/30000 | Total reward = 45.85
2022-01-26 14:17:27.360 | DEBUG    | __main__:trials:24 - Trial = 12817/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.360 | DEBUG    | __main__:trials:29 - Trial = 12817/30000 | Total reward = 63.20
2022-01-26 14:17:27.363 | DEBUG    | __main__:trials:26 - Trial = 12818/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:27.365 | DEBUG    | __main__:trials:29 - Trial = 12818/30000 | Total reward = 22.51
2022-01-26 14:17:27.368 | DEBUG    | __main__:trials:24 - Trial = 12819/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.370 | DEBUG    | __main__:trials:29 - Trial = 12819/30000 | Total reward = 42.61
2022-01-26 14:17:27.373 | DEBUG    | __main__:trials:24 - Trial = 12820/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.374 | DEBUG    | __main__:trials:29 - Trial = 12820/30000 | Total reward = 55.55
2022-01-26 14:17:27.378 | DEBUG    | __main__:trials:24 - Trial = 12821/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.379 | DEBUG    | __main__:trials:29 - Trial = 12821/30000 | Total reward = 52.00
2022-01-26 14:17:27.383 | DEBUG    | __main__:trials:24 - Trial = 12822/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.384 | DEBUG    | __main__:trials:29 - Trial = 12822/30000 | Total reward = 47.62
2022-01-26 14:17:27.388 | DEBUG    | __main__:trials:24 - Trial = 12823/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.389 | DEBUG    | __main__:trials:29 - Trial = 12823/30000 | Total reward = 37.75
2022-01-26 14:17:27.392 | DEBUG    | __main__:trials:24 - Trial = 12824/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.394 | DEBUG    | __main__:trials:29 - Trial = 12824/30000 | Total reward = 47.62
2022-01-26 14:17:27.397 | DEBUG    | __main__:trials:24 - Trial = 12825/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.398 | DEBUG    | __main__:trials:29 - Trial = 12825/30000 | Total reward = 46.72
2022-01-26 14:17:27.401 | DEBUG    | __main__:trials:24 - Trial = 12826/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.403 | DEBUG    | __main__:trials:29 - Trial = 12826/30000 | Total reward = 43.67
2022-01-26 14:17:27.406 | DEBUG    | __main__:trials:24 - Trial = 12827/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.408 | DEBUG    | __main__:trials:29 - Trial = 12827/30000 | Total reward = 38.21
2022-01-26 14:17:27.411 | DEBUG    | __main__:trials:24 - Trial = 12828/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.413 | DEBUG    | __main__:trials:29 - Trial = 12828/30000 | Total reward = 47.56
2022-01-26 14:17:27.416 | DEBUG    | __main__:trials:24 - Trial = 12829/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.417 | DEBUG    | __main__:trials:29 - Trial = 12829/30000 | Total reward = 58.30
2022-01-26 14:17:27.421 | DEBUG    | __main__:trials:24 - Trial = 12830/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.422 | DEBUG    | __main__:trials:29 - Trial = 12830/30000 | Total reward = 48.05
2022-01-26 14:17:27.426 | DEBUG    | __main__:trials:26 - Trial = 12831/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:27.426 | DEBUG    | __main__:trials:29 - Trial = 12831/30000 | Total reward = 18.19
2022-01-26 14:17:27.431 | DEBUG    | __main__:trials:24 - Trial = 12832/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.432 | DEBUG    | __main__:trials:29 - Trial = 12832/30000 | Total reward = 45.02
2022-01-26 14:17:27.436 | DEBUG    | __main__:trials:24 - Trial = 12833/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.437 | DEBUG    | __main__:trials:29 - Trial = 12833/30000 | Total reward = 43.69
2022-01-26 14:17:27.440 | DEBUG    | __main__:trials:24 - Trial = 12834/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.441 | DEBUG    | __main__:trials:29 - Trial = 12834/30000 | Total reward = 48.99
2022-01-26 14:17:27.445 | DEBUG    | __main__:trials:24 - Trial = 12835/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.446 | DEBUG    | __main__:trials:29 - Trial = 12835/30000 | Total reward = 37.04
2022-01-26 14:17:27.449 | DEBUG    | __main__:trials:24 - Trial = 12836/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.450 | DEBUG    | __main__:trials:29 - Trial = 12836/30000 | Total reward = 42.84
2022-01-26 14:17:27.453 | DEBUG    | __main__:trials:24 - Trial = 12837/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.454 | DEBUG    | __main__:trials:29 - Trial = 12837/30000 | Total reward = 46.77
2022-01-26 14:17:27.457 | DEBUG    | __main__:trials:24 - Trial = 12838/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.458 | DEBUG    | __main__:trials:29 - Trial = 12838/30000 | Total reward = 42.53
2022-01-26 14:17:27.461 | DEBUG    | __main__:trials:24 - Trial = 12839/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.463 | DEBUG    | __main__:trials:29 - Trial = 12839/30000 | Total reward = 29.80
2022-01-26 14:17:27.467 | DEBUG    | __main__:trials:24 - Trial = 12840/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.468 | DEBUG    | __main__:trials:29 - Trial = 12840/30000 | Total reward = 47.03
2022-01-26 14:17:27.472 | DEBUG    | __main__:trials:24 - Trial = 12841/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.474 | DEBUG    | __main__:trials:29 - Trial = 12841/30000 | Total reward = 40.29
2022-01-26 14:17:27.477 | DEBUG    | __main__:trials:24 - Trial = 12842/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.479 | DEBUG    | __main__:trials:29 - Trial = 12842/30000 | Total reward = 45.07
2022-01-26 14:17:27.483 | DEBUG    | __main__:trials:24 - Trial = 12843/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.484 | DEBUG    | __main__:trials:29 - Trial = 12843/30000 | Total reward = 39.70
2022-01-26 14:17:27.488 | DEBUG    | __main__:trials:24 - Trial = 12844/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.489 | DEBUG    | __main__:trials:29 - Trial = 12844/30000 | Total reward = 45.55
2022-01-26 14:17:27.493 | DEBUG    | __main__:trials:24 - Trial = 12845/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.494 | DEBUG    | __main__:trials:29 - Trial = 12845/30000 | Total reward = 40.20
2022-01-26 14:17:27.501 | DEBUG    | __main__:trials:24 - Trial = 12846/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.501 | DEBUG    | __main__:trials:29 - Trial = 12846/30000 | Total reward = 35.83
2022-01-26 14:17:27.504 | DEBUG    | __main__:trials:24 - Trial = 12847/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.505 | DEBUG    | __main__:trials:29 - Trial = 12847/30000 | Total reward = 47.03
2022-01-26 14:17:27.508 | DEBUG    | __main__:trials:24 - Trial = 12848/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.509 | DEBUG    | __main__:trials:29 - Trial = 12848/30000 | Total reward = 43.55
2022-01-26 14:17:27.512 | DEBUG    | __main__:trials:24 - Trial = 12849/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.514 | DEBUG    | __main__:trials:29 - Trial = 12849/30000 | Total reward = 40.34
2022-01-26 14:17:27.518 | DEBUG    | __main__:trials:24 - Trial = 12850/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.518 | DEBUG    | __main__:trials:29 - Trial = 12850/30000 | Total reward = 45.41
2022-01-26 14:17:27.523 | DEBUG    | __main__:trials:24 - Trial = 12851/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.525 | DEBUG    | __main__:trials:29 - Trial = 12851/30000 | Total reward = 41.67
2022-01-26 14:17:27.529 | DEBUG    | __main__:trials:24 - Trial = 12852/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.530 | DEBUG    | __main__:trials:29 - Trial = 12852/30000 | Total reward = 50.53
2022-01-26 14:17:27.534 | DEBUG    | __main__:trials:24 - Trial = 12853/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.536 | DEBUG    | __main__:trials:29 - Trial = 12853/30000 | Total reward = 46.48
2022-01-26 14:17:27.539 | DEBUG    | __main__:trials:24 - Trial = 12854/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.541 | DEBUG    | __main__:trials:29 - Trial = 12854/30000 | Total reward = 38.94
2022-01-26 14:17:27.544 | DEBUG    | __main__:trials:24 - Trial = 12855/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.545 | DEBUG    | __main__:trials:29 - Trial = 12855/30000 | Total reward = 38.47
2022-01-26 14:17:27.548 | DEBUG    | __main__:trials:24 - Trial = 12856/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.550 | DEBUG    | __main__:trials:29 - Trial = 12856/30000 | Total reward = 38.39
2022-01-26 14:17:27.553 | DEBUG    | __main__:trials:24 - Trial = 12857/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.554 | DEBUG    | __main__:trials:29 - Trial = 12857/30000 | Total reward = 45.17
2022-01-26 14:17:27.557 | DEBUG    | __main__:trials:24 - Trial = 12858/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.558 | DEBUG    | __main__:trials:29 - Trial = 12858/30000 | Total reward = 38.13
2022-01-26 14:17:27.562 | DEBUG    | __main__:trials:24 - Trial = 12859/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.563 | DEBUG    | __main__:trials:29 - Trial = 12859/30000 | Total reward = 36.45
2022-01-26 14:17:27.567 | DEBUG    | __main__:trials:24 - Trial = 12860/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.568 | DEBUG    | __main__:trials:29 - Trial = 12860/30000 | Total reward = 52.68
2022-01-26 14:17:27.572 | DEBUG    | __main__:trials:24 - Trial = 12861/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.574 | DEBUG    | __main__:trials:29 - Trial = 12861/30000 | Total reward = 47.17
2022-01-26 14:17:27.578 | DEBUG    | __main__:trials:24 - Trial = 12862/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.578 | DEBUG    | __main__:trials:29 - Trial = 12862/30000 | Total reward = 49.03
2022-01-26 14:17:27.582 | DEBUG    | __main__:trials:24 - Trial = 12863/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.584 | DEBUG    | __main__:trials:29 - Trial = 12863/30000 | Total reward = 47.03
2022-01-26 14:17:27.587 | DEBUG    | __main__:trials:24 - Trial = 12864/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.589 | DEBUG    | __main__:trials:29 - Trial = 12864/30000 | Total reward = 42.34
2022-01-26 14:17:27.592 | DEBUG    | __main__:trials:24 - Trial = 12865/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.594 | DEBUG    | __main__:trials:29 - Trial = 12865/30000 | Total reward = 48.62
2022-01-26 14:17:27.598 | DEBUG    | __main__:trials:24 - Trial = 12866/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.599 | DEBUG    | __main__:trials:29 - Trial = 12866/30000 | Total reward = 42.79
2022-01-26 14:17:27.603 | DEBUG    | __main__:trials:24 - Trial = 12867/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.604 | DEBUG    | __main__:trials:29 - Trial = 12867/30000 | Total reward = 39.18
2022-01-26 14:17:27.608 | DEBUG    | __main__:trials:24 - Trial = 12868/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.610 | DEBUG    | __main__:trials:29 - Trial = 12868/30000 | Total reward = 39.09
2022-01-26 14:17:27.614 | DEBUG    | __main__:trials:24 - Trial = 12869/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.615 | DEBUG    | __main__:trials:29 - Trial = 12869/30000 | Total reward = 39.43
2022-01-26 14:17:27.619 | DEBUG    | __main__:trials:24 - Trial = 12870/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.621 | DEBUG    | __main__:trials:29 - Trial = 12870/30000 | Total reward = 46.75
2022-01-26 14:17:27.624 | DEBUG    | __main__:trials:24 - Trial = 12871/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.626 | DEBUG    | __main__:trials:29 - Trial = 12871/30000 | Total reward = 47.51
2022-01-26 14:17:27.630 | DEBUG    | __main__:trials:24 - Trial = 12872/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.631 | DEBUG    | __main__:trials:29 - Trial = 12872/30000 | Total reward = 41.78
2022-01-26 14:17:27.635 | DEBUG    | __main__:trials:24 - Trial = 12873/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.635 | DEBUG    | __main__:trials:29 - Trial = 12873/30000 | Total reward = 44.95
2022-01-26 14:17:27.640 | DEBUG    | __main__:trials:24 - Trial = 12874/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.642 | DEBUG    | __main__:trials:29 - Trial = 12874/30000 | Total reward = 38.49
2022-01-26 14:17:27.645 | DEBUG    | __main__:trials:24 - Trial = 12875/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.646 | DEBUG    | __main__:trials:29 - Trial = 12875/30000 | Total reward = 49.29
2022-01-26 14:17:27.650 | DEBUG    | __main__:trials:24 - Trial = 12876/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.651 | DEBUG    | __main__:trials:29 - Trial = 12876/30000 | Total reward = 38.48
2022-01-26 14:17:27.654 | DEBUG    | __main__:trials:24 - Trial = 12877/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.656 | DEBUG    | __main__:trials:29 - Trial = 12877/30000 | Total reward = 41.48
2022-01-26 14:17:27.659 | DEBUG    | __main__:trials:24 - Trial = 12878/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.661 | DEBUG    | __main__:trials:29 - Trial = 12878/30000 | Total reward = 47.03
2022-01-26 14:17:27.664 | DEBUG    | __main__:trials:24 - Trial = 12879/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.665 | DEBUG    | __main__:trials:29 - Trial = 12879/30000 | Total reward = 44.75
2022-01-26 14:17:27.668 | DEBUG    | __main__:trials:24 - Trial = 12880/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.670 | DEBUG    | __main__:trials:29 - Trial = 12880/30000 | Total reward = 45.16
2022-01-26 14:17:27.674 | DEBUG    | __main__:trials:24 - Trial = 12881/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.675 | DEBUG    | __main__:trials:29 - Trial = 12881/30000 | Total reward = 44.25
2022-01-26 14:17:27.678 | DEBUG    | __main__:trials:24 - Trial = 12882/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.680 | DEBUG    | __main__:trials:29 - Trial = 12882/30000 | Total reward = 48.86
2022-01-26 14:17:27.683 | DEBUG    | __main__:trials:24 - Trial = 12883/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.685 | DEBUG    | __main__:trials:29 - Trial = 12883/30000 | Total reward = 41.76
2022-01-26 14:17:27.688 | DEBUG    | __main__:trials:24 - Trial = 12884/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.690 | DEBUG    | __main__:trials:29 - Trial = 12884/30000 | Total reward = 38.66
2022-01-26 14:17:27.693 | DEBUG    | __main__:trials:24 - Trial = 12885/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.694 | DEBUG    | __main__:trials:29 - Trial = 12885/30000 | Total reward = 48.05
2022-01-26 14:17:27.697 | DEBUG    | __main__:trials:24 - Trial = 12886/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.699 | DEBUG    | __main__:trials:29 - Trial = 12886/30000 | Total reward = 38.96
2022-01-26 14:17:27.702 | DEBUG    | __main__:trials:24 - Trial = 12887/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.703 | DEBUG    | __main__:trials:29 - Trial = 12887/30000 | Total reward = 52.33
2022-01-26 14:17:27.706 | DEBUG    | __main__:trials:24 - Trial = 12888/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.708 | DEBUG    | __main__:trials:29 - Trial = 12888/30000 | Total reward = 35.04
2022-01-26 14:17:27.711 | DEBUG    | __main__:trials:24 - Trial = 12889/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.713 | DEBUG    | __main__:trials:29 - Trial = 12889/30000 | Total reward = 58.60
2022-01-26 14:17:27.716 | DEBUG    | __main__:trials:24 - Trial = 12890/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.717 | DEBUG    | __main__:trials:29 - Trial = 12890/30000 | Total reward = 16.36
2022-01-26 14:17:27.721 | DEBUG    | __main__:trials:24 - Trial = 12891/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.723 | DEBUG    | __main__:trials:29 - Trial = 12891/30000 | Total reward = 44.92
2022-01-26 14:17:27.726 | DEBUG    | __main__:trials:24 - Trial = 12892/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.728 | DEBUG    | __main__:trials:29 - Trial = 12892/30000 | Total reward = 39.55
2022-01-26 14:17:27.731 | DEBUG    | __main__:trials:24 - Trial = 12893/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.733 | DEBUG    | __main__:trials:29 - Trial = 12893/30000 | Total reward = 43.68
2022-01-26 14:17:27.736 | DEBUG    | __main__:trials:24 - Trial = 12894/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.737 | DEBUG    | __main__:trials:29 - Trial = 12894/30000 | Total reward = 47.03
2022-01-26 14:17:27.742 | DEBUG    | __main__:trials:24 - Trial = 12895/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.743 | DEBUG    | __main__:trials:29 - Trial = 12895/30000 | Total reward = 48.92
2022-01-26 14:17:27.746 | DEBUG    | __main__:trials:24 - Trial = 12896/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.748 | DEBUG    | __main__:trials:29 - Trial = 12896/30000 | Total reward = 39.12
2022-01-26 14:17:27.752 | DEBUG    | __main__:trials:24 - Trial = 12897/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.754 | DEBUG    | __main__:trials:29 - Trial = 12897/30000 | Total reward = 37.16
2022-01-26 14:17:27.757 | DEBUG    | __main__:trials:24 - Trial = 12898/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.759 | DEBUG    | __main__:trials:29 - Trial = 12898/30000 | Total reward = 36.26
2022-01-26 14:17:27.763 | DEBUG    | __main__:trials:24 - Trial = 12899/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.763 | DEBUG    | __main__:trials:29 - Trial = 12899/30000 | Total reward = 37.33
2022-01-26 14:17:27.767 | DEBUG    | __main__:trials:24 - Trial = 12900/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.768 | DEBUG    | __main__:trials:29 - Trial = 12900/30000 | Total reward = 45.15
2022-01-26 14:17:27.772 | DEBUG    | __main__:trials:24 - Trial = 12901/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.773 | DEBUG    | __main__:trials:29 - Trial = 12901/30000 | Total reward = 28.88
2022-01-26 14:17:27.777 | DEBUG    | __main__:trials:24 - Trial = 12902/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.778 | DEBUG    | __main__:trials:29 - Trial = 12902/30000 | Total reward = 38.60
2022-01-26 14:17:27.782 | DEBUG    | __main__:trials:24 - Trial = 12903/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.783 | DEBUG    | __main__:trials:29 - Trial = 12903/30000 | Total reward = 45.16
2022-01-26 14:17:27.786 | DEBUG    | __main__:trials:24 - Trial = 12904/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.788 | DEBUG    | __main__:trials:29 - Trial = 12904/30000 | Total reward = 64.78
2022-01-26 14:17:27.791 | DEBUG    | __main__:trials:24 - Trial = 12905/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.791 | DEBUG    | __main__:trials:29 - Trial = 12905/30000 | Total reward = 51.53
2022-01-26 14:17:27.795 | DEBUG    | __main__:trials:24 - Trial = 12906/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.795 | DEBUG    | __main__:trials:29 - Trial = 12906/30000 | Total reward = 40.45
2022-01-26 14:17:27.799 | DEBUG    | __main__:trials:24 - Trial = 12907/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.800 | DEBUG    | __main__:trials:29 - Trial = 12907/30000 | Total reward = 47.72
2022-01-26 14:17:27.804 | DEBUG    | __main__:trials:24 - Trial = 12908/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.805 | DEBUG    | __main__:trials:29 - Trial = 12908/30000 | Total reward = 56.14
2022-01-26 14:17:27.809 | DEBUG    | __main__:trials:24 - Trial = 12909/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.811 | DEBUG    | __main__:trials:29 - Trial = 12909/30000 | Total reward = 43.47
2022-01-26 14:17:27.814 | DEBUG    | __main__:trials:24 - Trial = 12910/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.815 | DEBUG    | __main__:trials:29 - Trial = 12910/30000 | Total reward = 41.17
2022-01-26 14:17:27.819 | DEBUG    | __main__:trials:24 - Trial = 12911/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.820 | DEBUG    | __main__:trials:29 - Trial = 12911/30000 | Total reward = 46.40
2022-01-26 14:17:27.824 | DEBUG    | __main__:trials:24 - Trial = 12912/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.826 | DEBUG    | __main__:trials:29 - Trial = 12912/30000 | Total reward = 41.48
2022-01-26 14:17:27.829 | DEBUG    | __main__:trials:24 - Trial = 12913/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.831 | DEBUG    | __main__:trials:29 - Trial = 12913/30000 | Total reward = 43.32
2022-01-26 14:17:27.834 | DEBUG    | __main__:trials:24 - Trial = 12914/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.836 | DEBUG    | __main__:trials:29 - Trial = 12914/30000 | Total reward = 39.57
2022-01-26 14:17:27.840 | DEBUG    | __main__:trials:24 - Trial = 12915/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.840 | DEBUG    | __main__:trials:29 - Trial = 12915/30000 | Total reward = 47.58
2022-01-26 14:17:27.844 | DEBUG    | __main__:trials:24 - Trial = 12916/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.845 | DEBUG    | __main__:trials:29 - Trial = 12916/30000 | Total reward = 33.73
2022-01-26 14:17:27.849 | DEBUG    | __main__:trials:26 - Trial = 12917/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:27.851 | DEBUG    | __main__:trials:29 - Trial = 12917/30000 | Total reward = 32.05
2022-01-26 14:17:27.855 | DEBUG    | __main__:trials:24 - Trial = 12918/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.855 | DEBUG    | __main__:trials:29 - Trial = 12918/30000 | Total reward = 44.80
2022-01-26 14:17:27.859 | DEBUG    | __main__:trials:24 - Trial = 12919/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.861 | DEBUG    | __main__:trials:29 - Trial = 12919/30000 | Total reward = 43.60
2022-01-26 14:17:27.864 | DEBUG    | __main__:trials:24 - Trial = 12920/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.866 | DEBUG    | __main__:trials:29 - Trial = 12920/30000 | Total reward = 37.88
2022-01-26 14:17:27.869 | DEBUG    | __main__:trials:24 - Trial = 12921/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.871 | DEBUG    | __main__:trials:29 - Trial = 12921/30000 | Total reward = 44.87
2022-01-26 14:17:27.874 | DEBUG    | __main__:trials:24 - Trial = 12922/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.876 | DEBUG    | __main__:trials:29 - Trial = 12922/30000 | Total reward = 34.83
2022-01-26 14:17:27.879 | DEBUG    | __main__:trials:24 - Trial = 12923/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.881 | DEBUG    | __main__:trials:29 - Trial = 12923/30000 | Total reward = 48.20
2022-01-26 14:17:27.884 | DEBUG    | __main__:trials:24 - Trial = 12924/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.886 | DEBUG    | __main__:trials:29 - Trial = 12924/30000 | Total reward = 47.03
2022-01-26 14:17:27.889 | DEBUG    | __main__:trials:24 - Trial = 12925/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.889 | DEBUG    | __main__:trials:29 - Trial = 12925/30000 | Total reward = 51.38
2022-01-26 14:17:27.894 | DEBUG    | __main__:trials:24 - Trial = 12926/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.894 | DEBUG    | __main__:trials:29 - Trial = 12926/30000 | Total reward = 47.45
2022-01-26 14:17:27.899 | DEBUG    | __main__:trials:24 - Trial = 12927/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.901 | DEBUG    | __main__:trials:29 - Trial = 12927/30000 | Total reward = 47.21
2022-01-26 14:17:27.904 | DEBUG    | __main__:trials:24 - Trial = 12928/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.906 | DEBUG    | __main__:trials:29 - Trial = 12928/30000 | Total reward = 43.10
2022-01-26 14:17:27.909 | DEBUG    | __main__:trials:24 - Trial = 12929/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.911 | DEBUG    | __main__:trials:29 - Trial = 12929/30000 | Total reward = 47.15
2022-01-26 14:17:27.915 | DEBUG    | __main__:trials:24 - Trial = 12930/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.916 | DEBUG    | __main__:trials:29 - Trial = 12930/30000 | Total reward = 39.48
2022-01-26 14:17:27.920 | DEBUG    | __main__:trials:24 - Trial = 12931/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.922 | DEBUG    | __main__:trials:29 - Trial = 12931/30000 | Total reward = 38.20
2022-01-26 14:17:27.925 | DEBUG    | __main__:trials:24 - Trial = 12932/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.927 | DEBUG    | __main__:trials:29 - Trial = 12932/30000 | Total reward = 55.13
2022-01-26 14:17:27.930 | DEBUG    | __main__:trials:24 - Trial = 12933/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.931 | DEBUG    | __main__:trials:29 - Trial = 12933/30000 | Total reward = 47.39
2022-01-26 14:17:27.935 | DEBUG    | __main__:trials:24 - Trial = 12934/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.937 | DEBUG    | __main__:trials:29 - Trial = 12934/30000 | Total reward = 43.62
2022-01-26 14:17:27.940 | DEBUG    | __main__:trials:24 - Trial = 12935/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.942 | DEBUG    | __main__:trials:29 - Trial = 12935/30000 | Total reward = 37.74
2022-01-26 14:17:27.945 | DEBUG    | __main__:trials:24 - Trial = 12936/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.946 | DEBUG    | __main__:trials:29 - Trial = 12936/30000 | Total reward = 48.53
2022-01-26 14:17:27.951 | DEBUG    | __main__:trials:24 - Trial = 12937/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.951 | DEBUG    | __main__:trials:29 - Trial = 12937/30000 | Total reward = 40.42
2022-01-26 14:17:27.956 | DEBUG    | __main__:trials:24 - Trial = 12938/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.957 | DEBUG    | __main__:trials:29 - Trial = 12938/30000 | Total reward = 40.37
2022-01-26 14:17:27.961 | DEBUG    | __main__:trials:24 - Trial = 12939/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.962 | DEBUG    | __main__:trials:29 - Trial = 12939/30000 | Total reward = 47.21
2022-01-26 14:17:27.966 | DEBUG    | __main__:trials:24 - Trial = 12940/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.968 | DEBUG    | __main__:trials:29 - Trial = 12940/30000 | Total reward = 44.96
2022-01-26 14:17:27.971 | DEBUG    | __main__:trials:24 - Trial = 12941/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.972 | DEBUG    | __main__:trials:29 - Trial = 12941/30000 | Total reward = 49.77
2022-01-26 14:17:27.976 | DEBUG    | __main__:trials:24 - Trial = 12942/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.977 | DEBUG    | __main__:trials:29 - Trial = 12942/30000 | Total reward = 40.83
2022-01-26 14:17:27.981 | DEBUG    | __main__:trials:24 - Trial = 12943/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.982 | DEBUG    | __main__:trials:29 - Trial = 12943/30000 | Total reward = 32.15
2022-01-26 14:17:27.986 | DEBUG    | __main__:trials:24 - Trial = 12944/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.986 | DEBUG    | __main__:trials:29 - Trial = 12944/30000 | Total reward = 42.31
2022-01-26 14:17:27.991 | DEBUG    | __main__:trials:24 - Trial = 12945/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.992 | DEBUG    | __main__:trials:29 - Trial = 12945/30000 | Total reward = 47.62
2022-01-26 14:17:27.996 | DEBUG    | __main__:trials:24 - Trial = 12946/30000 | Max number of steps (20) reached
2022-01-26 14:17:27.997 | DEBUG    | __main__:trials:29 - Trial = 12946/30000 | Total reward = 41.38
2022-01-26 14:17:28.000 | DEBUG    | __main__:trials:24 - Trial = 12947/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.002 | DEBUG    | __main__:trials:29 - Trial = 12947/30000 | Total reward = 34.37
2022-01-26 14:17:28.005 | DEBUG    | __main__:trials:24 - Trial = 12948/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.006 | DEBUG    | __main__:trials:29 - Trial = 12948/30000 | Total reward = 50.86
2022-01-26 14:17:28.009 | DEBUG    | __main__:trials:24 - Trial = 12949/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.010 | DEBUG    | __main__:trials:29 - Trial = 12949/30000 | Total reward = 47.41
2022-01-26 14:17:28.013 | DEBUG    | __main__:trials:24 - Trial = 12950/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.014 | DEBUG    | __main__:trials:29 - Trial = 12950/30000 | Total reward = 48.91
2022-01-26 14:17:28.017 | DEBUG    | __main__:trials:24 - Trial = 12951/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.018 | DEBUG    | __main__:trials:29 - Trial = 12951/30000 | Total reward = 32.65
2022-01-26 14:17:28.022 | DEBUG    | __main__:trials:24 - Trial = 12952/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.023 | DEBUG    | __main__:trials:29 - Trial = 12952/30000 | Total reward = 41.99
2022-01-26 14:17:28.026 | DEBUG    | __main__:trials:24 - Trial = 12953/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.028 | DEBUG    | __main__:trials:29 - Trial = 12953/30000 | Total reward = 35.42
2022-01-26 14:17:28.032 | DEBUG    | __main__:trials:24 - Trial = 12954/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.032 | DEBUG    | __main__:trials:29 - Trial = 12954/30000 | Total reward = 31.28
2022-01-26 14:17:28.037 | DEBUG    | __main__:trials:24 - Trial = 12955/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.038 | DEBUG    | __main__:trials:29 - Trial = 12955/30000 | Total reward = 48.64
2022-01-26 14:17:28.042 | DEBUG    | __main__:trials:24 - Trial = 12956/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.043 | DEBUG    | __main__:trials:29 - Trial = 12956/30000 | Total reward = 51.63
2022-01-26 14:17:28.048 | DEBUG    | __main__:trials:24 - Trial = 12957/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.048 | DEBUG    | __main__:trials:29 - Trial = 12957/30000 | Total reward = 39.12
2022-01-26 14:17:28.052 | DEBUG    | __main__:trials:24 - Trial = 12958/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.053 | DEBUG    | __main__:trials:29 - Trial = 12958/30000 | Total reward = 44.20
2022-01-26 14:17:28.057 | DEBUG    | __main__:trials:24 - Trial = 12959/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.058 | DEBUG    | __main__:trials:29 - Trial = 12959/30000 | Total reward = 41.67
2022-01-26 14:17:28.062 | DEBUG    | __main__:trials:24 - Trial = 12960/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.064 | DEBUG    | __main__:trials:29 - Trial = 12960/30000 | Total reward = 45.91
2022-01-26 14:17:28.068 | DEBUG    | __main__:trials:24 - Trial = 12961/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.068 | DEBUG    | __main__:trials:29 - Trial = 12961/30000 | Total reward = 36.98
2022-01-26 14:17:28.072 | DEBUG    | __main__:trials:24 - Trial = 12962/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.074 | DEBUG    | __main__:trials:29 - Trial = 12962/30000 | Total reward = 41.59
2022-01-26 14:17:28.078 | DEBUG    | __main__:trials:24 - Trial = 12963/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.079 | DEBUG    | __main__:trials:29 - Trial = 12963/30000 | Total reward = 33.33
2022-01-26 14:17:28.083 | DEBUG    | __main__:trials:24 - Trial = 12964/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.084 | DEBUG    | __main__:trials:29 - Trial = 12964/30000 | Total reward = 35.96
2022-01-26 14:17:28.089 | DEBUG    | __main__:trials:24 - Trial = 12965/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.089 | DEBUG    | __main__:trials:29 - Trial = 12965/30000 | Total reward = 39.72
2022-01-26 14:17:28.093 | DEBUG    | __main__:trials:24 - Trial = 12966/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.095 | DEBUG    | __main__:trials:29 - Trial = 12966/30000 | Total reward = 46.72
2022-01-26 14:17:28.099 | DEBUG    | __main__:trials:24 - Trial = 12967/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.099 | DEBUG    | __main__:trials:29 - Trial = 12967/30000 | Total reward = 43.91
2022-01-26 14:17:28.104 | DEBUG    | __main__:trials:26 - Trial = 12968/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:28.104 | DEBUG    | __main__:trials:29 - Trial = 12968/30000 | Total reward = 25.56
2022-01-26 14:17:28.109 | DEBUG    | __main__:trials:24 - Trial = 12969/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.110 | DEBUG    | __main__:trials:29 - Trial = 12969/30000 | Total reward = 47.79
2022-01-26 14:17:28.114 | DEBUG    | __main__:trials:24 - Trial = 12970/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.115 | DEBUG    | __main__:trials:29 - Trial = 12970/30000 | Total reward = 41.32
2022-01-26 14:17:28.119 | DEBUG    | __main__:trials:24 - Trial = 12971/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.120 | DEBUG    | __main__:trials:29 - Trial = 12971/30000 | Total reward = 42.60
2022-01-26 14:17:28.124 | DEBUG    | __main__:trials:24 - Trial = 12972/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.125 | DEBUG    | __main__:trials:29 - Trial = 12972/30000 | Total reward = 54.81
2022-01-26 14:17:28.129 | DEBUG    | __main__:trials:24 - Trial = 12973/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.130 | DEBUG    | __main__:trials:29 - Trial = 12973/30000 | Total reward = 38.57
2022-01-26 14:17:28.133 | DEBUG    | __main__:trials:24 - Trial = 12974/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.134 | DEBUG    | __main__:trials:29 - Trial = 12974/30000 | Total reward = 28.66
2022-01-26 14:17:28.138 | DEBUG    | __main__:trials:24 - Trial = 12975/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.138 | DEBUG    | __main__:trials:29 - Trial = 12975/30000 | Total reward = 31.01
2022-01-26 14:17:28.142 | DEBUG    | __main__:trials:24 - Trial = 12976/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.142 | DEBUG    | __main__:trials:29 - Trial = 12976/30000 | Total reward = 46.01
2022-01-26 14:17:28.146 | DEBUG    | __main__:trials:24 - Trial = 12977/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.148 | DEBUG    | __main__:trials:29 - Trial = 12977/30000 | Total reward = 43.85
2022-01-26 14:17:28.151 | DEBUG    | __main__:trials:24 - Trial = 12978/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.152 | DEBUG    | __main__:trials:29 - Trial = 12978/30000 | Total reward = 33.05
2022-01-26 14:17:28.156 | DEBUG    | __main__:trials:24 - Trial = 12979/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.157 | DEBUG    | __main__:trials:29 - Trial = 12979/30000 | Total reward = 60.91
2022-01-26 14:17:28.160 | DEBUG    | __main__:trials:24 - Trial = 12980/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.161 | DEBUG    | __main__:trials:29 - Trial = 12980/30000 | Total reward = 40.07
2022-01-26 14:17:28.165 | DEBUG    | __main__:trials:24 - Trial = 12981/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.166 | DEBUG    | __main__:trials:29 - Trial = 12981/30000 | Total reward = 42.29
2022-01-26 14:17:28.169 | DEBUG    | __main__:trials:24 - Trial = 12982/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.170 | DEBUG    | __main__:trials:29 - Trial = 12982/30000 | Total reward = 38.70
2022-01-26 14:17:28.174 | DEBUG    | __main__:trials:24 - Trial = 12983/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.174 | DEBUG    | __main__:trials:29 - Trial = 12983/30000 | Total reward = 34.13
2022-01-26 14:17:28.178 | DEBUG    | __main__:trials:24 - Trial = 12984/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.179 | DEBUG    | __main__:trials:29 - Trial = 12984/30000 | Total reward = 42.96
2022-01-26 14:17:28.182 | DEBUG    | __main__:trials:24 - Trial = 12985/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.184 | DEBUG    | __main__:trials:29 - Trial = 12985/30000 | Total reward = 41.14
2022-01-26 14:17:28.187 | DEBUG    | __main__:trials:24 - Trial = 12986/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.190 | DEBUG    | __main__:trials:29 - Trial = 12986/30000 | Total reward = 62.37
2022-01-26 14:17:28.194 | DEBUG    | __main__:trials:24 - Trial = 12987/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.195 | DEBUG    | __main__:trials:29 - Trial = 12987/30000 | Total reward = 45.39
2022-01-26 14:17:28.199 | DEBUG    | __main__:trials:24 - Trial = 12988/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.201 | DEBUG    | __main__:trials:29 - Trial = 12988/30000 | Total reward = 53.50
2022-01-26 14:17:28.204 | DEBUG    | __main__:trials:24 - Trial = 12989/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.206 | DEBUG    | __main__:trials:29 - Trial = 12989/30000 | Total reward = 43.22
2022-01-26 14:17:28.209 | DEBUG    | __main__:trials:24 - Trial = 12990/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.210 | DEBUG    | __main__:trials:29 - Trial = 12990/30000 | Total reward = 50.62
2022-01-26 14:17:28.215 | DEBUG    | __main__:trials:24 - Trial = 12991/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.216 | DEBUG    | __main__:trials:29 - Trial = 12991/30000 | Total reward = 50.31
2022-01-26 14:17:28.219 | DEBUG    | __main__:trials:24 - Trial = 12992/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.221 | DEBUG    | __main__:trials:29 - Trial = 12992/30000 | Total reward = 34.79
2022-01-26 14:17:28.224 | DEBUG    | __main__:trials:24 - Trial = 12993/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.226 | DEBUG    | __main__:trials:29 - Trial = 12993/30000 | Total reward = 44.79
2022-01-26 14:17:28.229 | DEBUG    | __main__:trials:24 - Trial = 12994/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.231 | DEBUG    | __main__:trials:29 - Trial = 12994/30000 | Total reward = 39.00
2022-01-26 14:17:28.234 | DEBUG    | __main__:trials:24 - Trial = 12995/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.236 | DEBUG    | __main__:trials:29 - Trial = 12995/30000 | Total reward = 46.52
2022-01-26 14:17:28.239 | DEBUG    | __main__:trials:24 - Trial = 12996/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.240 | DEBUG    | __main__:trials:29 - Trial = 12996/30000 | Total reward = 45.50
2022-01-26 14:17:28.245 | DEBUG    | __main__:trials:24 - Trial = 12997/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.246 | DEBUG    | __main__:trials:29 - Trial = 12997/30000 | Total reward = 51.89
2022-01-26 14:17:28.250 | DEBUG    | __main__:trials:24 - Trial = 12998/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.252 | DEBUG    | __main__:trials:29 - Trial = 12998/30000 | Total reward = 37.46
2022-01-26 14:17:28.255 | DEBUG    | __main__:trials:24 - Trial = 12999/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.257 | DEBUG    | __main__:trials:29 - Trial = 12999/30000 | Total reward = 34.82
2022-01-26 14:17:28.260 | DEBUG    | __main__:trials:24 - Trial = 13000/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.262 | DEBUG    | __main__:trials:29 - Trial = 13000/30000 | Total reward = 47.66
2022-01-26 14:17:28.265 | DEBUG    | __main__:trials:24 - Trial = 13001/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.266 | DEBUG    | __main__:trials:29 - Trial = 13001/30000 | Total reward = 40.87
2022-01-26 14:17:28.269 | DEBUG    | __main__:trials:24 - Trial = 13002/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.270 | DEBUG    | __main__:trials:29 - Trial = 13002/30000 | Total reward = 46.26
2022-01-26 14:17:28.273 | DEBUG    | __main__:trials:24 - Trial = 13003/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.274 | DEBUG    | __main__:trials:29 - Trial = 13003/30000 | Total reward = 40.82
2022-01-26 14:17:28.277 | DEBUG    | __main__:trials:24 - Trial = 13004/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.278 | DEBUG    | __main__:trials:29 - Trial = 13004/30000 | Total reward = 40.45
2022-01-26 14:17:28.281 | DEBUG    | __main__:trials:24 - Trial = 13005/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.283 | DEBUG    | __main__:trials:29 - Trial = 13005/30000 | Total reward = 53.72
2022-01-26 14:17:28.286 | DEBUG    | __main__:trials:24 - Trial = 13006/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.287 | DEBUG    | __main__:trials:29 - Trial = 13006/30000 | Total reward = 43.48
2022-01-26 14:17:28.290 | DEBUG    | __main__:trials:24 - Trial = 13007/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.292 | DEBUG    | __main__:trials:29 - Trial = 13007/30000 | Total reward = 33.78
2022-01-26 14:17:28.296 | DEBUG    | __main__:trials:24 - Trial = 13008/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.297 | DEBUG    | __main__:trials:29 - Trial = 13008/30000 | Total reward = 45.64
2022-01-26 14:17:28.300 | DEBUG    | __main__:trials:24 - Trial = 13009/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.302 | DEBUG    | __main__:trials:29 - Trial = 13009/30000 | Total reward = 44.67
2022-01-26 14:17:28.306 | DEBUG    | __main__:trials:24 - Trial = 13010/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.306 | DEBUG    | __main__:trials:29 - Trial = 13010/30000 | Total reward = 47.77
2022-01-26 14:17:28.311 | DEBUG    | __main__:trials:24 - Trial = 13011/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.312 | DEBUG    | __main__:trials:29 - Trial = 13011/30000 | Total reward = 34.38
2022-01-26 14:17:28.316 | DEBUG    | __main__:trials:24 - Trial = 13012/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.317 | DEBUG    | __main__:trials:29 - Trial = 13012/30000 | Total reward = 33.96
2022-01-26 14:17:28.321 | DEBUG    | __main__:trials:24 - Trial = 13013/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.321 | DEBUG    | __main__:trials:29 - Trial = 13013/30000 | Total reward = 31.33
2022-01-26 14:17:28.325 | DEBUG    | __main__:trials:24 - Trial = 13014/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.326 | DEBUG    | __main__:trials:29 - Trial = 13014/30000 | Total reward = 47.87
2022-01-26 14:17:28.330 | DEBUG    | __main__:trials:24 - Trial = 13015/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.331 | DEBUG    | __main__:trials:29 - Trial = 13015/30000 | Total reward = 42.96
2022-01-26 14:17:28.335 | DEBUG    | __main__:trials:24 - Trial = 13016/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.336 | DEBUG    | __main__:trials:29 - Trial = 13016/30000 | Total reward = 55.28
2022-01-26 14:17:28.340 | DEBUG    | __main__:trials:24 - Trial = 13017/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.341 | DEBUG    | __main__:trials:29 - Trial = 13017/30000 | Total reward = 39.07
2022-01-26 14:17:28.345 | DEBUG    | __main__:trials:24 - Trial = 13018/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.346 | DEBUG    | __main__:trials:29 - Trial = 13018/30000 | Total reward = 43.32
2022-01-26 14:17:28.350 | DEBUG    | __main__:trials:24 - Trial = 13019/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.351 | DEBUG    | __main__:trials:29 - Trial = 13019/30000 | Total reward = 44.99
2022-01-26 14:17:28.355 | DEBUG    | __main__:trials:24 - Trial = 13020/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.356 | DEBUG    | __main__:trials:29 - Trial = 13020/30000 | Total reward = 39.35
2022-01-26 14:17:28.360 | DEBUG    | __main__:trials:24 - Trial = 13021/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.361 | DEBUG    | __main__:trials:29 - Trial = 13021/30000 | Total reward = 46.50
2022-01-26 14:17:28.365 | DEBUG    | __main__:trials:24 - Trial = 13022/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.366 | DEBUG    | __main__:trials:29 - Trial = 13022/30000 | Total reward = 47.03
2022-01-26 14:17:28.369 | DEBUG    | __main__:trials:24 - Trial = 13023/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.371 | DEBUG    | __main__:trials:29 - Trial = 13023/30000 | Total reward = 47.55
2022-01-26 14:17:28.373 | DEBUG    | __main__:trials:24 - Trial = 13024/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.374 | DEBUG    | __main__:trials:29 - Trial = 13024/30000 | Total reward = 40.90
2022-01-26 14:17:28.378 | DEBUG    | __main__:trials:24 - Trial = 13025/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.379 | DEBUG    | __main__:trials:29 - Trial = 13025/30000 | Total reward = 47.03
2022-01-26 14:17:28.382 | DEBUG    | __main__:trials:24 - Trial = 13026/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.384 | DEBUG    | __main__:trials:29 - Trial = 13026/30000 | Total reward = 36.15
2022-01-26 14:17:28.387 | DEBUG    | __main__:trials:24 - Trial = 13027/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.389 | DEBUG    | __main__:trials:29 - Trial = 13027/30000 | Total reward = 57.31
2022-01-26 14:17:28.392 | DEBUG    | __main__:trials:24 - Trial = 13028/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.394 | DEBUG    | __main__:trials:29 - Trial = 13028/30000 | Total reward = 37.07
2022-01-26 14:17:28.396 | DEBUG    | __main__:trials:24 - Trial = 13029/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.398 | DEBUG    | __main__:trials:29 - Trial = 13029/30000 | Total reward = 50.69
2022-01-26 14:17:28.401 | DEBUG    | __main__:trials:24 - Trial = 13030/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.402 | DEBUG    | __main__:trials:29 - Trial = 13030/30000 | Total reward = 36.96
2022-01-26 14:17:28.405 | DEBUG    | __main__:trials:24 - Trial = 13031/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.406 | DEBUG    | __main__:trials:29 - Trial = 13031/30000 | Total reward = 61.52
2022-01-26 14:17:28.410 | DEBUG    | __main__:trials:24 - Trial = 13032/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.410 | DEBUG    | __main__:trials:29 - Trial = 13032/30000 | Total reward = 44.66
2022-01-26 14:17:28.414 | DEBUG    | __main__:trials:24 - Trial = 13033/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.416 | DEBUG    | __main__:trials:29 - Trial = 13033/30000 | Total reward = 45.09
2022-01-26 14:17:28.420 | DEBUG    | __main__:trials:24 - Trial = 13034/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.420 | DEBUG    | __main__:trials:29 - Trial = 13034/30000 | Total reward = 45.12
2022-01-26 14:17:28.424 | DEBUG    | __main__:trials:24 - Trial = 13035/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.425 | DEBUG    | __main__:trials:29 - Trial = 13035/30000 | Total reward = 43.73
2022-01-26 14:17:28.429 | DEBUG    | __main__:trials:24 - Trial = 13036/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.430 | DEBUG    | __main__:trials:29 - Trial = 13036/30000 | Total reward = 47.72
2022-01-26 14:17:28.434 | DEBUG    | __main__:trials:24 - Trial = 13037/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.435 | DEBUG    | __main__:trials:29 - Trial = 13037/30000 | Total reward = 37.47
2022-01-26 14:17:28.438 | DEBUG    | __main__:trials:24 - Trial = 13038/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.440 | DEBUG    | __main__:trials:29 - Trial = 13038/30000 | Total reward = 48.81
2022-01-26 14:17:28.443 | DEBUG    | __main__:trials:24 - Trial = 13039/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.444 | DEBUG    | __main__:trials:29 - Trial = 13039/30000 | Total reward = 40.60
2022-01-26 14:17:28.447 | DEBUG    | __main__:trials:24 - Trial = 13040/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.449 | DEBUG    | __main__:trials:29 - Trial = 13040/30000 | Total reward = 47.03
2022-01-26 14:17:28.452 | DEBUG    | __main__:trials:24 - Trial = 13041/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.453 | DEBUG    | __main__:trials:29 - Trial = 13041/30000 | Total reward = 51.79
2022-01-26 14:17:28.456 | DEBUG    | __main__:trials:26 - Trial = 13042/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:28.458 | DEBUG    | __main__:trials:29 - Trial = 13042/30000 | Total reward = 34.38
2022-01-26 14:17:28.461 | DEBUG    | __main__:trials:24 - Trial = 13043/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.461 | DEBUG    | __main__:trials:29 - Trial = 13043/30000 | Total reward = 54.13
2022-01-26 14:17:28.465 | DEBUG    | __main__:trials:24 - Trial = 13044/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.466 | DEBUG    | __main__:trials:29 - Trial = 13044/30000 | Total reward = 40.67
2022-01-26 14:17:28.469 | DEBUG    | __main__:trials:24 - Trial = 13045/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.471 | DEBUG    | __main__:trials:29 - Trial = 13045/30000 | Total reward = 44.10
2022-01-26 14:17:28.474 | DEBUG    | __main__:trials:24 - Trial = 13046/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.475 | DEBUG    | __main__:trials:29 - Trial = 13046/30000 | Total reward = 37.98
2022-01-26 14:17:28.478 | DEBUG    | __main__:trials:24 - Trial = 13047/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.480 | DEBUG    | __main__:trials:29 - Trial = 13047/30000 | Total reward = 34.78
2022-01-26 14:17:28.483 | DEBUG    | __main__:trials:24 - Trial = 13048/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.485 | DEBUG    | __main__:trials:29 - Trial = 13048/30000 | Total reward = 44.34
2022-01-26 14:17:28.488 | DEBUG    | __main__:trials:24 - Trial = 13049/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.489 | DEBUG    | __main__:trials:29 - Trial = 13049/30000 | Total reward = 40.97
2022-01-26 14:17:28.493 | DEBUG    | __main__:trials:24 - Trial = 13050/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.494 | DEBUG    | __main__:trials:29 - Trial = 13050/30000 | Total reward = 45.86
2022-01-26 14:17:28.498 | DEBUG    | __main__:trials:24 - Trial = 13051/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.498 | DEBUG    | __main__:trials:29 - Trial = 13051/30000 | Total reward = 38.09
2022-01-26 14:17:28.502 | DEBUG    | __main__:trials:24 - Trial = 13052/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.504 | DEBUG    | __main__:trials:29 - Trial = 13052/30000 | Total reward = 56.30
2022-01-26 14:17:28.507 | DEBUG    | __main__:trials:26 - Trial = 13053/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:28.509 | DEBUG    | __main__:trials:29 - Trial = 13053/30000 | Total reward = 31.11
2022-01-26 14:17:28.511 | DEBUG    | __main__:trials:24 - Trial = 13054/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.512 | DEBUG    | __main__:trials:29 - Trial = 13054/30000 | Total reward = 40.66
2022-01-26 14:17:28.515 | DEBUG    | __main__:trials:24 - Trial = 13055/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.517 | DEBUG    | __main__:trials:29 - Trial = 13055/30000 | Total reward = 48.63
2022-01-26 14:17:28.520 | DEBUG    | __main__:trials:24 - Trial = 13056/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.522 | DEBUG    | __main__:trials:29 - Trial = 13056/30000 | Total reward = 51.50
2022-01-26 14:17:28.525 | DEBUG    | __main__:trials:24 - Trial = 13057/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.526 | DEBUG    | __main__:trials:29 - Trial = 13057/30000 | Total reward = 54.09
2022-01-26 14:17:28.530 | DEBUG    | __main__:trials:24 - Trial = 13058/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.531 | DEBUG    | __main__:trials:29 - Trial = 13058/30000 | Total reward = 45.71
2022-01-26 14:17:28.535 | DEBUG    | __main__:trials:24 - Trial = 13059/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.535 | DEBUG    | __main__:trials:29 - Trial = 13059/30000 | Total reward = 49.77
2022-01-26 14:17:28.539 | DEBUG    | __main__:trials:24 - Trial = 13060/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.541 | DEBUG    | __main__:trials:29 - Trial = 13060/30000 | Total reward = 42.70
2022-01-26 14:17:28.544 | DEBUG    | __main__:trials:24 - Trial = 13061/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.544 | DEBUG    | __main__:trials:29 - Trial = 13061/30000 | Total reward = 49.20
2022-01-26 14:17:28.548 | DEBUG    | __main__:trials:24 - Trial = 13062/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.549 | DEBUG    | __main__:trials:29 - Trial = 13062/30000 | Total reward = 51.63
2022-01-26 14:17:28.553 | DEBUG    | __main__:trials:24 - Trial = 13063/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.554 | DEBUG    | __main__:trials:29 - Trial = 13063/30000 | Total reward = 41.71
2022-01-26 14:17:28.558 | DEBUG    | __main__:trials:24 - Trial = 13064/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.560 | DEBUG    | __main__:trials:29 - Trial = 13064/30000 | Total reward = 46.37
2022-01-26 14:17:28.562 | DEBUG    | __main__:trials:24 - Trial = 13065/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.563 | DEBUG    | __main__:trials:29 - Trial = 13065/30000 | Total reward = 43.30
2022-01-26 14:17:28.567 | DEBUG    | __main__:trials:24 - Trial = 13066/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.568 | DEBUG    | __main__:trials:29 - Trial = 13066/30000 | Total reward = 48.52
2022-01-26 14:17:28.571 | DEBUG    | __main__:trials:24 - Trial = 13067/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.573 | DEBUG    | __main__:trials:29 - Trial = 13067/30000 | Total reward = 48.88
2022-01-26 14:17:28.576 | DEBUG    | __main__:trials:24 - Trial = 13068/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.578 | DEBUG    | __main__:trials:29 - Trial = 13068/30000 | Total reward = 49.49
2022-01-26 14:17:28.581 | DEBUG    | __main__:trials:24 - Trial = 13069/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.581 | DEBUG    | __main__:trials:29 - Trial = 13069/30000 | Total reward = 41.41
2022-01-26 14:17:28.585 | DEBUG    | __main__:trials:24 - Trial = 13070/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.585 | DEBUG    | __main__:trials:29 - Trial = 13070/30000 | Total reward = 46.89
2022-01-26 14:17:28.589 | DEBUG    | __main__:trials:24 - Trial = 13071/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.590 | DEBUG    | __main__:trials:29 - Trial = 13071/30000 | Total reward = 37.06
2022-01-26 14:17:28.593 | DEBUG    | __main__:trials:24 - Trial = 13072/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.594 | DEBUG    | __main__:trials:29 - Trial = 13072/30000 | Total reward = 38.99
2022-01-26 14:17:28.598 | DEBUG    | __main__:trials:24 - Trial = 13073/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.599 | DEBUG    | __main__:trials:29 - Trial = 13073/30000 | Total reward = 50.59
2022-01-26 14:17:28.602 | DEBUG    | __main__:trials:24 - Trial = 13074/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.604 | DEBUG    | __main__:trials:29 - Trial = 13074/30000 | Total reward = 46.98
2022-01-26 14:17:28.607 | DEBUG    | __main__:trials:24 - Trial = 13075/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.609 | DEBUG    | __main__:trials:29 - Trial = 13075/30000 | Total reward = 32.43
2022-01-26 14:17:28.611 | DEBUG    | __main__:trials:24 - Trial = 13076/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.612 | DEBUG    | __main__:trials:29 - Trial = 13076/30000 | Total reward = 40.41
2022-01-26 14:17:28.616 | DEBUG    | __main__:trials:24 - Trial = 13077/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.617 | DEBUG    | __main__:trials:29 - Trial = 13077/30000 | Total reward = 42.18
2022-01-26 14:17:28.620 | DEBUG    | __main__:trials:26 - Trial = 13078/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:28.621 | DEBUG    | __main__:trials:29 - Trial = 13078/30000 | Total reward = 23.94
2022-01-26 14:17:28.624 | DEBUG    | __main__:trials:24 - Trial = 13079/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.626 | DEBUG    | __main__:trials:29 - Trial = 13079/30000 | Total reward = 52.79
2022-01-26 14:17:28.629 | DEBUG    | __main__:trials:24 - Trial = 13080/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.629 | DEBUG    | __main__:trials:29 - Trial = 13080/30000 | Total reward = 53.90
2022-01-26 14:17:28.633 | DEBUG    | __main__:trials:26 - Trial = 13081/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:28.634 | DEBUG    | __main__:trials:29 - Trial = 13081/30000 | Total reward = 31.08
2022-01-26 14:17:28.637 | DEBUG    | __main__:trials:24 - Trial = 13082/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.638 | DEBUG    | __main__:trials:29 - Trial = 13082/30000 | Total reward = 41.29
2022-01-26 14:17:28.641 | DEBUG    | __main__:trials:24 - Trial = 13083/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.642 | DEBUG    | __main__:trials:29 - Trial = 13083/30000 | Total reward = 37.50
2022-01-26 14:17:28.645 | DEBUG    | __main__:trials:24 - Trial = 13084/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.646 | DEBUG    | __main__:trials:29 - Trial = 13084/30000 | Total reward = 47.97
2022-01-26 14:17:28.650 | DEBUG    | __main__:trials:24 - Trial = 13085/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.652 | DEBUG    | __main__:trials:29 - Trial = 13085/30000 | Total reward = 31.18
2022-01-26 14:17:28.655 | DEBUG    | __main__:trials:24 - Trial = 13086/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.655 | DEBUG    | __main__:trials:29 - Trial = 13086/30000 | Total reward = 42.21
2022-01-26 14:17:28.659 | DEBUG    | __main__:trials:24 - Trial = 13087/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.660 | DEBUG    | __main__:trials:29 - Trial = 13087/30000 | Total reward = 47.36
2022-01-26 14:17:28.663 | DEBUG    | __main__:trials:24 - Trial = 13088/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.664 | DEBUG    | __main__:trials:29 - Trial = 13088/30000 | Total reward = 48.81
2022-01-26 14:17:28.668 | DEBUG    | __main__:trials:24 - Trial = 13089/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.669 | DEBUG    | __main__:trials:29 - Trial = 13089/30000 | Total reward = 45.76
2022-01-26 14:17:28.672 | DEBUG    | __main__:trials:24 - Trial = 13090/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.673 | DEBUG    | __main__:trials:29 - Trial = 13090/30000 | Total reward = 47.33
2022-01-26 14:17:28.677 | DEBUG    | __main__:trials:24 - Trial = 13091/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.677 | DEBUG    | __main__:trials:29 - Trial = 13091/30000 | Total reward = 61.03
2022-01-26 14:17:28.681 | DEBUG    | __main__:trials:24 - Trial = 13092/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.682 | DEBUG    | __main__:trials:29 - Trial = 13092/30000 | Total reward = 44.72
2022-01-26 14:17:28.685 | DEBUG    | __main__:trials:24 - Trial = 13093/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.686 | DEBUG    | __main__:trials:29 - Trial = 13093/30000 | Total reward = 47.21
2022-01-26 14:17:28.689 | DEBUG    | __main__:trials:24 - Trial = 13094/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.691 | DEBUG    | __main__:trials:29 - Trial = 13094/30000 | Total reward = 56.66
2022-01-26 14:17:28.694 | DEBUG    | __main__:trials:24 - Trial = 13095/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.696 | DEBUG    | __main__:trials:29 - Trial = 13095/30000 | Total reward = 47.45
2022-01-26 14:17:28.699 | DEBUG    | __main__:trials:24 - Trial = 13096/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.701 | DEBUG    | __main__:trials:29 - Trial = 13096/30000 | Total reward = 48.93
2022-01-26 14:17:28.704 | DEBUG    | __main__:trials:24 - Trial = 13097/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.706 | DEBUG    | __main__:trials:29 - Trial = 13097/30000 | Total reward = 47.62
2022-01-26 14:17:28.710 | DEBUG    | __main__:trials:24 - Trial = 13098/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.711 | DEBUG    | __main__:trials:29 - Trial = 13098/30000 | Total reward = 49.11
2022-01-26 14:17:28.715 | DEBUG    | __main__:trials:24 - Trial = 13099/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.717 | DEBUG    | __main__:trials:29 - Trial = 13099/30000 | Total reward = 44.57
2022-01-26 14:17:28.720 | DEBUG    | __main__:trials:24 - Trial = 13100/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.721 | DEBUG    | __main__:trials:29 - Trial = 13100/30000 | Total reward = 39.05
2022-01-26 14:17:28.725 | DEBUG    | __main__:trials:24 - Trial = 13101/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.726 | DEBUG    | __main__:trials:29 - Trial = 13101/30000 | Total reward = 67.33
2022-01-26 14:17:28.730 | DEBUG    | __main__:trials:24 - Trial = 13102/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.732 | DEBUG    | __main__:trials:29 - Trial = 13102/30000 | Total reward = 58.08
2022-01-26 14:17:28.735 | DEBUG    | __main__:trials:24 - Trial = 13103/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.736 | DEBUG    | __main__:trials:29 - Trial = 13103/30000 | Total reward = 47.03
2022-01-26 14:17:28.740 | DEBUG    | __main__:trials:24 - Trial = 13104/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.742 | DEBUG    | __main__:trials:29 - Trial = 13104/30000 | Total reward = 65.32
2022-01-26 14:17:28.745 | DEBUG    | __main__:trials:24 - Trial = 13105/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.747 | DEBUG    | __main__:trials:29 - Trial = 13105/30000 | Total reward = 48.40
2022-01-26 14:17:28.751 | DEBUG    | __main__:trials:24 - Trial = 13106/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.752 | DEBUG    | __main__:trials:29 - Trial = 13106/30000 | Total reward = 39.76
2022-01-26 14:17:28.756 | DEBUG    | __main__:trials:24 - Trial = 13107/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.757 | DEBUG    | __main__:trials:29 - Trial = 13107/30000 | Total reward = 46.49
2022-01-26 14:17:28.761 | DEBUG    | __main__:trials:24 - Trial = 13108/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.763 | DEBUG    | __main__:trials:29 - Trial = 13108/30000 | Total reward = 47.03
2022-01-26 14:17:28.766 | DEBUG    | __main__:trials:24 - Trial = 13109/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.768 | DEBUG    | __main__:trials:29 - Trial = 13109/30000 | Total reward = 39.67
2022-01-26 14:17:28.772 | DEBUG    | __main__:trials:24 - Trial = 13110/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.773 | DEBUG    | __main__:trials:29 - Trial = 13110/30000 | Total reward = 47.03
2022-01-26 14:17:28.776 | DEBUG    | __main__:trials:24 - Trial = 13111/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.777 | DEBUG    | __main__:trials:29 - Trial = 13111/30000 | Total reward = 48.82
2022-01-26 14:17:28.780 | DEBUG    | __main__:trials:24 - Trial = 13112/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.782 | DEBUG    | __main__:trials:29 - Trial = 13112/30000 | Total reward = 42.17
2022-01-26 14:17:28.785 | DEBUG    | __main__:trials:24 - Trial = 13113/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.786 | DEBUG    | __main__:trials:29 - Trial = 13113/30000 | Total reward = 45.22
2022-01-26 14:17:28.790 | DEBUG    | __main__:trials:24 - Trial = 13114/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.791 | DEBUG    | __main__:trials:29 - Trial = 13114/30000 | Total reward = 45.66
2022-01-26 14:17:28.794 | DEBUG    | __main__:trials:24 - Trial = 13115/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.796 | DEBUG    | __main__:trials:29 - Trial = 13115/30000 | Total reward = 45.69
2022-01-26 14:17:28.800 | DEBUG    | __main__:trials:24 - Trial = 13116/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.801 | DEBUG    | __main__:trials:29 - Trial = 13116/30000 | Total reward = 47.03
2022-01-26 14:17:28.805 | DEBUG    | __main__:trials:24 - Trial = 13117/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.806 | DEBUG    | __main__:trials:29 - Trial = 13117/30000 | Total reward = 49.52
2022-01-26 14:17:28.810 | DEBUG    | __main__:trials:24 - Trial = 13118/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.811 | DEBUG    | __main__:trials:29 - Trial = 13118/30000 | Total reward = 50.41
2022-01-26 14:17:28.815 | DEBUG    | __main__:trials:24 - Trial = 13119/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.817 | DEBUG    | __main__:trials:29 - Trial = 13119/30000 | Total reward = 40.29
2022-01-26 14:17:28.820 | DEBUG    | __main__:trials:24 - Trial = 13120/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.822 | DEBUG    | __main__:trials:29 - Trial = 13120/30000 | Total reward = 42.45
2022-01-26 14:17:28.825 | DEBUG    | __main__:trials:24 - Trial = 13121/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.827 | DEBUG    | __main__:trials:29 - Trial = 13121/30000 | Total reward = 48.11
2022-01-26 14:17:28.831 | DEBUG    | __main__:trials:24 - Trial = 13122/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.832 | DEBUG    | __main__:trials:29 - Trial = 13122/30000 | Total reward = 34.61
2022-01-26 14:17:28.835 | DEBUG    | __main__:trials:24 - Trial = 13123/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.837 | DEBUG    | __main__:trials:29 - Trial = 13123/30000 | Total reward = 44.03
2022-01-26 14:17:28.841 | DEBUG    | __main__:trials:24 - Trial = 13124/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.842 | DEBUG    | __main__:trials:29 - Trial = 13124/30000 | Total reward = 44.59
2022-01-26 14:17:28.845 | DEBUG    | __main__:trials:24 - Trial = 13125/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.847 | DEBUG    | __main__:trials:29 - Trial = 13125/30000 | Total reward = 51.59
2022-01-26 14:17:28.850 | DEBUG    | __main__:trials:24 - Trial = 13126/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.852 | DEBUG    | __main__:trials:29 - Trial = 13126/30000 | Total reward = 37.62
2022-01-26 14:17:28.856 | DEBUG    | __main__:trials:24 - Trial = 13127/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.856 | DEBUG    | __main__:trials:29 - Trial = 13127/30000 | Total reward = 37.33
2022-01-26 14:17:28.861 | DEBUG    | __main__:trials:24 - Trial = 13128/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.862 | DEBUG    | __main__:trials:29 - Trial = 13128/30000 | Total reward = 47.03
2022-01-26 14:17:28.866 | DEBUG    | __main__:trials:24 - Trial = 13129/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.867 | DEBUG    | __main__:trials:29 - Trial = 13129/30000 | Total reward = 46.08
2022-01-26 14:17:28.871 | DEBUG    | __main__:trials:24 - Trial = 13130/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.873 | DEBUG    | __main__:trials:29 - Trial = 13130/30000 | Total reward = 51.79
2022-01-26 14:17:28.876 | DEBUG    | __main__:trials:24 - Trial = 13131/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.878 | DEBUG    | __main__:trials:29 - Trial = 13131/30000 | Total reward = 41.35
2022-01-26 14:17:28.881 | DEBUG    | __main__:trials:24 - Trial = 13132/30000 | Max number of steps (20) reached
2022-01-26 14:17:28.883 | DEBUG    | __main__:trials:29 - Trial = 13132/30000 | Total reward = 33.87
2022-01-26 14:17:29.118 | DEBUG    | __main__:trials:26 - Trial = 13133/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:29.119 | DEBUG    | __main__:trials:29 - Trial = 13133/30000 | Total reward = 20.88
2022-01-26 14:17:29.123 | DEBUG    | __main__:trials:24 - Trial = 13134/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.125 | DEBUG    | __main__:trials:29 - Trial = 13134/30000 | Total reward = 40.49
2022-01-26 14:17:29.128 | DEBUG    | __main__:trials:24 - Trial = 13135/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.130 | DEBUG    | __main__:trials:29 - Trial = 13135/30000 | Total reward = 42.08
2022-01-26 14:17:29.133 | DEBUG    | __main__:trials:24 - Trial = 13136/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.134 | DEBUG    | __main__:trials:29 - Trial = 13136/30000 | Total reward = 44.07
2022-01-26 14:17:29.137 | DEBUG    | __main__:trials:24 - Trial = 13137/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.138 | DEBUG    | __main__:trials:29 - Trial = 13137/30000 | Total reward = 54.72
2022-01-26 14:17:29.142 | DEBUG    | __main__:trials:24 - Trial = 13138/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.143 | DEBUG    | __main__:trials:29 - Trial = 13138/30000 | Total reward = 47.07
2022-01-26 14:17:29.148 | DEBUG    | __main__:trials:24 - Trial = 13139/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.148 | DEBUG    | __main__:trials:29 - Trial = 13139/30000 | Total reward = 40.44
2022-01-26 14:17:29.152 | DEBUG    | __main__:trials:24 - Trial = 13140/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.153 | DEBUG    | __main__:trials:29 - Trial = 13140/30000 | Total reward = 40.08
2022-01-26 14:17:29.157 | DEBUG    | __main__:trials:24 - Trial = 13141/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.158 | DEBUG    | __main__:trials:29 - Trial = 13141/30000 | Total reward = 49.03
2022-01-26 14:17:29.161 | DEBUG    | __main__:trials:24 - Trial = 13142/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.162 | DEBUG    | __main__:trials:29 - Trial = 13142/30000 | Total reward = 56.23
2022-01-26 14:17:29.165 | DEBUG    | __main__:trials:24 - Trial = 13143/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.167 | DEBUG    | __main__:trials:29 - Trial = 13143/30000 | Total reward = 45.45
2022-01-26 14:17:29.171 | DEBUG    | __main__:trials:24 - Trial = 13144/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.172 | DEBUG    | __main__:trials:29 - Trial = 13144/30000 | Total reward = 51.41
2022-01-26 14:17:29.176 | DEBUG    | __main__:trials:24 - Trial = 13145/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.178 | DEBUG    | __main__:trials:29 - Trial = 13145/30000 | Total reward = 41.99
2022-01-26 14:17:29.181 | DEBUG    | __main__:trials:24 - Trial = 13146/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.182 | DEBUG    | __main__:trials:29 - Trial = 13146/30000 | Total reward = 45.99
2022-01-26 14:17:29.186 | DEBUG    | __main__:trials:24 - Trial = 13147/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.187 | DEBUG    | __main__:trials:29 - Trial = 13147/30000 | Total reward = 42.75
2022-01-26 14:17:29.190 | DEBUG    | __main__:trials:24 - Trial = 13148/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.192 | DEBUG    | __main__:trials:29 - Trial = 13148/30000 | Total reward = 47.45
2022-01-26 14:17:29.196 | DEBUG    | __main__:trials:24 - Trial = 13149/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.197 | DEBUG    | __main__:trials:29 - Trial = 13149/30000 | Total reward = 33.19
2022-01-26 14:17:29.201 | DEBUG    | __main__:trials:24 - Trial = 13150/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.202 | DEBUG    | __main__:trials:29 - Trial = 13150/30000 | Total reward = 48.27
2022-01-26 14:17:29.206 | DEBUG    | __main__:trials:24 - Trial = 13151/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.208 | DEBUG    | __main__:trials:29 - Trial = 13151/30000 | Total reward = 40.77
2022-01-26 14:17:29.211 | DEBUG    | __main__:trials:24 - Trial = 13152/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.212 | DEBUG    | __main__:trials:29 - Trial = 13152/30000 | Total reward = 45.74
2022-01-26 14:17:29.215 | DEBUG    | __main__:trials:24 - Trial = 13153/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.217 | DEBUG    | __main__:trials:29 - Trial = 13153/30000 | Total reward = 40.28
2022-01-26 14:17:29.221 | DEBUG    | __main__:trials:24 - Trial = 13154/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.222 | DEBUG    | __main__:trials:29 - Trial = 13154/30000 | Total reward = 49.89
2022-01-26 14:17:29.226 | DEBUG    | __main__:trials:24 - Trial = 13155/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.227 | DEBUG    | __main__:trials:29 - Trial = 13155/30000 | Total reward = 41.39
2022-01-26 14:17:29.231 | DEBUG    | __main__:trials:24 - Trial = 13156/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.232 | DEBUG    | __main__:trials:29 - Trial = 13156/30000 | Total reward = 41.98
2022-01-26 14:17:29.236 | DEBUG    | __main__:trials:24 - Trial = 13157/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.237 | DEBUG    | __main__:trials:29 - Trial = 13157/30000 | Total reward = 38.09
2022-01-26 14:17:29.240 | DEBUG    | __main__:trials:24 - Trial = 13158/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.242 | DEBUG    | __main__:trials:29 - Trial = 13158/30000 | Total reward = 46.41
2022-01-26 14:17:29.245 | DEBUG    | __main__:trials:24 - Trial = 13159/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.246 | DEBUG    | __main__:trials:29 - Trial = 13159/30000 | Total reward = 34.66
2022-01-26 14:17:29.250 | DEBUG    | __main__:trials:24 - Trial = 13160/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.250 | DEBUG    | __main__:trials:29 - Trial = 13160/30000 | Total reward = 43.19
2022-01-26 14:17:29.254 | DEBUG    | __main__:trials:24 - Trial = 13161/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.255 | DEBUG    | __main__:trials:29 - Trial = 13161/30000 | Total reward = 29.16
2022-01-26 14:17:29.259 | DEBUG    | __main__:trials:24 - Trial = 13162/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.260 | DEBUG    | __main__:trials:29 - Trial = 13162/30000 | Total reward = 46.57
2022-01-26 14:17:29.263 | DEBUG    | __main__:trials:24 - Trial = 13163/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.265 | DEBUG    | __main__:trials:29 - Trial = 13163/30000 | Total reward = 45.33
2022-01-26 14:17:29.268 | DEBUG    | __main__:trials:24 - Trial = 13164/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.270 | DEBUG    | __main__:trials:29 - Trial = 13164/30000 | Total reward = 34.07
2022-01-26 14:17:29.273 | DEBUG    | __main__:trials:24 - Trial = 13165/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.274 | DEBUG    | __main__:trials:29 - Trial = 13165/30000 | Total reward = 41.51
2022-01-26 14:17:29.277 | DEBUG    | __main__:trials:24 - Trial = 13166/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.279 | DEBUG    | __main__:trials:29 - Trial = 13166/30000 | Total reward = 37.89
2022-01-26 14:17:29.282 | DEBUG    | __main__:trials:24 - Trial = 13167/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.283 | DEBUG    | __main__:trials:29 - Trial = 13167/30000 | Total reward = 52.54
2022-01-26 14:17:29.287 | DEBUG    | __main__:trials:24 - Trial = 13168/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.288 | DEBUG    | __main__:trials:29 - Trial = 13168/30000 | Total reward = 43.14
2022-01-26 14:17:29.292 | DEBUG    | __main__:trials:24 - Trial = 13169/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.293 | DEBUG    | __main__:trials:29 - Trial = 13169/30000 | Total reward = 44.37
2022-01-26 14:17:29.297 | DEBUG    | __main__:trials:24 - Trial = 13170/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.299 | DEBUG    | __main__:trials:29 - Trial = 13170/30000 | Total reward = 41.81
2022-01-26 14:17:29.303 | DEBUG    | __main__:trials:24 - Trial = 13171/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.303 | DEBUG    | __main__:trials:29 - Trial = 13171/30000 | Total reward = 49.48
2022-01-26 14:17:29.308 | DEBUG    | __main__:trials:24 - Trial = 13172/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.308 | DEBUG    | __main__:trials:29 - Trial = 13172/30000 | Total reward = 40.74
2022-01-26 14:17:29.312 | DEBUG    | __main__:trials:24 - Trial = 13173/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.313 | DEBUG    | __main__:trials:29 - Trial = 13173/30000 | Total reward = 41.92
2022-01-26 14:17:29.317 | DEBUG    | __main__:trials:24 - Trial = 13174/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.318 | DEBUG    | __main__:trials:29 - Trial = 13174/30000 | Total reward = 38.41
2022-01-26 14:17:29.322 | DEBUG    | __main__:trials:24 - Trial = 13175/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.324 | DEBUG    | __main__:trials:29 - Trial = 13175/30000 | Total reward = 41.06
2022-01-26 14:17:29.327 | DEBUG    | __main__:trials:24 - Trial = 13176/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.328 | DEBUG    | __main__:trials:29 - Trial = 13176/30000 | Total reward = 47.21
2022-01-26 14:17:29.332 | DEBUG    | __main__:trials:24 - Trial = 13177/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.333 | DEBUG    | __main__:trials:29 - Trial = 13177/30000 | Total reward = 46.83
2022-01-26 14:17:29.337 | DEBUG    | __main__:trials:24 - Trial = 13178/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.338 | DEBUG    | __main__:trials:29 - Trial = 13178/30000 | Total reward = 48.76
2022-01-26 14:17:29.341 | DEBUG    | __main__:trials:24 - Trial = 13179/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.342 | DEBUG    | __main__:trials:29 - Trial = 13179/30000 | Total reward = 42.28
2022-01-26 14:17:29.345 | DEBUG    | __main__:trials:24 - Trial = 13180/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.346 | DEBUG    | __main__:trials:29 - Trial = 13180/30000 | Total reward = 49.11
2022-01-26 14:17:29.349 | DEBUG    | __main__:trials:24 - Trial = 13181/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.350 | DEBUG    | __main__:trials:29 - Trial = 13181/30000 | Total reward = 42.53
2022-01-26 14:17:29.353 | DEBUG    | __main__:trials:24 - Trial = 13182/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.355 | DEBUG    | __main__:trials:29 - Trial = 13182/30000 | Total reward = 43.42
2022-01-26 14:17:29.358 | DEBUG    | __main__:trials:24 - Trial = 13183/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.360 | DEBUG    | __main__:trials:29 - Trial = 13183/30000 | Total reward = 42.70
2022-01-26 14:17:29.363 | DEBUG    | __main__:trials:24 - Trial = 13184/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.364 | DEBUG    | __main__:trials:29 - Trial = 13184/30000 | Total reward = 40.47
2022-01-26 14:17:29.367 | DEBUG    | __main__:trials:24 - Trial = 13185/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.368 | DEBUG    | __main__:trials:29 - Trial = 13185/30000 | Total reward = 31.09
2022-01-26 14:17:29.371 | DEBUG    | __main__:trials:24 - Trial = 13186/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.373 | DEBUG    | __main__:trials:29 - Trial = 13186/30000 | Total reward = 45.87
2022-01-26 14:17:29.376 | DEBUG    | __main__:trials:24 - Trial = 13187/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.376 | DEBUG    | __main__:trials:29 - Trial = 13187/30000 | Total reward = 40.31
2022-01-26 14:17:29.380 | DEBUG    | __main__:trials:24 - Trial = 13188/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.381 | DEBUG    | __main__:trials:29 - Trial = 13188/30000 | Total reward = 48.05
2022-01-26 14:17:29.384 | DEBUG    | __main__:trials:24 - Trial = 13189/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.386 | DEBUG    | __main__:trials:29 - Trial = 13189/30000 | Total reward = 43.80
2022-01-26 14:17:29.389 | DEBUG    | __main__:trials:24 - Trial = 13190/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.390 | DEBUG    | __main__:trials:29 - Trial = 13190/30000 | Total reward = 53.85
2022-01-26 14:17:29.394 | DEBUG    | __main__:trials:24 - Trial = 13191/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.394 | DEBUG    | __main__:trials:29 - Trial = 13191/30000 | Total reward = 45.73
2022-01-26 14:17:29.398 | DEBUG    | __main__:trials:24 - Trial = 13192/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.399 | DEBUG    | __main__:trials:29 - Trial = 13192/30000 | Total reward = 35.43
2022-01-26 14:17:29.403 | DEBUG    | __main__:trials:24 - Trial = 13193/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.404 | DEBUG    | __main__:trials:29 - Trial = 13193/30000 | Total reward = 42.08
2022-01-26 14:17:29.408 | DEBUG    | __main__:trials:24 - Trial = 13194/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.409 | DEBUG    | __main__:trials:29 - Trial = 13194/30000 | Total reward = 31.94
2022-01-26 14:17:29.412 | DEBUG    | __main__:trials:24 - Trial = 13195/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.413 | DEBUG    | __main__:trials:29 - Trial = 13195/30000 | Total reward = 42.58
2022-01-26 14:17:29.416 | DEBUG    | __main__:trials:24 - Trial = 13196/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.417 | DEBUG    | __main__:trials:29 - Trial = 13196/30000 | Total reward = 49.30
2022-01-26 14:17:29.420 | DEBUG    | __main__:trials:24 - Trial = 13197/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.421 | DEBUG    | __main__:trials:29 - Trial = 13197/30000 | Total reward = 41.54
2022-01-26 14:17:29.424 | DEBUG    | __main__:trials:24 - Trial = 13198/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.426 | DEBUG    | __main__:trials:29 - Trial = 13198/30000 | Total reward = 44.14
2022-01-26 14:17:29.429 | DEBUG    | __main__:trials:24 - Trial = 13199/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.431 | DEBUG    | __main__:trials:29 - Trial = 13199/30000 | Total reward = 20.74
2022-01-26 14:17:29.434 | DEBUG    | __main__:trials:24 - Trial = 13200/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.434 | DEBUG    | __main__:trials:29 - Trial = 13200/30000 | Total reward = 41.06
2022-01-26 14:17:29.438 | DEBUG    | __main__:trials:24 - Trial = 13201/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.439 | DEBUG    | __main__:trials:29 - Trial = 13201/30000 | Total reward = 37.53
2022-01-26 14:17:29.442 | DEBUG    | __main__:trials:24 - Trial = 13202/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.443 | DEBUG    | __main__:trials:29 - Trial = 13202/30000 | Total reward = 37.28
2022-01-26 14:17:29.446 | DEBUG    | __main__:trials:24 - Trial = 13203/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.448 | DEBUG    | __main__:trials:29 - Trial = 13203/30000 | Total reward = 43.39
2022-01-26 14:17:29.451 | DEBUG    | __main__:trials:24 - Trial = 13204/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.452 | DEBUG    | __main__:trials:29 - Trial = 13204/30000 | Total reward = 46.22
2022-01-26 14:17:29.455 | DEBUG    | __main__:trials:24 - Trial = 13205/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.457 | DEBUG    | __main__:trials:29 - Trial = 13205/30000 | Total reward = 41.23
2022-01-26 14:17:29.460 | DEBUG    | __main__:trials:24 - Trial = 13206/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.462 | DEBUG    | __main__:trials:29 - Trial = 13206/30000 | Total reward = 41.20
2022-01-26 14:17:29.465 | DEBUG    | __main__:trials:24 - Trial = 13207/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.466 | DEBUG    | __main__:trials:29 - Trial = 13207/30000 | Total reward = 34.81
2022-01-26 14:17:29.469 | DEBUG    | __main__:trials:24 - Trial = 13208/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.470 | DEBUG    | __main__:trials:29 - Trial = 13208/30000 | Total reward = 44.11
2022-01-26 14:17:29.473 | DEBUG    | __main__:trials:24 - Trial = 13209/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.474 | DEBUG    | __main__:trials:29 - Trial = 13209/30000 | Total reward = 30.92
2022-01-26 14:17:29.477 | DEBUG    | __main__:trials:24 - Trial = 13210/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.478 | DEBUG    | __main__:trials:29 - Trial = 13210/30000 | Total reward = 42.25
2022-01-26 14:17:29.481 | DEBUG    | __main__:trials:24 - Trial = 13211/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.484 | DEBUG    | __main__:trials:29 - Trial = 13211/30000 | Total reward = 39.59
2022-01-26 14:17:29.487 | DEBUG    | __main__:trials:24 - Trial = 13212/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.488 | DEBUG    | __main__:trials:29 - Trial = 13212/30000 | Total reward = 40.62
2022-01-26 14:17:29.492 | DEBUG    | __main__:trials:24 - Trial = 13213/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.492 | DEBUG    | __main__:trials:29 - Trial = 13213/30000 | Total reward = 41.06
2022-01-26 14:17:29.496 | DEBUG    | __main__:trials:24 - Trial = 13214/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.497 | DEBUG    | __main__:trials:29 - Trial = 13214/30000 | Total reward = 37.40
2022-01-26 14:17:29.500 | DEBUG    | __main__:trials:24 - Trial = 13215/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.502 | DEBUG    | __main__:trials:29 - Trial = 13215/30000 | Total reward = 48.93
2022-01-26 14:17:29.505 | DEBUG    | __main__:trials:24 - Trial = 13216/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.506 | DEBUG    | __main__:trials:29 - Trial = 13216/30000 | Total reward = 49.34
2022-01-26 14:17:29.509 | DEBUG    | __main__:trials:24 - Trial = 13217/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.511 | DEBUG    | __main__:trials:29 - Trial = 13217/30000 | Total reward = 41.06
2022-01-26 14:17:29.514 | DEBUG    | __main__:trials:24 - Trial = 13218/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.516 | DEBUG    | __main__:trials:29 - Trial = 13218/30000 | Total reward = 46.63
2022-01-26 14:17:29.518 | DEBUG    | __main__:trials:24 - Trial = 13219/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.519 | DEBUG    | __main__:trials:29 - Trial = 13219/30000 | Total reward = 50.29
2022-01-26 14:17:29.523 | DEBUG    | __main__:trials:24 - Trial = 13220/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.523 | DEBUG    | __main__:trials:29 - Trial = 13220/30000 | Total reward = 41.10
2022-01-26 14:17:29.527 | DEBUG    | __main__:trials:24 - Trial = 13221/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.528 | DEBUG    | __main__:trials:29 - Trial = 13221/30000 | Total reward = 41.98
2022-01-26 14:17:29.531 | DEBUG    | __main__:trials:24 - Trial = 13222/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.533 | DEBUG    | __main__:trials:29 - Trial = 13222/30000 | Total reward = 40.01
2022-01-26 14:17:29.536 | DEBUG    | __main__:trials:24 - Trial = 13223/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.537 | DEBUG    | __main__:trials:29 - Trial = 13223/30000 | Total reward = 47.05
2022-01-26 14:17:29.541 | DEBUG    | __main__:trials:24 - Trial = 13224/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.542 | DEBUG    | __main__:trials:29 - Trial = 13224/30000 | Total reward = 40.21
2022-01-26 14:17:29.545 | DEBUG    | __main__:trials:24 - Trial = 13225/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.547 | DEBUG    | __main__:trials:29 - Trial = 13225/30000 | Total reward = 52.69
2022-01-26 14:17:29.550 | DEBUG    | __main__:trials:24 - Trial = 13226/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.551 | DEBUG    | __main__:trials:29 - Trial = 13226/30000 | Total reward = 44.68
2022-01-26 14:17:29.554 | DEBUG    | __main__:trials:24 - Trial = 13227/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.554 | DEBUG    | __main__:trials:29 - Trial = 13227/30000 | Total reward = 46.29
2022-01-26 14:17:29.558 | DEBUG    | __main__:trials:24 - Trial = 13228/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.559 | DEBUG    | __main__:trials:29 - Trial = 13228/30000 | Total reward = 45.51
2022-01-26 14:17:29.562 | DEBUG    | __main__:trials:24 - Trial = 13229/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.564 | DEBUG    | __main__:trials:29 - Trial = 13229/30000 | Total reward = 45.57
2022-01-26 14:17:29.567 | DEBUG    | __main__:trials:24 - Trial = 13230/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.567 | DEBUG    | __main__:trials:29 - Trial = 13230/30000 | Total reward = 39.02
2022-01-26 14:17:29.571 | DEBUG    | __main__:trials:24 - Trial = 13231/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.572 | DEBUG    | __main__:trials:29 - Trial = 13231/30000 | Total reward = 42.68
2022-01-26 14:17:29.575 | DEBUG    | __main__:trials:24 - Trial = 13232/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.577 | DEBUG    | __main__:trials:29 - Trial = 13232/30000 | Total reward = 47.46
2022-01-26 14:17:29.580 | DEBUG    | __main__:trials:24 - Trial = 13233/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.581 | DEBUG    | __main__:trials:29 - Trial = 13233/30000 | Total reward = 52.65
2022-01-26 14:17:29.584 | DEBUG    | __main__:trials:24 - Trial = 13234/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.585 | DEBUG    | __main__:trials:29 - Trial = 13234/30000 | Total reward = 41.25
2022-01-26 14:17:29.588 | DEBUG    | __main__:trials:24 - Trial = 13235/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.590 | DEBUG    | __main__:trials:29 - Trial = 13235/30000 | Total reward = 45.40
2022-01-26 14:17:29.593 | DEBUG    | __main__:trials:24 - Trial = 13236/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.594 | DEBUG    | __main__:trials:29 - Trial = 13236/30000 | Total reward = 36.55
2022-01-26 14:17:29.597 | DEBUG    | __main__:trials:24 - Trial = 13237/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.599 | DEBUG    | __main__:trials:29 - Trial = 13237/30000 | Total reward = 43.92
2022-01-26 14:17:29.603 | DEBUG    | __main__:trials:24 - Trial = 13238/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.604 | DEBUG    | __main__:trials:29 - Trial = 13238/30000 | Total reward = 37.43
2022-01-26 14:17:29.608 | DEBUG    | __main__:trials:24 - Trial = 13239/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.609 | DEBUG    | __main__:trials:29 - Trial = 13239/30000 | Total reward = 57.22
2022-01-26 14:17:29.612 | DEBUG    | __main__:trials:24 - Trial = 13240/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.614 | DEBUG    | __main__:trials:29 - Trial = 13240/30000 | Total reward = 44.36
2022-01-26 14:17:29.617 | DEBUG    | __main__:trials:24 - Trial = 13241/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.617 | DEBUG    | __main__:trials:29 - Trial = 13241/30000 | Total reward = 39.44
2022-01-26 14:17:29.621 | DEBUG    | __main__:trials:24 - Trial = 13242/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.622 | DEBUG    | __main__:trials:29 - Trial = 13242/30000 | Total reward = 45.80
2022-01-26 14:17:29.626 | DEBUG    | __main__:trials:24 - Trial = 13243/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.626 | DEBUG    | __main__:trials:29 - Trial = 13243/30000 | Total reward = 37.51
2022-01-26 14:17:29.630 | DEBUG    | __main__:trials:24 - Trial = 13244/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.630 | DEBUG    | __main__:trials:29 - Trial = 13244/30000 | Total reward = 42.39
2022-01-26 14:17:29.634 | DEBUG    | __main__:trials:24 - Trial = 13245/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.635 | DEBUG    | __main__:trials:29 - Trial = 13245/30000 | Total reward = 42.71
2022-01-26 14:17:29.638 | DEBUG    | __main__:trials:24 - Trial = 13246/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.640 | DEBUG    | __main__:trials:29 - Trial = 13246/30000 | Total reward = 56.43
2022-01-26 14:17:29.644 | DEBUG    | __main__:trials:24 - Trial = 13247/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.644 | DEBUG    | __main__:trials:29 - Trial = 13247/30000 | Total reward = 37.36
2022-01-26 14:17:29.648 | DEBUG    | __main__:trials:24 - Trial = 13248/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.649 | DEBUG    | __main__:trials:29 - Trial = 13248/30000 | Total reward = 47.20
2022-01-26 14:17:29.653 | DEBUG    | __main__:trials:24 - Trial = 13249/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.653 | DEBUG    | __main__:trials:29 - Trial = 13249/30000 | Total reward = 47.46
2022-01-26 14:17:29.657 | DEBUG    | __main__:trials:24 - Trial = 13250/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.658 | DEBUG    | __main__:trials:29 - Trial = 13250/30000 | Total reward = 46.91
2022-01-26 14:17:29.662 | DEBUG    | __main__:trials:24 - Trial = 13251/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.663 | DEBUG    | __main__:trials:29 - Trial = 13251/30000 | Total reward = 47.05
2022-01-26 14:17:29.666 | DEBUG    | __main__:trials:24 - Trial = 13252/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.668 | DEBUG    | __main__:trials:29 - Trial = 13252/30000 | Total reward = 47.88
2022-01-26 14:17:29.670 | DEBUG    | __main__:trials:24 - Trial = 13253/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.672 | DEBUG    | __main__:trials:29 - Trial = 13253/30000 | Total reward = 48.21
2022-01-26 14:17:29.675 | DEBUG    | __main__:trials:24 - Trial = 13254/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.676 | DEBUG    | __main__:trials:29 - Trial = 13254/30000 | Total reward = 43.22
2022-01-26 14:17:29.680 | DEBUG    | __main__:trials:24 - Trial = 13255/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.681 | DEBUG    | __main__:trials:29 - Trial = 13255/30000 | Total reward = 56.90
2022-01-26 14:17:29.685 | DEBUG    | __main__:trials:24 - Trial = 13256/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.687 | DEBUG    | __main__:trials:29 - Trial = 13256/30000 | Total reward = 46.71
2022-01-26 14:17:29.690 | DEBUG    | __main__:trials:24 - Trial = 13257/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.691 | DEBUG    | __main__:trials:29 - Trial = 13257/30000 | Total reward = 47.20
2022-01-26 14:17:29.695 | DEBUG    | __main__:trials:24 - Trial = 13258/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.696 | DEBUG    | __main__:trials:29 - Trial = 13258/30000 | Total reward = 48.94
2022-01-26 14:17:29.699 | DEBUG    | __main__:trials:24 - Trial = 13259/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.700 | DEBUG    | __main__:trials:29 - Trial = 13259/30000 | Total reward = 53.39
2022-01-26 14:17:29.703 | DEBUG    | __main__:trials:24 - Trial = 13260/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.705 | DEBUG    | __main__:trials:29 - Trial = 13260/30000 | Total reward = 43.36
2022-01-26 14:17:29.709 | DEBUG    | __main__:trials:24 - Trial = 13261/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.710 | DEBUG    | __main__:trials:29 - Trial = 13261/30000 | Total reward = 46.61
2022-01-26 14:17:29.714 | DEBUG    | __main__:trials:24 - Trial = 13262/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.716 | DEBUG    | __main__:trials:29 - Trial = 13262/30000 | Total reward = 46.68
2022-01-26 14:17:29.720 | DEBUG    | __main__:trials:24 - Trial = 13263/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.721 | DEBUG    | __main__:trials:29 - Trial = 13263/30000 | Total reward = 44.04
2022-01-26 14:17:29.724 | DEBUG    | __main__:trials:24 - Trial = 13264/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.725 | DEBUG    | __main__:trials:29 - Trial = 13264/30000 | Total reward = 41.47
2022-01-26 14:17:29.729 | DEBUG    | __main__:trials:24 - Trial = 13265/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.731 | DEBUG    | __main__:trials:29 - Trial = 13265/30000 | Total reward = 51.48
2022-01-26 14:17:29.734 | DEBUG    | __main__:trials:24 - Trial = 13266/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.734 | DEBUG    | __main__:trials:29 - Trial = 13266/30000 | Total reward = 46.61
2022-01-26 14:17:29.739 | DEBUG    | __main__:trials:24 - Trial = 13267/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.741 | DEBUG    | __main__:trials:29 - Trial = 13267/30000 | Total reward = 44.54
2022-01-26 14:17:29.745 | DEBUG    | __main__:trials:24 - Trial = 13268/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.747 | DEBUG    | __main__:trials:29 - Trial = 13268/30000 | Total reward = 48.50
2022-01-26 14:17:29.750 | DEBUG    | __main__:trials:24 - Trial = 13269/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.751 | DEBUG    | __main__:trials:29 - Trial = 13269/30000 | Total reward = 48.55
2022-01-26 14:17:29.754 | DEBUG    | __main__:trials:24 - Trial = 13270/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.754 | DEBUG    | __main__:trials:29 - Trial = 13270/30000 | Total reward = 47.46
2022-01-26 14:17:29.758 | DEBUG    | __main__:trials:24 - Trial = 13271/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.759 | DEBUG    | __main__:trials:29 - Trial = 13271/30000 | Total reward = 40.81
2022-01-26 14:17:29.763 | DEBUG    | __main__:trials:24 - Trial = 13272/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.764 | DEBUG    | __main__:trials:29 - Trial = 13272/30000 | Total reward = 44.06
2022-01-26 14:17:29.768 | DEBUG    | __main__:trials:24 - Trial = 13273/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.768 | DEBUG    | __main__:trials:29 - Trial = 13273/30000 | Total reward = 41.14
2022-01-26 14:17:29.773 | DEBUG    | __main__:trials:24 - Trial = 13274/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.774 | DEBUG    | __main__:trials:29 - Trial = 13274/30000 | Total reward = 47.71
2022-01-26 14:17:29.777 | DEBUG    | __main__:trials:24 - Trial = 13275/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.779 | DEBUG    | __main__:trials:29 - Trial = 13275/30000 | Total reward = 44.62
2022-01-26 14:17:29.783 | DEBUG    | __main__:trials:24 - Trial = 13276/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.785 | DEBUG    | __main__:trials:29 - Trial = 13276/30000 | Total reward = 47.05
2022-01-26 14:17:29.788 | DEBUG    | __main__:trials:24 - Trial = 13277/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.791 | DEBUG    | __main__:trials:29 - Trial = 13277/30000 | Total reward = 33.69
2022-01-26 14:17:29.795 | DEBUG    | __main__:trials:24 - Trial = 13278/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.797 | DEBUG    | __main__:trials:29 - Trial = 13278/30000 | Total reward = 40.70
2022-01-26 14:17:29.800 | DEBUG    | __main__:trials:24 - Trial = 13279/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.802 | DEBUG    | __main__:trials:29 - Trial = 13279/30000 | Total reward = 35.70
2022-01-26 14:17:29.805 | DEBUG    | __main__:trials:24 - Trial = 13280/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.807 | DEBUG    | __main__:trials:29 - Trial = 13280/30000 | Total reward = 42.41
2022-01-26 14:17:29.811 | DEBUG    | __main__:trials:24 - Trial = 13281/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.813 | DEBUG    | __main__:trials:29 - Trial = 13281/30000 | Total reward = 42.99
2022-01-26 14:17:29.816 | DEBUG    | __main__:trials:24 - Trial = 13282/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.818 | DEBUG    | __main__:trials:29 - Trial = 13282/30000 | Total reward = 42.97
2022-01-26 14:17:29.822 | DEBUG    | __main__:trials:24 - Trial = 13283/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.823 | DEBUG    | __main__:trials:29 - Trial = 13283/30000 | Total reward = 39.84
2022-01-26 14:17:29.827 | DEBUG    | __main__:trials:24 - Trial = 13284/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.828 | DEBUG    | __main__:trials:29 - Trial = 13284/30000 | Total reward = 47.05
2022-01-26 14:17:29.832 | DEBUG    | __main__:trials:24 - Trial = 13285/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.833 | DEBUG    | __main__:trials:29 - Trial = 13285/30000 | Total reward = 43.52
2022-01-26 14:17:29.838 | DEBUG    | __main__:trials:24 - Trial = 13286/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.839 | DEBUG    | __main__:trials:29 - Trial = 13286/30000 | Total reward = 41.80
2022-01-26 14:17:29.843 | DEBUG    | __main__:trials:24 - Trial = 13287/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.845 | DEBUG    | __main__:trials:29 - Trial = 13287/30000 | Total reward = 27.12
2022-01-26 14:17:29.848 | DEBUG    | __main__:trials:24 - Trial = 13288/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.849 | DEBUG    | __main__:trials:29 - Trial = 13288/30000 | Total reward = 44.26
2022-01-26 14:17:29.853 | DEBUG    | __main__:trials:24 - Trial = 13289/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.855 | DEBUG    | __main__:trials:29 - Trial = 13289/30000 | Total reward = 45.86
2022-01-26 14:17:29.857 | DEBUG    | __main__:trials:24 - Trial = 13290/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.859 | DEBUG    | __main__:trials:29 - Trial = 13290/30000 | Total reward = 40.73
2022-01-26 14:17:29.863 | DEBUG    | __main__:trials:24 - Trial = 13291/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.867 | DEBUG    | __main__:trials:29 - Trial = 13291/30000 | Total reward = 40.58
2022-01-26 14:17:29.871 | DEBUG    | __main__:trials:24 - Trial = 13292/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.872 | DEBUG    | __main__:trials:29 - Trial = 13292/30000 | Total reward = 41.00
2022-01-26 14:17:29.876 | DEBUG    | __main__:trials:24 - Trial = 13293/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.878 | DEBUG    | __main__:trials:29 - Trial = 13293/30000 | Total reward = 31.99
2022-01-26 14:17:29.881 | DEBUG    | __main__:trials:24 - Trial = 13294/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.883 | DEBUG    | __main__:trials:29 - Trial = 13294/30000 | Total reward = 21.74
2022-01-26 14:17:29.887 | DEBUG    | __main__:trials:24 - Trial = 13295/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.889 | DEBUG    | __main__:trials:29 - Trial = 13295/30000 | Total reward = 46.02
2022-01-26 14:17:29.892 | DEBUG    | __main__:trials:24 - Trial = 13296/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.894 | DEBUG    | __main__:trials:29 - Trial = 13296/30000 | Total reward = 44.61
2022-01-26 14:17:29.898 | DEBUG    | __main__:trials:24 - Trial = 13297/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.901 | DEBUG    | __main__:trials:29 - Trial = 13297/30000 | Total reward = 38.25
2022-01-26 14:17:29.904 | DEBUG    | __main__:trials:24 - Trial = 13298/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.906 | DEBUG    | __main__:trials:29 - Trial = 13298/30000 | Total reward = 41.54
2022-01-26 14:17:29.909 | DEBUG    | __main__:trials:24 - Trial = 13299/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.911 | DEBUG    | __main__:trials:29 - Trial = 13299/30000 | Total reward = 52.21
2022-01-26 14:17:29.914 | DEBUG    | __main__:trials:24 - Trial = 13300/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.916 | DEBUG    | __main__:trials:29 - Trial = 13300/30000 | Total reward = 43.40
2022-01-26 14:17:29.919 | DEBUG    | __main__:trials:24 - Trial = 13301/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.920 | DEBUG    | __main__:trials:29 - Trial = 13301/30000 | Total reward = 41.91
2022-01-26 14:17:29.924 | DEBUG    | __main__:trials:24 - Trial = 13302/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.925 | DEBUG    | __main__:trials:29 - Trial = 13302/30000 | Total reward = 39.28
2022-01-26 14:17:29.928 | DEBUG    | __main__:trials:26 - Trial = 13303/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:29.930 | DEBUG    | __main__:trials:29 - Trial = 13303/30000 | Total reward = 25.00
2022-01-26 14:17:29.934 | DEBUG    | __main__:trials:24 - Trial = 13304/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.935 | DEBUG    | __main__:trials:29 - Trial = 13304/30000 | Total reward = 43.27
2022-01-26 14:17:29.939 | DEBUG    | __main__:trials:24 - Trial = 13305/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.940 | DEBUG    | __main__:trials:29 - Trial = 13305/30000 | Total reward = 48.35
2022-01-26 14:17:29.944 | DEBUG    | __main__:trials:24 - Trial = 13306/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.945 | DEBUG    | __main__:trials:29 - Trial = 13306/30000 | Total reward = 45.10
2022-01-26 14:17:29.949 | DEBUG    | __main__:trials:24 - Trial = 13307/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.950 | DEBUG    | __main__:trials:29 - Trial = 13307/30000 | Total reward = 48.08
2022-01-26 14:17:29.954 | DEBUG    | __main__:trials:24 - Trial = 13308/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.954 | DEBUG    | __main__:trials:29 - Trial = 13308/30000 | Total reward = 47.41
2022-01-26 14:17:29.959 | DEBUG    | __main__:trials:24 - Trial = 13309/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.960 | DEBUG    | __main__:trials:29 - Trial = 13309/30000 | Total reward = 42.69
2022-01-26 14:17:29.964 | DEBUG    | __main__:trials:24 - Trial = 13310/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.966 | DEBUG    | __main__:trials:29 - Trial = 13310/30000 | Total reward = 35.85
2022-01-26 14:17:29.969 | DEBUG    | __main__:trials:24 - Trial = 13311/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.971 | DEBUG    | __main__:trials:29 - Trial = 13311/30000 | Total reward = 42.27
2022-01-26 14:17:29.974 | DEBUG    | __main__:trials:24 - Trial = 13312/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.976 | DEBUG    | __main__:trials:29 - Trial = 13312/30000 | Total reward = 36.94
2022-01-26 14:17:29.980 | DEBUG    | __main__:trials:24 - Trial = 13313/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.981 | DEBUG    | __main__:trials:29 - Trial = 13313/30000 | Total reward = 40.32
2022-01-26 14:17:29.985 | DEBUG    | __main__:trials:24 - Trial = 13314/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.987 | DEBUG    | __main__:trials:29 - Trial = 13314/30000 | Total reward = 44.35
2022-01-26 14:17:29.990 | DEBUG    | __main__:trials:24 - Trial = 13315/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.992 | DEBUG    | __main__:trials:29 - Trial = 13315/30000 | Total reward = 42.78
2022-01-26 14:17:29.996 | DEBUG    | __main__:trials:24 - Trial = 13316/30000 | Max number of steps (20) reached
2022-01-26 14:17:29.997 | DEBUG    | __main__:trials:29 - Trial = 13316/30000 | Total reward = 55.62
2022-01-26 14:17:30.001 | DEBUG    | __main__:trials:24 - Trial = 13317/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.002 | DEBUG    | __main__:trials:29 - Trial = 13317/30000 | Total reward = 47.05
2022-01-26 14:17:30.006 | DEBUG    | __main__:trials:24 - Trial = 13318/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.007 | DEBUG    | __main__:trials:29 - Trial = 13318/30000 | Total reward = 38.42
2022-01-26 14:17:30.011 | DEBUG    | __main__:trials:24 - Trial = 13319/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.013 | DEBUG    | __main__:trials:29 - Trial = 13319/30000 | Total reward = 45.64
2022-01-26 14:17:30.016 | DEBUG    | __main__:trials:24 - Trial = 13320/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.017 | DEBUG    | __main__:trials:29 - Trial = 13320/30000 | Total reward = 59.80
2022-01-26 14:17:30.021 | DEBUG    | __main__:trials:24 - Trial = 13321/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.023 | DEBUG    | __main__:trials:29 - Trial = 13321/30000 | Total reward = 45.31
2022-01-26 14:17:30.026 | DEBUG    | __main__:trials:24 - Trial = 13322/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.028 | DEBUG    | __main__:trials:29 - Trial = 13322/30000 | Total reward = 40.74
2022-01-26 14:17:30.032 | DEBUG    | __main__:trials:24 - Trial = 13323/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.033 | DEBUG    | __main__:trials:29 - Trial = 13323/30000 | Total reward = 39.74
2022-01-26 14:17:30.037 | DEBUG    | __main__:trials:24 - Trial = 13324/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.038 | DEBUG    | __main__:trials:29 - Trial = 13324/30000 | Total reward = 53.21
2022-01-26 14:17:30.041 | DEBUG    | __main__:trials:24 - Trial = 13325/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.044 | DEBUG    | __main__:trials:29 - Trial = 13325/30000 | Total reward = 42.83
2022-01-26 14:17:30.048 | DEBUG    | __main__:trials:24 - Trial = 13326/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.049 | DEBUG    | __main__:trials:29 - Trial = 13326/30000 | Total reward = 46.02
2022-01-26 14:17:30.052 | DEBUG    | __main__:trials:24 - Trial = 13327/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.054 | DEBUG    | __main__:trials:29 - Trial = 13327/30000 | Total reward = 52.76
2022-01-26 14:17:30.058 | DEBUG    | __main__:trials:24 - Trial = 13328/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.059 | DEBUG    | __main__:trials:29 - Trial = 13328/30000 | Total reward = 37.36
2022-01-26 14:17:30.062 | DEBUG    | __main__:trials:24 - Trial = 13329/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.064 | DEBUG    | __main__:trials:29 - Trial = 13329/30000 | Total reward = 45.37
2022-01-26 14:17:30.069 | DEBUG    | __main__:trials:24 - Trial = 13330/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.071 | DEBUG    | __main__:trials:29 - Trial = 13330/30000 | Total reward = 43.14
2022-01-26 14:17:30.074 | DEBUG    | __main__:trials:24 - Trial = 13331/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.075 | DEBUG    | __main__:trials:29 - Trial = 13331/30000 | Total reward = 45.49
2022-01-26 14:17:30.079 | DEBUG    | __main__:trials:24 - Trial = 13332/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.081 | DEBUG    | __main__:trials:29 - Trial = 13332/30000 | Total reward = 46.46
2022-01-26 14:17:30.084 | DEBUG    | __main__:trials:24 - Trial = 13333/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.086 | DEBUG    | __main__:trials:29 - Trial = 13333/30000 | Total reward = 47.19
2022-01-26 14:17:30.089 | DEBUG    | __main__:trials:24 - Trial = 13334/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.091 | DEBUG    | __main__:trials:29 - Trial = 13334/30000 | Total reward = 52.71
2022-01-26 14:17:30.095 | DEBUG    | __main__:trials:24 - Trial = 13335/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.096 | DEBUG    | __main__:trials:29 - Trial = 13335/30000 | Total reward = 44.63
2022-01-26 14:17:30.100 | DEBUG    | __main__:trials:24 - Trial = 13336/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.101 | DEBUG    | __main__:trials:29 - Trial = 13336/30000 | Total reward = 53.77
2022-01-26 14:17:30.105 | DEBUG    | __main__:trials:24 - Trial = 13337/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.106 | DEBUG    | __main__:trials:29 - Trial = 13337/30000 | Total reward = 42.57
2022-01-26 14:17:30.110 | DEBUG    | __main__:trials:24 - Trial = 13338/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.111 | DEBUG    | __main__:trials:29 - Trial = 13338/30000 | Total reward = 47.20
2022-01-26 14:17:30.115 | DEBUG    | __main__:trials:24 - Trial = 13339/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.117 | DEBUG    | __main__:trials:29 - Trial = 13339/30000 | Total reward = 42.74
2022-01-26 14:17:30.120 | DEBUG    | __main__:trials:24 - Trial = 13340/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.122 | DEBUG    | __main__:trials:29 - Trial = 13340/30000 | Total reward = 43.67
2022-01-26 14:17:30.126 | DEBUG    | __main__:trials:24 - Trial = 13341/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.127 | DEBUG    | __main__:trials:29 - Trial = 13341/30000 | Total reward = 41.71
2022-01-26 14:17:30.131 | DEBUG    | __main__:trials:24 - Trial = 13342/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.132 | DEBUG    | __main__:trials:29 - Trial = 13342/30000 | Total reward = 43.41
2022-01-26 14:17:30.136 | DEBUG    | __main__:trials:24 - Trial = 13343/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.138 | DEBUG    | __main__:trials:29 - Trial = 13343/30000 | Total reward = 42.91
2022-01-26 14:17:30.141 | DEBUG    | __main__:trials:24 - Trial = 13344/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.143 | DEBUG    | __main__:trials:29 - Trial = 13344/30000 | Total reward = 47.92
2022-01-26 14:17:30.147 | DEBUG    | __main__:trials:24 - Trial = 13345/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.148 | DEBUG    | __main__:trials:29 - Trial = 13345/30000 | Total reward = 44.56
2022-01-26 14:17:30.152 | DEBUG    | __main__:trials:24 - Trial = 13346/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.153 | DEBUG    | __main__:trials:29 - Trial = 13346/30000 | Total reward = 43.58
2022-01-26 14:17:30.157 | DEBUG    | __main__:trials:24 - Trial = 13347/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.158 | DEBUG    | __main__:trials:29 - Trial = 13347/30000 | Total reward = 38.02
2022-01-26 14:17:30.162 | DEBUG    | __main__:trials:24 - Trial = 13348/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.163 | DEBUG    | __main__:trials:29 - Trial = 13348/30000 | Total reward = 45.22
2022-01-26 14:17:30.167 | DEBUG    | __main__:trials:24 - Trial = 13349/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.169 | DEBUG    | __main__:trials:29 - Trial = 13349/30000 | Total reward = 42.91
2022-01-26 14:17:30.172 | DEBUG    | __main__:trials:24 - Trial = 13350/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.174 | DEBUG    | __main__:trials:29 - Trial = 13350/30000 | Total reward = 43.63
2022-01-26 14:17:30.178 | DEBUG    | __main__:trials:24 - Trial = 13351/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.179 | DEBUG    | __main__:trials:29 - Trial = 13351/30000 | Total reward = 51.05
2022-01-26 14:17:30.182 | DEBUG    | __main__:trials:24 - Trial = 13352/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.184 | DEBUG    | __main__:trials:29 - Trial = 13352/30000 | Total reward = 45.65
2022-01-26 14:17:30.188 | DEBUG    | __main__:trials:24 - Trial = 13353/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.189 | DEBUG    | __main__:trials:29 - Trial = 13353/30000 | Total reward = 42.57
2022-01-26 14:17:30.193 | DEBUG    | __main__:trials:24 - Trial = 13354/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.194 | DEBUG    | __main__:trials:29 - Trial = 13354/30000 | Total reward = 47.05
2022-01-26 14:17:30.198 | DEBUG    | __main__:trials:24 - Trial = 13355/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.200 | DEBUG    | __main__:trials:29 - Trial = 13355/30000 | Total reward = 54.28
2022-01-26 14:17:30.203 | DEBUG    | __main__:trials:24 - Trial = 13356/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.204 | DEBUG    | __main__:trials:29 - Trial = 13356/30000 | Total reward = 37.03
2022-01-26 14:17:30.208 | DEBUG    | __main__:trials:24 - Trial = 13357/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.209 | DEBUG    | __main__:trials:29 - Trial = 13357/30000 | Total reward = 46.36
2022-01-26 14:17:30.213 | DEBUG    | __main__:trials:24 - Trial = 13358/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.215 | DEBUG    | __main__:trials:29 - Trial = 13358/30000 | Total reward = 43.14
2022-01-26 14:17:30.218 | DEBUG    | __main__:trials:24 - Trial = 13359/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.220 | DEBUG    | __main__:trials:29 - Trial = 13359/30000 | Total reward = 40.80
2022-01-26 14:17:30.223 | DEBUG    | __main__:trials:24 - Trial = 13360/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.225 | DEBUG    | __main__:trials:29 - Trial = 13360/30000 | Total reward = 40.45
2022-01-26 14:17:30.228 | DEBUG    | __main__:trials:24 - Trial = 13361/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.230 | DEBUG    | __main__:trials:29 - Trial = 13361/30000 | Total reward = 39.52
2022-01-26 14:17:30.234 | DEBUG    | __main__:trials:24 - Trial = 13362/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.235 | DEBUG    | __main__:trials:29 - Trial = 13362/30000 | Total reward = 40.92
2022-01-26 14:17:30.239 | DEBUG    | __main__:trials:24 - Trial = 13363/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.240 | DEBUG    | __main__:trials:29 - Trial = 13363/30000 | Total reward = 51.15
2022-01-26 14:17:30.244 | DEBUG    | __main__:trials:24 - Trial = 13364/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.246 | DEBUG    | __main__:trials:29 - Trial = 13364/30000 | Total reward = 42.02
2022-01-26 14:17:30.250 | DEBUG    | __main__:trials:24 - Trial = 13365/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.251 | DEBUG    | __main__:trials:29 - Trial = 13365/30000 | Total reward = 41.17
2022-01-26 14:17:30.255 | DEBUG    | __main__:trials:24 - Trial = 13366/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.257 | DEBUG    | __main__:trials:29 - Trial = 13366/30000 | Total reward = 44.11
2022-01-26 14:17:30.260 | DEBUG    | __main__:trials:24 - Trial = 13367/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.262 | DEBUG    | __main__:trials:29 - Trial = 13367/30000 | Total reward = 41.11
2022-01-26 14:17:30.265 | DEBUG    | __main__:trials:24 - Trial = 13368/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.266 | DEBUG    | __main__:trials:29 - Trial = 13368/30000 | Total reward = 41.23
2022-01-26 14:17:30.269 | DEBUG    | __main__:trials:24 - Trial = 13369/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.270 | DEBUG    | __main__:trials:29 - Trial = 13369/30000 | Total reward = 46.83
2022-01-26 14:17:30.274 | DEBUG    | __main__:trials:24 - Trial = 13370/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.274 | DEBUG    | __main__:trials:29 - Trial = 13370/30000 | Total reward = 39.52
2022-01-26 14:17:30.278 | DEBUG    | __main__:trials:24 - Trial = 13371/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.280 | DEBUG    | __main__:trials:29 - Trial = 13371/30000 | Total reward = 39.43
2022-01-26 14:17:30.283 | DEBUG    | __main__:trials:24 - Trial = 13372/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.285 | DEBUG    | __main__:trials:29 - Trial = 13372/30000 | Total reward = 46.72
2022-01-26 14:17:30.289 | DEBUG    | __main__:trials:24 - Trial = 13373/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.290 | DEBUG    | __main__:trials:29 - Trial = 13373/30000 | Total reward = 43.27
2022-01-26 14:17:30.294 | DEBUG    | __main__:trials:24 - Trial = 13374/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.295 | DEBUG    | __main__:trials:29 - Trial = 13374/30000 | Total reward = 44.74
2022-01-26 14:17:30.299 | DEBUG    | __main__:trials:24 - Trial = 13375/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.299 | DEBUG    | __main__:trials:29 - Trial = 13375/30000 | Total reward = 42.09
2022-01-26 14:17:30.304 | DEBUG    | __main__:trials:24 - Trial = 13376/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.305 | DEBUG    | __main__:trials:29 - Trial = 13376/30000 | Total reward = 49.17
2022-01-26 14:17:30.309 | DEBUG    | __main__:trials:24 - Trial = 13377/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.310 | DEBUG    | __main__:trials:29 - Trial = 13377/30000 | Total reward = 51.93
2022-01-26 14:17:30.314 | DEBUG    | __main__:trials:24 - Trial = 13378/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.315 | DEBUG    | __main__:trials:29 - Trial = 13378/30000 | Total reward = 47.05
2022-01-26 14:17:30.318 | DEBUG    | __main__:trials:24 - Trial = 13379/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.320 | DEBUG    | __main__:trials:29 - Trial = 13379/30000 | Total reward = 49.34
2022-01-26 14:17:30.323 | DEBUG    | __main__:trials:24 - Trial = 13380/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.325 | DEBUG    | __main__:trials:29 - Trial = 13380/30000 | Total reward = 48.17
2022-01-26 14:17:30.328 | DEBUG    | __main__:trials:24 - Trial = 13381/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.330 | DEBUG    | __main__:trials:29 - Trial = 13381/30000 | Total reward = 46.43
2022-01-26 14:17:30.334 | DEBUG    | __main__:trials:24 - Trial = 13382/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.335 | DEBUG    | __main__:trials:29 - Trial = 13382/30000 | Total reward = 49.16
2022-01-26 14:17:30.339 | DEBUG    | __main__:trials:24 - Trial = 13383/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.341 | DEBUG    | __main__:trials:29 - Trial = 13383/30000 | Total reward = 41.10
2022-01-26 14:17:30.344 | DEBUG    | __main__:trials:24 - Trial = 13384/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.346 | DEBUG    | __main__:trials:29 - Trial = 13384/30000 | Total reward = 44.93
2022-01-26 14:17:30.350 | DEBUG    | __main__:trials:24 - Trial = 13385/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.351 | DEBUG    | __main__:trials:29 - Trial = 13385/30000 | Total reward = 35.57
2022-01-26 14:17:30.355 | DEBUG    | __main__:trials:24 - Trial = 13386/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.357 | DEBUG    | __main__:trials:29 - Trial = 13386/30000 | Total reward = 54.84
2022-01-26 14:17:30.360 | DEBUG    | __main__:trials:24 - Trial = 13387/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.361 | DEBUG    | __main__:trials:29 - Trial = 13387/30000 | Total reward = 36.47
2022-01-26 14:17:30.365 | DEBUG    | __main__:trials:24 - Trial = 13388/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.367 | DEBUG    | __main__:trials:29 - Trial = 13388/30000 | Total reward = 39.78
2022-01-26 14:17:30.370 | DEBUG    | __main__:trials:24 - Trial = 13389/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.372 | DEBUG    | __main__:trials:29 - Trial = 13389/30000 | Total reward = 35.50
2022-01-26 14:17:30.376 | DEBUG    | __main__:trials:24 - Trial = 13390/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.378 | DEBUG    | __main__:trials:29 - Trial = 13390/30000 | Total reward = 47.78
2022-01-26 14:17:30.381 | DEBUG    | __main__:trials:24 - Trial = 13391/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.383 | DEBUG    | __main__:trials:29 - Trial = 13391/30000 | Total reward = 43.39
2022-01-26 14:17:30.386 | DEBUG    | __main__:trials:24 - Trial = 13392/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.388 | DEBUG    | __main__:trials:29 - Trial = 13392/30000 | Total reward = 41.33
2022-01-26 14:17:30.392 | DEBUG    | __main__:trials:24 - Trial = 13393/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.393 | DEBUG    | __main__:trials:29 - Trial = 13393/30000 | Total reward = 41.59
2022-01-26 14:17:30.396 | DEBUG    | __main__:trials:24 - Trial = 13394/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.397 | DEBUG    | __main__:trials:29 - Trial = 13394/30000 | Total reward = 45.58
2022-01-26 14:17:30.401 | DEBUG    | __main__:trials:24 - Trial = 13395/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.402 | DEBUG    | __main__:trials:29 - Trial = 13395/30000 | Total reward = 48.38
2022-01-26 14:17:30.405 | DEBUG    | __main__:trials:24 - Trial = 13396/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.407 | DEBUG    | __main__:trials:29 - Trial = 13396/30000 | Total reward = 30.71
2022-01-26 14:17:30.411 | DEBUG    | __main__:trials:24 - Trial = 13397/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.412 | DEBUG    | __main__:trials:29 - Trial = 13397/30000 | Total reward = 46.53
2022-01-26 14:17:30.415 | DEBUG    | __main__:trials:24 - Trial = 13398/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.417 | DEBUG    | __main__:trials:29 - Trial = 13398/30000 | Total reward = 29.77
2022-01-26 14:17:30.422 | DEBUG    | __main__:trials:24 - Trial = 13399/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.424 | DEBUG    | __main__:trials:29 - Trial = 13399/30000 | Total reward = 44.25
2022-01-26 14:17:30.427 | DEBUG    | __main__:trials:24 - Trial = 13400/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.429 | DEBUG    | __main__:trials:29 - Trial = 13400/30000 | Total reward = 42.08
2022-01-26 14:17:30.432 | DEBUG    | __main__:trials:24 - Trial = 13401/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.433 | DEBUG    | __main__:trials:29 - Trial = 13401/30000 | Total reward = 42.67
2022-01-26 14:17:30.436 | DEBUG    | __main__:trials:24 - Trial = 13402/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.438 | DEBUG    | __main__:trials:29 - Trial = 13402/30000 | Total reward = 39.63
2022-01-26 14:17:30.441 | DEBUG    | __main__:trials:24 - Trial = 13403/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.443 | DEBUG    | __main__:trials:29 - Trial = 13403/30000 | Total reward = 40.28
2022-01-26 14:17:30.446 | DEBUG    | __main__:trials:24 - Trial = 13404/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.448 | DEBUG    | __main__:trials:29 - Trial = 13404/30000 | Total reward = 43.96
2022-01-26 14:17:30.451 | DEBUG    | __main__:trials:24 - Trial = 13405/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.453 | DEBUG    | __main__:trials:29 - Trial = 13405/30000 | Total reward = 54.82
2022-01-26 14:17:30.456 | DEBUG    | __main__:trials:24 - Trial = 13406/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.458 | DEBUG    | __main__:trials:29 - Trial = 13406/30000 | Total reward = 40.73
2022-01-26 14:17:30.461 | DEBUG    | __main__:trials:24 - Trial = 13407/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.462 | DEBUG    | __main__:trials:29 - Trial = 13407/30000 | Total reward = 43.88
2022-01-26 14:17:30.466 | DEBUG    | __main__:trials:24 - Trial = 13408/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.468 | DEBUG    | __main__:trials:29 - Trial = 13408/30000 | Total reward = 40.11
2022-01-26 14:17:30.471 | DEBUG    | __main__:trials:24 - Trial = 13409/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.473 | DEBUG    | __main__:trials:29 - Trial = 13409/30000 | Total reward = 44.85
2022-01-26 14:17:30.476 | DEBUG    | __main__:trials:24 - Trial = 13410/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.478 | DEBUG    | __main__:trials:29 - Trial = 13410/30000 | Total reward = 40.96
2022-01-26 14:17:30.482 | DEBUG    | __main__:trials:24 - Trial = 13411/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.484 | DEBUG    | __main__:trials:29 - Trial = 13411/30000 | Total reward = 40.12
2022-01-26 14:17:30.486 | DEBUG    | __main__:trials:24 - Trial = 13412/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.488 | DEBUG    | __main__:trials:29 - Trial = 13412/30000 | Total reward = 40.48
2022-01-26 14:17:30.492 | DEBUG    | __main__:trials:24 - Trial = 13413/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.494 | DEBUG    | __main__:trials:29 - Trial = 13413/30000 | Total reward = 40.63
2022-01-26 14:17:30.497 | DEBUG    | __main__:trials:24 - Trial = 13414/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.499 | DEBUG    | __main__:trials:29 - Trial = 13414/30000 | Total reward = 45.30
2022-01-26 14:17:30.503 | DEBUG    | __main__:trials:24 - Trial = 13415/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.504 | DEBUG    | __main__:trials:29 - Trial = 13415/30000 | Total reward = 44.54
2022-01-26 14:17:30.507 | DEBUG    | __main__:trials:24 - Trial = 13416/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.509 | DEBUG    | __main__:trials:29 - Trial = 13416/30000 | Total reward = 49.91
2022-01-26 14:17:30.513 | DEBUG    | __main__:trials:24 - Trial = 13417/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.514 | DEBUG    | __main__:trials:29 - Trial = 13417/30000 | Total reward = 50.77
2022-01-26 14:17:30.518 | DEBUG    | __main__:trials:24 - Trial = 13418/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.519 | DEBUG    | __main__:trials:29 - Trial = 13418/30000 | Total reward = 41.20
2022-01-26 14:17:30.522 | DEBUG    | __main__:trials:24 - Trial = 13419/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.524 | DEBUG    | __main__:trials:29 - Trial = 13419/30000 | Total reward = 45.07
2022-01-26 14:17:30.527 | DEBUG    | __main__:trials:24 - Trial = 13420/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.529 | DEBUG    | __main__:trials:29 - Trial = 13420/30000 | Total reward = 49.64
2022-01-26 14:17:30.533 | DEBUG    | __main__:trials:24 - Trial = 13421/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.535 | DEBUG    | __main__:trials:29 - Trial = 13421/30000 | Total reward = 53.74
2022-01-26 14:17:30.539 | DEBUG    | __main__:trials:24 - Trial = 13422/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.540 | DEBUG    | __main__:trials:29 - Trial = 13422/30000 | Total reward = 57.47
2022-01-26 14:17:30.544 | DEBUG    | __main__:trials:24 - Trial = 13423/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.545 | DEBUG    | __main__:trials:29 - Trial = 13423/30000 | Total reward = 50.37
2022-01-26 14:17:30.549 | DEBUG    | __main__:trials:24 - Trial = 13424/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.551 | DEBUG    | __main__:trials:29 - Trial = 13424/30000 | Total reward = 55.88
2022-01-26 14:17:30.554 | DEBUG    | __main__:trials:24 - Trial = 13425/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.556 | DEBUG    | __main__:trials:29 - Trial = 13425/30000 | Total reward = 55.79
2022-01-26 14:17:30.559 | DEBUG    | __main__:trials:24 - Trial = 13426/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.561 | DEBUG    | __main__:trials:29 - Trial = 13426/30000 | Total reward = 49.57
2022-01-26 14:17:30.565 | DEBUG    | __main__:trials:24 - Trial = 13427/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.565 | DEBUG    | __main__:trials:29 - Trial = 13427/30000 | Total reward = 55.03
2022-01-26 14:17:30.568 | DEBUG    | __main__:trials:24 - Trial = 13428/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.569 | DEBUG    | __main__:trials:29 - Trial = 13428/30000 | Total reward = 52.28
2022-01-26 14:17:30.573 | DEBUG    | __main__:trials:24 - Trial = 13429/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.575 | DEBUG    | __main__:trials:29 - Trial = 13429/30000 | Total reward = 32.76
2022-01-26 14:17:30.578 | DEBUG    | __main__:trials:24 - Trial = 13430/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.580 | DEBUG    | __main__:trials:29 - Trial = 13430/30000 | Total reward = 37.00
2022-01-26 14:17:30.583 | DEBUG    | __main__:trials:24 - Trial = 13431/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.584 | DEBUG    | __main__:trials:29 - Trial = 13431/30000 | Total reward = 60.22
2022-01-26 14:17:30.588 | DEBUG    | __main__:trials:24 - Trial = 13432/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.590 | DEBUG    | __main__:trials:29 - Trial = 13432/30000 | Total reward = 34.85
2022-01-26 14:17:30.594 | DEBUG    | __main__:trials:24 - Trial = 13433/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.596 | DEBUG    | __main__:trials:29 - Trial = 13433/30000 | Total reward = 41.07
2022-01-26 14:17:30.599 | DEBUG    | __main__:trials:24 - Trial = 13434/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.601 | DEBUG    | __main__:trials:29 - Trial = 13434/30000 | Total reward = 51.80
2022-01-26 14:17:30.605 | DEBUG    | __main__:trials:24 - Trial = 13435/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.605 | DEBUG    | __main__:trials:29 - Trial = 13435/30000 | Total reward = 40.73
2022-01-26 14:17:30.609 | DEBUG    | __main__:trials:24 - Trial = 13436/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.611 | DEBUG    | __main__:trials:29 - Trial = 13436/30000 | Total reward = 42.05
2022-01-26 14:17:30.615 | DEBUG    | __main__:trials:24 - Trial = 13437/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.616 | DEBUG    | __main__:trials:29 - Trial = 13437/30000 | Total reward = 45.75
2022-01-26 14:17:30.620 | DEBUG    | __main__:trials:24 - Trial = 13438/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.621 | DEBUG    | __main__:trials:29 - Trial = 13438/30000 | Total reward = 39.03
2022-01-26 14:17:30.625 | DEBUG    | __main__:trials:24 - Trial = 13439/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.626 | DEBUG    | __main__:trials:29 - Trial = 13439/30000 | Total reward = 33.31
2022-01-26 14:17:30.630 | DEBUG    | __main__:trials:24 - Trial = 13440/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.633 | DEBUG    | __main__:trials:29 - Trial = 13440/30000 | Total reward = 19.46
2022-01-26 14:17:30.635 | DEBUG    | __main__:trials:24 - Trial = 13441/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.637 | DEBUG    | __main__:trials:29 - Trial = 13441/30000 | Total reward = 43.14
2022-01-26 14:17:30.641 | DEBUG    | __main__:trials:24 - Trial = 13442/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.641 | DEBUG    | __main__:trials:29 - Trial = 13442/30000 | Total reward = 41.35
2022-01-26 14:17:30.645 | DEBUG    | __main__:trials:24 - Trial = 13443/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.645 | DEBUG    | __main__:trials:29 - Trial = 13443/30000 | Total reward = 41.67
2022-01-26 14:17:30.649 | DEBUG    | __main__:trials:24 - Trial = 13444/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.650 | DEBUG    | __main__:trials:29 - Trial = 13444/30000 | Total reward = 47.33
2022-01-26 14:17:30.654 | DEBUG    | __main__:trials:24 - Trial = 13445/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.655 | DEBUG    | __main__:trials:29 - Trial = 13445/30000 | Total reward = 40.73
2022-01-26 14:17:30.658 | DEBUG    | __main__:trials:24 - Trial = 13446/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.660 | DEBUG    | __main__:trials:29 - Trial = 13446/30000 | Total reward = 32.53
2022-01-26 14:17:30.664 | DEBUG    | __main__:trials:24 - Trial = 13447/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.665 | DEBUG    | __main__:trials:29 - Trial = 13447/30000 | Total reward = 35.56
2022-01-26 14:17:30.669 | DEBUG    | __main__:trials:24 - Trial = 13448/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.671 | DEBUG    | __main__:trials:29 - Trial = 13448/30000 | Total reward = 43.25
2022-01-26 14:17:30.675 | DEBUG    | __main__:trials:24 - Trial = 13449/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.676 | DEBUG    | __main__:trials:29 - Trial = 13449/30000 | Total reward = 35.42
2022-01-26 14:17:30.680 | DEBUG    | __main__:trials:24 - Trial = 13450/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.682 | DEBUG    | __main__:trials:29 - Trial = 13450/30000 | Total reward = 42.68
2022-01-26 14:17:30.685 | DEBUG    | __main__:trials:24 - Trial = 13451/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.687 | DEBUG    | __main__:trials:29 - Trial = 13451/30000 | Total reward = 37.73
2022-01-26 14:17:30.691 | DEBUG    | __main__:trials:24 - Trial = 13452/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.692 | DEBUG    | __main__:trials:29 - Trial = 13452/30000 | Total reward = 38.90
2022-01-26 14:17:30.696 | DEBUG    | __main__:trials:24 - Trial = 13453/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.698 | DEBUG    | __main__:trials:29 - Trial = 13453/30000 | Total reward = 51.41
2022-01-26 14:17:30.701 | DEBUG    | __main__:trials:26 - Trial = 13454/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:30.703 | DEBUG    | __main__:trials:29 - Trial = 13454/30000 | Total reward = 23.00
2022-01-26 14:17:30.706 | DEBUG    | __main__:trials:24 - Trial = 13455/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.708 | DEBUG    | __main__:trials:29 - Trial = 13455/30000 | Total reward = 41.56
2022-01-26 14:17:30.712 | DEBUG    | __main__:trials:24 - Trial = 13456/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.713 | DEBUG    | __main__:trials:29 - Trial = 13456/30000 | Total reward = 45.70
2022-01-26 14:17:30.717 | DEBUG    | __main__:trials:24 - Trial = 13457/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.718 | DEBUG    | __main__:trials:29 - Trial = 13457/30000 | Total reward = 46.65
2022-01-26 14:17:30.722 | DEBUG    | __main__:trials:24 - Trial = 13458/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.724 | DEBUG    | __main__:trials:29 - Trial = 13458/30000 | Total reward = 48.31
2022-01-26 14:17:30.727 | DEBUG    | __main__:trials:24 - Trial = 13459/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.729 | DEBUG    | __main__:trials:29 - Trial = 13459/30000 | Total reward = 57.82
2022-01-26 14:17:30.732 | DEBUG    | __main__:trials:24 - Trial = 13460/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.734 | DEBUG    | __main__:trials:29 - Trial = 13460/30000 | Total reward = 48.10
2022-01-26 14:17:30.738 | DEBUG    | __main__:trials:24 - Trial = 13461/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.739 | DEBUG    | __main__:trials:29 - Trial = 13461/30000 | Total reward = 53.49
2022-01-26 14:17:30.742 | DEBUG    | __main__:trials:24 - Trial = 13462/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.744 | DEBUG    | __main__:trials:29 - Trial = 13462/30000 | Total reward = 52.56
2022-01-26 14:17:30.748 | DEBUG    | __main__:trials:24 - Trial = 13463/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.750 | DEBUG    | __main__:trials:29 - Trial = 13463/30000 | Total reward = 46.01
2022-01-26 14:17:30.753 | DEBUG    | __main__:trials:24 - Trial = 13464/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.755 | DEBUG    | __main__:trials:29 - Trial = 13464/30000 | Total reward = 45.61
2022-01-26 14:17:30.759 | DEBUG    | __main__:trials:24 - Trial = 13465/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.760 | DEBUG    | __main__:trials:29 - Trial = 13465/30000 | Total reward = 38.45
2022-01-26 14:17:30.763 | DEBUG    | __main__:trials:24 - Trial = 13466/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.765 | DEBUG    | __main__:trials:29 - Trial = 13466/30000 | Total reward = 49.39
2022-01-26 14:17:30.769 | DEBUG    | __main__:trials:24 - Trial = 13467/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.771 | DEBUG    | __main__:trials:29 - Trial = 13467/30000 | Total reward = 47.73
2022-01-26 14:17:30.775 | DEBUG    | __main__:trials:24 - Trial = 13468/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.776 | DEBUG    | __main__:trials:29 - Trial = 13468/30000 | Total reward = 66.01
2022-01-26 14:17:30.780 | DEBUG    | __main__:trials:24 - Trial = 13469/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.782 | DEBUG    | __main__:trials:29 - Trial = 13469/30000 | Total reward = 47.14
2022-01-26 14:17:30.785 | DEBUG    | __main__:trials:24 - Trial = 13470/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.786 | DEBUG    | __main__:trials:29 - Trial = 13470/30000 | Total reward = 45.47
2022-01-26 14:17:30.791 | DEBUG    | __main__:trials:24 - Trial = 13471/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.792 | DEBUG    | __main__:trials:29 - Trial = 13471/30000 | Total reward = 45.52
2022-01-26 14:17:30.796 | DEBUG    | __main__:trials:24 - Trial = 13472/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.798 | DEBUG    | __main__:trials:29 - Trial = 13472/30000 | Total reward = 44.07
2022-01-26 14:17:30.802 | DEBUG    | __main__:trials:24 - Trial = 13473/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.803 | DEBUG    | __main__:trials:29 - Trial = 13473/30000 | Total reward = 51.78
2022-01-26 14:17:30.807 | DEBUG    | __main__:trials:24 - Trial = 13474/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.809 | DEBUG    | __main__:trials:29 - Trial = 13474/30000 | Total reward = 37.93
2022-01-26 14:17:30.811 | DEBUG    | __main__:trials:26 - Trial = 13475/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:30.813 | DEBUG    | __main__:trials:29 - Trial = 13475/30000 | Total reward = 36.09
2022-01-26 14:17:30.817 | DEBUG    | __main__:trials:24 - Trial = 13476/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.819 | DEBUG    | __main__:trials:29 - Trial = 13476/30000 | Total reward = 54.73
2022-01-26 14:17:30.823 | DEBUG    | __main__:trials:24 - Trial = 13477/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.824 | DEBUG    | __main__:trials:29 - Trial = 13477/30000 | Total reward = 54.85
2022-01-26 14:17:30.828 | DEBUG    | __main__:trials:24 - Trial = 13478/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.830 | DEBUG    | __main__:trials:29 - Trial = 13478/30000 | Total reward = 49.96
2022-01-26 14:17:30.834 | DEBUG    | __main__:trials:24 - Trial = 13479/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.836 | DEBUG    | __main__:trials:29 - Trial = 13479/30000 | Total reward = 48.20
2022-01-26 14:17:30.839 | DEBUG    | __main__:trials:24 - Trial = 13480/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.840 | DEBUG    | __main__:trials:29 - Trial = 13480/30000 | Total reward = 50.48
2022-01-26 14:17:30.844 | DEBUG    | __main__:trials:24 - Trial = 13481/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.846 | DEBUG    | __main__:trials:29 - Trial = 13481/30000 | Total reward = 38.22
2022-01-26 14:17:30.849 | DEBUG    | __main__:trials:24 - Trial = 13482/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.850 | DEBUG    | __main__:trials:29 - Trial = 13482/30000 | Total reward = 42.49
2022-01-26 14:17:30.854 | DEBUG    | __main__:trials:24 - Trial = 13483/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.856 | DEBUG    | __main__:trials:29 - Trial = 13483/30000 | Total reward = 47.21
2022-01-26 14:17:30.860 | DEBUG    | __main__:trials:24 - Trial = 13484/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.861 | DEBUG    | __main__:trials:29 - Trial = 13484/30000 | Total reward = 38.01
2022-01-26 14:17:30.865 | DEBUG    | __main__:trials:24 - Trial = 13485/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.867 | DEBUG    | __main__:trials:29 - Trial = 13485/30000 | Total reward = 44.18
2022-01-26 14:17:30.870 | DEBUG    | __main__:trials:24 - Trial = 13486/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.872 | DEBUG    | __main__:trials:29 - Trial = 13486/30000 | Total reward = 32.52
2022-01-26 14:17:30.875 | DEBUG    | __main__:trials:24 - Trial = 13487/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.877 | DEBUG    | __main__:trials:29 - Trial = 13487/30000 | Total reward = 40.19
2022-01-26 14:17:30.880 | DEBUG    | __main__:trials:24 - Trial = 13488/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.882 | DEBUG    | __main__:trials:29 - Trial = 13488/30000 | Total reward = 35.92
2022-01-26 14:17:30.885 | DEBUG    | __main__:trials:24 - Trial = 13489/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.886 | DEBUG    | __main__:trials:29 - Trial = 13489/30000 | Total reward = 39.71
2022-01-26 14:17:30.891 | DEBUG    | __main__:trials:24 - Trial = 13490/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.893 | DEBUG    | __main__:trials:29 - Trial = 13490/30000 | Total reward = 46.11
2022-01-26 14:17:30.896 | DEBUG    | __main__:trials:24 - Trial = 13491/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.897 | DEBUG    | __main__:trials:29 - Trial = 13491/30000 | Total reward = 42.08
2022-01-26 14:17:30.901 | DEBUG    | __main__:trials:24 - Trial = 13492/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.902 | DEBUG    | __main__:trials:29 - Trial = 13492/30000 | Total reward = 42.64
2022-01-26 14:17:30.906 | DEBUG    | __main__:trials:24 - Trial = 13493/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.907 | DEBUG    | __main__:trials:29 - Trial = 13493/30000 | Total reward = 43.81
2022-01-26 14:17:30.911 | DEBUG    | __main__:trials:24 - Trial = 13494/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.913 | DEBUG    | __main__:trials:29 - Trial = 13494/30000 | Total reward = 47.32
2022-01-26 14:17:30.916 | DEBUG    | __main__:trials:24 - Trial = 13495/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.917 | DEBUG    | __main__:trials:29 - Trial = 13495/30000 | Total reward = 37.34
2022-01-26 14:17:30.922 | DEBUG    | __main__:trials:24 - Trial = 13496/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.922 | DEBUG    | __main__:trials:29 - Trial = 13496/30000 | Total reward = 48.06
2022-01-26 14:17:30.926 | DEBUG    | __main__:trials:24 - Trial = 13497/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.927 | DEBUG    | __main__:trials:29 - Trial = 13497/30000 | Total reward = 38.08
2022-01-26 14:17:30.931 | DEBUG    | __main__:trials:24 - Trial = 13498/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.932 | DEBUG    | __main__:trials:29 - Trial = 13498/30000 | Total reward = 48.58
2022-01-26 14:17:30.936 | DEBUG    | __main__:trials:24 - Trial = 13499/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.937 | DEBUG    | __main__:trials:29 - Trial = 13499/30000 | Total reward = 48.17
2022-01-26 14:17:30.941 | DEBUG    | __main__:trials:24 - Trial = 13500/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.943 | DEBUG    | __main__:trials:29 - Trial = 13500/30000 | Total reward = 50.00
2022-01-26 14:17:30.947 | DEBUG    | __main__:trials:24 - Trial = 13501/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.948 | DEBUG    | __main__:trials:29 - Trial = 13501/30000 | Total reward = 41.92
2022-01-26 14:17:30.952 | DEBUG    | __main__:trials:24 - Trial = 13502/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.954 | DEBUG    | __main__:trials:29 - Trial = 13502/30000 | Total reward = 28.40
2022-01-26 14:17:30.957 | DEBUG    | __main__:trials:24 - Trial = 13503/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.959 | DEBUG    | __main__:trials:29 - Trial = 13503/30000 | Total reward = 47.34
2022-01-26 14:17:30.963 | DEBUG    | __main__:trials:24 - Trial = 13504/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.964 | DEBUG    | __main__:trials:29 - Trial = 13504/30000 | Total reward = 43.17
2022-01-26 14:17:30.968 | DEBUG    | __main__:trials:24 - Trial = 13505/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.969 | DEBUG    | __main__:trials:29 - Trial = 13505/30000 | Total reward = 44.96
2022-01-26 14:17:30.973 | DEBUG    | __main__:trials:24 - Trial = 13506/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.973 | DEBUG    | __main__:trials:29 - Trial = 13506/30000 | Total reward = 42.58
2022-01-26 14:17:30.977 | DEBUG    | __main__:trials:24 - Trial = 13507/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.978 | DEBUG    | __main__:trials:29 - Trial = 13507/30000 | Total reward = 45.62
2022-01-26 14:17:30.981 | DEBUG    | __main__:trials:24 - Trial = 13508/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.982 | DEBUG    | __main__:trials:29 - Trial = 13508/30000 | Total reward = 47.93
2022-01-26 14:17:30.986 | DEBUG    | __main__:trials:24 - Trial = 13509/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.988 | DEBUG    | __main__:trials:29 - Trial = 13509/30000 | Total reward = 50.74
2022-01-26 14:17:30.991 | DEBUG    | __main__:trials:24 - Trial = 13510/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.992 | DEBUG    | __main__:trials:29 - Trial = 13510/30000 | Total reward = 42.24
2022-01-26 14:17:30.996 | DEBUG    | __main__:trials:24 - Trial = 13511/30000 | Max number of steps (20) reached
2022-01-26 14:17:30.998 | DEBUG    | __main__:trials:29 - Trial = 13511/30000 | Total reward = 60.35
2022-01-26 14:17:31.002 | DEBUG    | __main__:trials:24 - Trial = 13512/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.002 | DEBUG    | __main__:trials:29 - Trial = 13512/30000 | Total reward = 47.38
2022-01-26 14:17:31.007 | DEBUG    | __main__:trials:24 - Trial = 13513/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.008 | DEBUG    | __main__:trials:29 - Trial = 13513/30000 | Total reward = 53.40
2022-01-26 14:17:31.011 | DEBUG    | __main__:trials:24 - Trial = 13514/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.013 | DEBUG    | __main__:trials:29 - Trial = 13514/30000 | Total reward = 45.03
2022-01-26 14:17:31.016 | DEBUG    | __main__:trials:24 - Trial = 13515/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.018 | DEBUG    | __main__:trials:29 - Trial = 13515/30000 | Total reward = 49.22
2022-01-26 14:17:31.022 | DEBUG    | __main__:trials:24 - Trial = 13516/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.023 | DEBUG    | __main__:trials:29 - Trial = 13516/30000 | Total reward = 46.43
2022-01-26 14:17:31.027 | DEBUG    | __main__:trials:24 - Trial = 13517/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.028 | DEBUG    | __main__:trials:29 - Trial = 13517/30000 | Total reward = 39.29
2022-01-26 14:17:31.032 | DEBUG    | __main__:trials:24 - Trial = 13518/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.034 | DEBUG    | __main__:trials:29 - Trial = 13518/30000 | Total reward = 32.42
2022-01-26 14:17:31.038 | DEBUG    | __main__:trials:24 - Trial = 13519/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.040 | DEBUG    | __main__:trials:29 - Trial = 13519/30000 | Total reward = 45.21
2022-01-26 14:17:31.043 | DEBUG    | __main__:trials:24 - Trial = 13520/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.045 | DEBUG    | __main__:trials:29 - Trial = 13520/30000 | Total reward = 40.16
2022-01-26 14:17:31.049 | DEBUG    | __main__:trials:24 - Trial = 13521/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.050 | DEBUG    | __main__:trials:29 - Trial = 13521/30000 | Total reward = 47.46
2022-01-26 14:17:31.053 | DEBUG    | __main__:trials:24 - Trial = 13522/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.054 | DEBUG    | __main__:trials:29 - Trial = 13522/30000 | Total reward = 44.38
2022-01-26 14:17:31.058 | DEBUG    | __main__:trials:24 - Trial = 13523/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.059 | DEBUG    | __main__:trials:29 - Trial = 13523/30000 | Total reward = 37.40
2022-01-26 14:17:31.062 | DEBUG    | __main__:trials:24 - Trial = 13524/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.064 | DEBUG    | __main__:trials:29 - Trial = 13524/30000 | Total reward = 38.49
2022-01-26 14:17:31.068 | DEBUG    | __main__:trials:24 - Trial = 13525/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.070 | DEBUG    | __main__:trials:29 - Trial = 13525/30000 | Total reward = 44.46
2022-01-26 14:17:31.074 | DEBUG    | __main__:trials:24 - Trial = 13526/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.075 | DEBUG    | __main__:trials:29 - Trial = 13526/30000 | Total reward = 45.34
2022-01-26 14:17:31.079 | DEBUG    | __main__:trials:24 - Trial = 13527/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.081 | DEBUG    | __main__:trials:29 - Trial = 13527/30000 | Total reward = 51.15
2022-01-26 14:17:31.084 | DEBUG    | __main__:trials:24 - Trial = 13528/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.086 | DEBUG    | __main__:trials:29 - Trial = 13528/30000 | Total reward = 50.94
2022-01-26 14:17:31.090 | DEBUG    | __main__:trials:24 - Trial = 13529/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.090 | DEBUG    | __main__:trials:29 - Trial = 13529/30000 | Total reward = 43.05
2022-01-26 14:17:31.095 | DEBUG    | __main__:trials:24 - Trial = 13530/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.096 | DEBUG    | __main__:trials:29 - Trial = 13530/30000 | Total reward = 46.41
2022-01-26 14:17:31.100 | DEBUG    | __main__:trials:24 - Trial = 13531/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.101 | DEBUG    | __main__:trials:29 - Trial = 13531/30000 | Total reward = 54.86
2022-01-26 14:17:31.105 | DEBUG    | __main__:trials:24 - Trial = 13532/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.107 | DEBUG    | __main__:trials:29 - Trial = 13532/30000 | Total reward = 45.25
2022-01-26 14:17:31.111 | DEBUG    | __main__:trials:24 - Trial = 13533/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.112 | DEBUG    | __main__:trials:29 - Trial = 13533/30000 | Total reward = 49.42
2022-01-26 14:17:31.116 | DEBUG    | __main__:trials:24 - Trial = 13534/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.118 | DEBUG    | __main__:trials:29 - Trial = 13534/30000 | Total reward = 44.21
2022-01-26 14:17:31.122 | DEBUG    | __main__:trials:24 - Trial = 13535/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.124 | DEBUG    | __main__:trials:29 - Trial = 13535/30000 | Total reward = 44.83
2022-01-26 14:17:31.127 | DEBUG    | __main__:trials:24 - Trial = 13536/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.129 | DEBUG    | __main__:trials:29 - Trial = 13536/30000 | Total reward = 56.95
2022-01-26 14:17:31.132 | DEBUG    | __main__:trials:24 - Trial = 13537/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.133 | DEBUG    | __main__:trials:29 - Trial = 13537/30000 | Total reward = 46.23
2022-01-26 14:17:31.136 | DEBUG    | __main__:trials:24 - Trial = 13538/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.137 | DEBUG    | __main__:trials:29 - Trial = 13538/30000 | Total reward = 54.56
2022-01-26 14:17:31.142 | DEBUG    | __main__:trials:24 - Trial = 13539/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.142 | DEBUG    | __main__:trials:29 - Trial = 13539/30000 | Total reward = 41.33
2022-01-26 14:17:31.147 | DEBUG    | __main__:trials:24 - Trial = 13540/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.148 | DEBUG    | __main__:trials:29 - Trial = 13540/30000 | Total reward = 27.84
2022-01-26 14:17:31.152 | DEBUG    | __main__:trials:24 - Trial = 13541/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.153 | DEBUG    | __main__:trials:29 - Trial = 13541/30000 | Total reward = 47.36
2022-01-26 14:17:31.157 | DEBUG    | __main__:trials:24 - Trial = 13542/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.159 | DEBUG    | __main__:trials:29 - Trial = 13542/30000 | Total reward = 46.61
2022-01-26 14:17:31.163 | DEBUG    | __main__:trials:24 - Trial = 13543/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.163 | DEBUG    | __main__:trials:29 - Trial = 13543/30000 | Total reward = 49.91
2022-01-26 14:17:31.167 | DEBUG    | __main__:trials:24 - Trial = 13544/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.168 | DEBUG    | __main__:trials:29 - Trial = 13544/30000 | Total reward = 45.86
2022-01-26 14:17:31.172 | DEBUG    | __main__:trials:24 - Trial = 13545/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.173 | DEBUG    | __main__:trials:29 - Trial = 13545/30000 | Total reward = 44.10
2022-01-26 14:17:31.176 | DEBUG    | __main__:trials:24 - Trial = 13546/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.178 | DEBUG    | __main__:trials:29 - Trial = 13546/30000 | Total reward = 48.51
2022-01-26 14:17:31.182 | DEBUG    | __main__:trials:24 - Trial = 13547/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.184 | DEBUG    | __main__:trials:29 - Trial = 13547/30000 | Total reward = 38.99
2022-01-26 14:17:31.187 | DEBUG    | __main__:trials:24 - Trial = 13548/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.187 | DEBUG    | __main__:trials:29 - Trial = 13548/30000 | Total reward = 50.38
2022-01-26 14:17:31.191 | DEBUG    | __main__:trials:24 - Trial = 13549/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.193 | DEBUG    | __main__:trials:29 - Trial = 13549/30000 | Total reward = 47.05
2022-01-26 14:17:31.196 | DEBUG    | __main__:trials:24 - Trial = 13550/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.197 | DEBUG    | __main__:trials:29 - Trial = 13550/30000 | Total reward = 35.82
2022-01-26 14:17:31.201 | DEBUG    | __main__:trials:24 - Trial = 13551/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.202 | DEBUG    | __main__:trials:29 - Trial = 13551/30000 | Total reward = 47.65
2022-01-26 14:17:31.205 | DEBUG    | __main__:trials:24 - Trial = 13552/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.207 | DEBUG    | __main__:trials:29 - Trial = 13552/30000 | Total reward = 45.57
2022-01-26 14:17:31.210 | DEBUG    | __main__:trials:24 - Trial = 13553/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.212 | DEBUG    | __main__:trials:29 - Trial = 13553/30000 | Total reward = 56.11
2022-01-26 14:17:31.215 | DEBUG    | __main__:trials:24 - Trial = 13554/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.217 | DEBUG    | __main__:trials:29 - Trial = 13554/30000 | Total reward = 44.72
2022-01-26 14:17:31.220 | DEBUG    | __main__:trials:24 - Trial = 13555/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.221 | DEBUG    | __main__:trials:29 - Trial = 13555/30000 | Total reward = 57.24
2022-01-26 14:17:31.225 | DEBUG    | __main__:trials:24 - Trial = 13556/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.225 | DEBUG    | __main__:trials:29 - Trial = 13556/30000 | Total reward = 35.02
2022-01-26 14:17:31.228 | DEBUG    | __main__:trials:24 - Trial = 13557/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.229 | DEBUG    | __main__:trials:29 - Trial = 13557/30000 | Total reward = 40.61
2022-01-26 14:17:31.232 | DEBUG    | __main__:trials:24 - Trial = 13558/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.233 | DEBUG    | __main__:trials:29 - Trial = 13558/30000 | Total reward = 45.44
2022-01-26 14:17:31.236 | DEBUG    | __main__:trials:24 - Trial = 13559/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.238 | DEBUG    | __main__:trials:29 - Trial = 13559/30000 | Total reward = 37.97
2022-01-26 14:17:31.242 | DEBUG    | __main__:trials:24 - Trial = 13560/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.243 | DEBUG    | __main__:trials:29 - Trial = 13560/30000 | Total reward = 41.35
2022-01-26 14:17:31.247 | DEBUG    | __main__:trials:24 - Trial = 13561/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.248 | DEBUG    | __main__:trials:29 - Trial = 13561/30000 | Total reward = 67.66
2022-01-26 14:17:31.252 | DEBUG    | __main__:trials:24 - Trial = 13562/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.253 | DEBUG    | __main__:trials:29 - Trial = 13562/30000 | Total reward = 46.67
2022-01-26 14:17:31.257 | DEBUG    | __main__:trials:24 - Trial = 13563/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.258 | DEBUG    | __main__:trials:29 - Trial = 13563/30000 | Total reward = 39.31
2022-01-26 14:17:31.263 | DEBUG    | __main__:trials:24 - Trial = 13564/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.264 | DEBUG    | __main__:trials:29 - Trial = 13564/30000 | Total reward = 39.93
2022-01-26 14:17:31.268 | DEBUG    | __main__:trials:24 - Trial = 13565/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.270 | DEBUG    | __main__:trials:29 - Trial = 13565/30000 | Total reward = 46.16
2022-01-26 14:17:31.273 | DEBUG    | __main__:trials:24 - Trial = 13566/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.274 | DEBUG    | __main__:trials:29 - Trial = 13566/30000 | Total reward = 43.32
2022-01-26 14:17:31.278 | DEBUG    | __main__:trials:24 - Trial = 13567/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.280 | DEBUG    | __main__:trials:29 - Trial = 13567/30000 | Total reward = 40.59
2022-01-26 14:17:31.284 | DEBUG    | __main__:trials:24 - Trial = 13568/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.285 | DEBUG    | __main__:trials:29 - Trial = 13568/30000 | Total reward = 38.92
2022-01-26 14:17:31.289 | DEBUG    | __main__:trials:24 - Trial = 13569/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.291 | DEBUG    | __main__:trials:29 - Trial = 13569/30000 | Total reward = 49.76
2022-01-26 14:17:31.295 | DEBUG    | __main__:trials:24 - Trial = 13570/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.297 | DEBUG    | __main__:trials:29 - Trial = 13570/30000 | Total reward = 40.31
2022-01-26 14:17:31.301 | DEBUG    | __main__:trials:24 - Trial = 13571/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.301 | DEBUG    | __main__:trials:29 - Trial = 13571/30000 | Total reward = 56.42
2022-01-26 14:17:31.304 | DEBUG    | __main__:trials:24 - Trial = 13572/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.305 | DEBUG    | __main__:trials:29 - Trial = 13572/30000 | Total reward = 46.72
2022-01-26 14:17:31.309 | DEBUG    | __main__:trials:24 - Trial = 13573/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.309 | DEBUG    | __main__:trials:29 - Trial = 13573/30000 | Total reward = 53.13
2022-01-26 14:17:31.314 | DEBUG    | __main__:trials:24 - Trial = 13574/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.316 | DEBUG    | __main__:trials:29 - Trial = 13574/30000 | Total reward = 42.22
2022-01-26 14:17:31.318 | DEBUG    | __main__:trials:26 - Trial = 13575/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:31.320 | DEBUG    | __main__:trials:29 - Trial = 13575/30000 | Total reward = 20.45
2022-01-26 14:17:31.324 | DEBUG    | __main__:trials:24 - Trial = 13576/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.325 | DEBUG    | __main__:trials:29 - Trial = 13576/30000 | Total reward = 45.64
2022-01-26 14:17:31.329 | DEBUG    | __main__:trials:24 - Trial = 13577/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.331 | DEBUG    | __main__:trials:29 - Trial = 13577/30000 | Total reward = 35.38
2022-01-26 14:17:31.335 | DEBUG    | __main__:trials:24 - Trial = 13578/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.336 | DEBUG    | __main__:trials:29 - Trial = 13578/30000 | Total reward = 32.78
2022-01-26 14:17:31.339 | DEBUG    | __main__:trials:24 - Trial = 13579/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.341 | DEBUG    | __main__:trials:29 - Trial = 13579/30000 | Total reward = 51.66
2022-01-26 14:17:31.344 | DEBUG    | __main__:trials:24 - Trial = 13580/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.346 | DEBUG    | __main__:trials:29 - Trial = 13580/30000 | Total reward = 47.22
2022-01-26 14:17:31.350 | DEBUG    | __main__:trials:24 - Trial = 13581/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.351 | DEBUG    | __main__:trials:29 - Trial = 13581/30000 | Total reward = 45.03
2022-01-26 14:17:31.354 | DEBUG    | __main__:trials:24 - Trial = 13582/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.356 | DEBUG    | __main__:trials:29 - Trial = 13582/30000 | Total reward = 46.58
2022-01-26 14:17:31.360 | DEBUG    | __main__:trials:24 - Trial = 13583/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.361 | DEBUG    | __main__:trials:29 - Trial = 13583/30000 | Total reward = 47.72
2022-01-26 14:17:31.364 | DEBUG    | __main__:trials:24 - Trial = 13584/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.365 | DEBUG    | __main__:trials:29 - Trial = 13584/30000 | Total reward = 43.84
2022-01-26 14:17:31.369 | DEBUG    | __main__:trials:24 - Trial = 13585/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.369 | DEBUG    | __main__:trials:29 - Trial = 13585/30000 | Total reward = 30.58
2022-01-26 14:17:31.373 | DEBUG    | __main__:trials:24 - Trial = 13586/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.374 | DEBUG    | __main__:trials:29 - Trial = 13586/30000 | Total reward = 39.58
2022-01-26 14:17:31.378 | DEBUG    | __main__:trials:24 - Trial = 13587/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.379 | DEBUG    | __main__:trials:29 - Trial = 13587/30000 | Total reward = 52.76
2022-01-26 14:17:31.382 | DEBUG    | __main__:trials:24 - Trial = 13588/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.383 | DEBUG    | __main__:trials:29 - Trial = 13588/30000 | Total reward = 40.56
2022-01-26 14:17:31.387 | DEBUG    | __main__:trials:24 - Trial = 13589/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.388 | DEBUG    | __main__:trials:29 - Trial = 13589/30000 | Total reward = 39.89
2022-01-26 14:17:31.391 | DEBUG    | __main__:trials:24 - Trial = 13590/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.393 | DEBUG    | __main__:trials:29 - Trial = 13590/30000 | Total reward = 51.82
2022-01-26 14:17:31.396 | DEBUG    | __main__:trials:24 - Trial = 13591/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.397 | DEBUG    | __main__:trials:29 - Trial = 13591/30000 | Total reward = 48.59
2022-01-26 14:17:31.401 | DEBUG    | __main__:trials:24 - Trial = 13592/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.401 | DEBUG    | __main__:trials:29 - Trial = 13592/30000 | Total reward = 46.23
2022-01-26 14:17:31.405 | DEBUG    | __main__:trials:24 - Trial = 13593/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.407 | DEBUG    | __main__:trials:29 - Trial = 13593/30000 | Total reward = 42.54
2022-01-26 14:17:31.410 | DEBUG    | __main__:trials:24 - Trial = 13594/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.412 | DEBUG    | __main__:trials:29 - Trial = 13594/30000 | Total reward = 42.89
2022-01-26 14:17:31.416 | DEBUG    | __main__:trials:24 - Trial = 13595/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.417 | DEBUG    | __main__:trials:29 - Trial = 13595/30000 | Total reward = 38.79
2022-01-26 14:17:31.421 | DEBUG    | __main__:trials:24 - Trial = 13596/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.422 | DEBUG    | __main__:trials:29 - Trial = 13596/30000 | Total reward = 42.59
2022-01-26 14:17:31.425 | DEBUG    | __main__:trials:24 - Trial = 13597/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.426 | DEBUG    | __main__:trials:29 - Trial = 13597/30000 | Total reward = 51.00
2022-01-26 14:17:31.429 | DEBUG    | __main__:trials:24 - Trial = 13598/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.430 | DEBUG    | __main__:trials:29 - Trial = 13598/30000 | Total reward = 47.63
2022-01-26 14:17:31.433 | DEBUG    | __main__:trials:24 - Trial = 13599/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.435 | DEBUG    | __main__:trials:29 - Trial = 13599/30000 | Total reward = 46.87
2022-01-26 14:17:31.438 | DEBUG    | __main__:trials:24 - Trial = 13600/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.440 | DEBUG    | __main__:trials:29 - Trial = 13600/30000 | Total reward = 40.40
2022-01-26 14:17:31.443 | DEBUG    | __main__:trials:24 - Trial = 13601/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.445 | DEBUG    | __main__:trials:29 - Trial = 13601/30000 | Total reward = 49.36
2022-01-26 14:17:31.449 | DEBUG    | __main__:trials:24 - Trial = 13602/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.450 | DEBUG    | __main__:trials:29 - Trial = 13602/30000 | Total reward = 57.01
2022-01-26 14:17:31.454 | DEBUG    | __main__:trials:24 - Trial = 13603/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.456 | DEBUG    | __main__:trials:29 - Trial = 13603/30000 | Total reward = 47.25
2022-01-26 14:17:31.460 | DEBUG    | __main__:trials:24 - Trial = 13604/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.462 | DEBUG    | __main__:trials:29 - Trial = 13604/30000 | Total reward = 48.10
2022-01-26 14:17:31.465 | DEBUG    | __main__:trials:24 - Trial = 13605/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.467 | DEBUG    | __main__:trials:29 - Trial = 13605/30000 | Total reward = 56.97
2022-01-26 14:17:31.471 | DEBUG    | __main__:trials:24 - Trial = 13606/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.472 | DEBUG    | __main__:trials:29 - Trial = 13606/30000 | Total reward = 55.60
2022-01-26 14:17:31.476 | DEBUG    | __main__:trials:24 - Trial = 13607/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.477 | DEBUG    | __main__:trials:29 - Trial = 13607/30000 | Total reward = 47.34
2022-01-26 14:17:31.481 | DEBUG    | __main__:trials:24 - Trial = 13608/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.483 | DEBUG    | __main__:trials:29 - Trial = 13608/30000 | Total reward = 46.44
2022-01-26 14:17:31.487 | DEBUG    | __main__:trials:24 - Trial = 13609/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.488 | DEBUG    | __main__:trials:29 - Trial = 13609/30000 | Total reward = 38.67
2022-01-26 14:17:31.492 | DEBUG    | __main__:trials:24 - Trial = 13610/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.494 | DEBUG    | __main__:trials:29 - Trial = 13610/30000 | Total reward = 36.66
2022-01-26 14:17:31.498 | DEBUG    | __main__:trials:24 - Trial = 13611/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.499 | DEBUG    | __main__:trials:29 - Trial = 13611/30000 | Total reward = 42.17
2022-01-26 14:17:31.503 | DEBUG    | __main__:trials:24 - Trial = 13612/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.505 | DEBUG    | __main__:trials:29 - Trial = 13612/30000 | Total reward = 49.73
2022-01-26 14:17:31.508 | DEBUG    | __main__:trials:24 - Trial = 13613/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.510 | DEBUG    | __main__:trials:29 - Trial = 13613/30000 | Total reward = 54.11
2022-01-26 14:17:31.514 | DEBUG    | __main__:trials:24 - Trial = 13614/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.516 | DEBUG    | __main__:trials:29 - Trial = 13614/30000 | Total reward = 52.56
2022-01-26 14:17:31.519 | DEBUG    | __main__:trials:24 - Trial = 13615/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.521 | DEBUG    | __main__:trials:29 - Trial = 13615/30000 | Total reward = 49.52
2022-01-26 14:17:31.524 | DEBUG    | __main__:trials:24 - Trial = 13616/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.525 | DEBUG    | __main__:trials:29 - Trial = 13616/30000 | Total reward = 41.44
2022-01-26 14:17:31.529 | DEBUG    | __main__:trials:24 - Trial = 13617/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.530 | DEBUG    | __main__:trials:29 - Trial = 13617/30000 | Total reward = 45.13
2022-01-26 14:17:31.533 | DEBUG    | __main__:trials:24 - Trial = 13618/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.534 | DEBUG    | __main__:trials:29 - Trial = 13618/30000 | Total reward = 41.15
2022-01-26 14:17:31.538 | DEBUG    | __main__:trials:24 - Trial = 13619/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.540 | DEBUG    | __main__:trials:29 - Trial = 13619/30000 | Total reward = 30.46
2022-01-26 14:17:31.543 | DEBUG    | __main__:trials:24 - Trial = 13620/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.543 | DEBUG    | __main__:trials:29 - Trial = 13620/30000 | Total reward = 47.71
2022-01-26 14:17:31.547 | DEBUG    | __main__:trials:24 - Trial = 13621/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.548 | DEBUG    | __main__:trials:29 - Trial = 13621/30000 | Total reward = 43.53
2022-01-26 14:17:31.551 | DEBUG    | __main__:trials:24 - Trial = 13622/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.552 | DEBUG    | __main__:trials:29 - Trial = 13622/30000 | Total reward = 40.37
2022-01-26 14:17:31.555 | DEBUG    | __main__:trials:24 - Trial = 13623/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.557 | DEBUG    | __main__:trials:29 - Trial = 13623/30000 | Total reward = 47.46
2022-01-26 14:17:31.561 | DEBUG    | __main__:trials:24 - Trial = 13624/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.562 | DEBUG    | __main__:trials:29 - Trial = 13624/30000 | Total reward = 35.45
2022-01-26 14:17:31.566 | DEBUG    | __main__:trials:24 - Trial = 13625/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.567 | DEBUG    | __main__:trials:29 - Trial = 13625/30000 | Total reward = 47.05
2022-01-26 14:17:31.571 | DEBUG    | __main__:trials:24 - Trial = 13626/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.573 | DEBUG    | __main__:trials:29 - Trial = 13626/30000 | Total reward = 44.18
2022-01-26 14:17:31.577 | DEBUG    | __main__:trials:24 - Trial = 13627/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.578 | DEBUG    | __main__:trials:29 - Trial = 13627/30000 | Total reward = 44.31
2022-01-26 14:17:31.582 | DEBUG    | __main__:trials:24 - Trial = 13628/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.584 | DEBUG    | __main__:trials:29 - Trial = 13628/30000 | Total reward = 44.20
2022-01-26 14:17:31.587 | DEBUG    | __main__:trials:24 - Trial = 13629/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.589 | DEBUG    | __main__:trials:29 - Trial = 13629/30000 | Total reward = 45.50
2022-01-26 14:17:31.592 | DEBUG    | __main__:trials:24 - Trial = 13630/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.594 | DEBUG    | __main__:trials:29 - Trial = 13630/30000 | Total reward = 42.83
2022-01-26 14:17:31.598 | DEBUG    | __main__:trials:24 - Trial = 13631/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.599 | DEBUG    | __main__:trials:29 - Trial = 13631/30000 | Total reward = 46.22
2022-01-26 14:17:31.603 | DEBUG    | __main__:trials:24 - Trial = 13632/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.605 | DEBUG    | __main__:trials:29 - Trial = 13632/30000 | Total reward = 47.05
2022-01-26 14:17:31.609 | DEBUG    | __main__:trials:24 - Trial = 13633/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.611 | DEBUG    | __main__:trials:29 - Trial = 13633/30000 | Total reward = 41.47
2022-01-26 14:17:31.614 | DEBUG    | __main__:trials:24 - Trial = 13634/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.616 | DEBUG    | __main__:trials:29 - Trial = 13634/30000 | Total reward = 36.73
2022-01-26 14:17:31.619 | DEBUG    | __main__:trials:24 - Trial = 13635/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.621 | DEBUG    | __main__:trials:29 - Trial = 13635/30000 | Total reward = 38.99
2022-01-26 14:17:31.625 | DEBUG    | __main__:trials:24 - Trial = 13636/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.627 | DEBUG    | __main__:trials:29 - Trial = 13636/30000 | Total reward = 38.75
2022-01-26 14:17:31.631 | DEBUG    | __main__:trials:24 - Trial = 13637/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.632 | DEBUG    | __main__:trials:29 - Trial = 13637/30000 | Total reward = 38.37
2022-01-26 14:17:31.636 | DEBUG    | __main__:trials:24 - Trial = 13638/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.637 | DEBUG    | __main__:trials:29 - Trial = 13638/30000 | Total reward = 40.92
2022-01-26 14:17:31.641 | DEBUG    | __main__:trials:24 - Trial = 13639/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.643 | DEBUG    | __main__:trials:29 - Trial = 13639/30000 | Total reward = 38.83
2022-01-26 14:17:31.646 | DEBUG    | __main__:trials:24 - Trial = 13640/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.648 | DEBUG    | __main__:trials:29 - Trial = 13640/30000 | Total reward = 38.15
2022-01-26 14:17:31.652 | DEBUG    | __main__:trials:24 - Trial = 13641/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.653 | DEBUG    | __main__:trials:29 - Trial = 13641/30000 | Total reward = 46.76
2022-01-26 14:17:31.656 | DEBUG    | __main__:trials:24 - Trial = 13642/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.658 | DEBUG    | __main__:trials:29 - Trial = 13642/30000 | Total reward = 42.84
2022-01-26 14:17:31.662 | DEBUG    | __main__:trials:24 - Trial = 13643/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.663 | DEBUG    | __main__:trials:29 - Trial = 13643/30000 | Total reward = 57.87
2022-01-26 14:17:31.667 | DEBUG    | __main__:trials:24 - Trial = 13644/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.669 | DEBUG    | __main__:trials:29 - Trial = 13644/30000 | Total reward = 47.20
2022-01-26 14:17:31.672 | DEBUG    | __main__:trials:24 - Trial = 13645/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.674 | DEBUG    | __main__:trials:29 - Trial = 13645/30000 | Total reward = 54.17
2022-01-26 14:17:31.678 | DEBUG    | __main__:trials:24 - Trial = 13646/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.679 | DEBUG    | __main__:trials:29 - Trial = 13646/30000 | Total reward = 52.00
2022-01-26 14:17:31.683 | DEBUG    | __main__:trials:24 - Trial = 13647/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.685 | DEBUG    | __main__:trials:29 - Trial = 13647/30000 | Total reward = 38.33
2022-01-26 14:17:31.688 | DEBUG    | __main__:trials:24 - Trial = 13648/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.690 | DEBUG    | __main__:trials:29 - Trial = 13648/30000 | Total reward = 43.27
2022-01-26 14:17:31.694 | DEBUG    | __main__:trials:24 - Trial = 13649/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.695 | DEBUG    | __main__:trials:29 - Trial = 13649/30000 | Total reward = 32.44
2022-01-26 14:17:31.699 | DEBUG    | __main__:trials:24 - Trial = 13650/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.701 | DEBUG    | __main__:trials:29 - Trial = 13650/30000 | Total reward = 34.60
2022-01-26 14:17:31.705 | DEBUG    | __main__:trials:24 - Trial = 13651/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.706 | DEBUG    | __main__:trials:29 - Trial = 13651/30000 | Total reward = 38.41
2022-01-26 14:17:31.709 | DEBUG    | __main__:trials:24 - Trial = 13652/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.711 | DEBUG    | __main__:trials:29 - Trial = 13652/30000 | Total reward = 39.98
2022-01-26 14:17:31.715 | DEBUG    | __main__:trials:24 - Trial = 13653/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.717 | DEBUG    | __main__:trials:29 - Trial = 13653/30000 | Total reward = 41.49
2022-01-26 14:17:31.720 | DEBUG    | __main__:trials:24 - Trial = 13654/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.722 | DEBUG    | __main__:trials:29 - Trial = 13654/30000 | Total reward = 51.21
2022-01-26 14:17:31.725 | DEBUG    | __main__:trials:24 - Trial = 13655/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.725 | DEBUG    | __main__:trials:29 - Trial = 13655/30000 | Total reward = 39.40
2022-01-26 14:17:31.729 | DEBUG    | __main__:trials:24 - Trial = 13656/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.730 | DEBUG    | __main__:trials:29 - Trial = 13656/30000 | Total reward = 41.66
2022-01-26 14:17:31.734 | DEBUG    | __main__:trials:24 - Trial = 13657/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.736 | DEBUG    | __main__:trials:29 - Trial = 13657/30000 | Total reward = 37.00
2022-01-26 14:17:31.739 | DEBUG    | __main__:trials:24 - Trial = 13658/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.741 | DEBUG    | __main__:trials:29 - Trial = 13658/30000 | Total reward = 41.87
2022-01-26 14:17:31.744 | DEBUG    | __main__:trials:24 - Trial = 13659/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.745 | DEBUG    | __main__:trials:29 - Trial = 13659/30000 | Total reward = 46.67
2022-01-26 14:17:31.749 | DEBUG    | __main__:trials:24 - Trial = 13660/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.749 | DEBUG    | __main__:trials:29 - Trial = 13660/30000 | Total reward = 53.21
2022-01-26 14:17:31.754 | DEBUG    | __main__:trials:24 - Trial = 13661/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.756 | DEBUG    | __main__:trials:29 - Trial = 13661/30000 | Total reward = 46.10
2022-01-26 14:17:31.759 | DEBUG    | __main__:trials:24 - Trial = 13662/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.760 | DEBUG    | __main__:trials:29 - Trial = 13662/30000 | Total reward = 46.23
2022-01-26 14:17:31.765 | DEBUG    | __main__:trials:24 - Trial = 13663/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.766 | DEBUG    | __main__:trials:29 - Trial = 13663/30000 | Total reward = 47.86
2022-01-26 14:17:31.770 | DEBUG    | __main__:trials:24 - Trial = 13664/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.772 | DEBUG    | __main__:trials:29 - Trial = 13664/30000 | Total reward = 43.60
2022-01-26 14:17:31.776 | DEBUG    | __main__:trials:24 - Trial = 13665/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.777 | DEBUG    | __main__:trials:29 - Trial = 13665/30000 | Total reward = 45.19
2022-01-26 14:17:31.781 | DEBUG    | __main__:trials:24 - Trial = 13666/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.782 | DEBUG    | __main__:trials:29 - Trial = 13666/30000 | Total reward = 45.73
2022-01-26 14:17:31.785 | DEBUG    | __main__:trials:24 - Trial = 13667/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.786 | DEBUG    | __main__:trials:29 - Trial = 13667/30000 | Total reward = 55.10
2022-01-26 14:17:31.790 | DEBUG    | __main__:trials:24 - Trial = 13668/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.792 | DEBUG    | __main__:trials:29 - Trial = 13668/30000 | Total reward = 50.22
2022-01-26 14:17:31.795 | DEBUG    | __main__:trials:24 - Trial = 13669/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.796 | DEBUG    | __main__:trials:29 - Trial = 13669/30000 | Total reward = 40.29
2022-01-26 14:17:31.800 | DEBUG    | __main__:trials:24 - Trial = 13670/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.802 | DEBUG    | __main__:trials:29 - Trial = 13670/30000 | Total reward = 43.70
2022-01-26 14:17:31.807 | DEBUG    | __main__:trials:24 - Trial = 13671/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.809 | DEBUG    | __main__:trials:29 - Trial = 13671/30000 | Total reward = 40.64
2022-01-26 14:17:31.811 | DEBUG    | __main__:trials:24 - Trial = 13672/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.813 | DEBUG    | __main__:trials:29 - Trial = 13672/30000 | Total reward = 41.55
2022-01-26 14:17:31.816 | DEBUG    | __main__:trials:24 - Trial = 13673/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.819 | DEBUG    | __main__:trials:29 - Trial = 13673/30000 | Total reward = 43.13
2022-01-26 14:17:31.822 | DEBUG    | __main__:trials:24 - Trial = 13674/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.824 | DEBUG    | __main__:trials:29 - Trial = 13674/30000 | Total reward = 38.50
2022-01-26 14:17:31.828 | DEBUG    | __main__:trials:24 - Trial = 13675/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.829 | DEBUG    | __main__:trials:29 - Trial = 13675/30000 | Total reward = 53.45
2022-01-26 14:17:31.833 | DEBUG    | __main__:trials:24 - Trial = 13676/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.834 | DEBUG    | __main__:trials:29 - Trial = 13676/30000 | Total reward = 53.13
2022-01-26 14:17:31.838 | DEBUG    | __main__:trials:24 - Trial = 13677/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.840 | DEBUG    | __main__:trials:29 - Trial = 13677/30000 | Total reward = 45.32
2022-01-26 14:17:31.844 | DEBUG    | __main__:trials:24 - Trial = 13678/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.845 | DEBUG    | __main__:trials:29 - Trial = 13678/30000 | Total reward = 52.59
2022-01-26 14:17:31.849 | DEBUG    | __main__:trials:24 - Trial = 13679/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.850 | DEBUG    | __main__:trials:29 - Trial = 13679/30000 | Total reward = 48.18
2022-01-26 14:17:31.853 | DEBUG    | __main__:trials:24 - Trial = 13680/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.854 | DEBUG    | __main__:trials:29 - Trial = 13680/30000 | Total reward = 46.64
2022-01-26 14:17:31.857 | DEBUG    | __main__:trials:24 - Trial = 13681/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.859 | DEBUG    | __main__:trials:29 - Trial = 13681/30000 | Total reward = 33.69
2022-01-26 14:17:31.862 | DEBUG    | __main__:trials:24 - Trial = 13682/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.864 | DEBUG    | __main__:trials:29 - Trial = 13682/30000 | Total reward = 52.40
2022-01-26 14:17:31.867 | DEBUG    | __main__:trials:24 - Trial = 13683/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.869 | DEBUG    | __main__:trials:29 - Trial = 13683/30000 | Total reward = 49.05
2022-01-26 14:17:31.873 | DEBUG    | __main__:trials:24 - Trial = 13684/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.875 | DEBUG    | __main__:trials:29 - Trial = 13684/30000 | Total reward = 57.79
2022-01-26 14:17:31.879 | DEBUG    | __main__:trials:24 - Trial = 13685/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.880 | DEBUG    | __main__:trials:29 - Trial = 13685/30000 | Total reward = 53.61
2022-01-26 14:17:31.884 | DEBUG    | __main__:trials:24 - Trial = 13686/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.886 | DEBUG    | __main__:trials:29 - Trial = 13686/30000 | Total reward = 40.61
2022-01-26 14:17:31.889 | DEBUG    | __main__:trials:24 - Trial = 13687/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.891 | DEBUG    | __main__:trials:29 - Trial = 13687/30000 | Total reward = 43.03
2022-01-26 14:17:31.895 | DEBUG    | __main__:trials:24 - Trial = 13688/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.896 | DEBUG    | __main__:trials:29 - Trial = 13688/30000 | Total reward = 39.45
2022-01-26 14:17:31.900 | DEBUG    | __main__:trials:24 - Trial = 13689/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.901 | DEBUG    | __main__:trials:29 - Trial = 13689/30000 | Total reward = 40.84
2022-01-26 14:17:31.905 | DEBUG    | __main__:trials:24 - Trial = 13690/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.906 | DEBUG    | __main__:trials:29 - Trial = 13690/30000 | Total reward = 33.50
2022-01-26 14:17:31.910 | DEBUG    | __main__:trials:24 - Trial = 13691/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.912 | DEBUG    | __main__:trials:29 - Trial = 13691/30000 | Total reward = 40.59
2022-01-26 14:17:31.915 | DEBUG    | __main__:trials:24 - Trial = 13692/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.916 | DEBUG    | __main__:trials:29 - Trial = 13692/30000 | Total reward = 34.27
2022-01-26 14:17:31.920 | DEBUG    | __main__:trials:24 - Trial = 13693/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.922 | DEBUG    | __main__:trials:29 - Trial = 13693/30000 | Total reward = 47.45
2022-01-26 14:17:31.925 | DEBUG    | __main__:trials:24 - Trial = 13694/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.927 | DEBUG    | __main__:trials:29 - Trial = 13694/30000 | Total reward = 49.80
2022-01-26 14:17:31.931 | DEBUG    | __main__:trials:24 - Trial = 13695/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.932 | DEBUG    | __main__:trials:29 - Trial = 13695/30000 | Total reward = 41.31
2022-01-26 14:17:31.935 | DEBUG    | __main__:trials:24 - Trial = 13696/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.937 | DEBUG    | __main__:trials:29 - Trial = 13696/30000 | Total reward = 42.58
2022-01-26 14:17:31.941 | DEBUG    | __main__:trials:24 - Trial = 13697/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.942 | DEBUG    | __main__:trials:29 - Trial = 13697/30000 | Total reward = 42.58
2022-01-26 14:17:31.946 | DEBUG    | __main__:trials:24 - Trial = 13698/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.948 | DEBUG    | __main__:trials:29 - Trial = 13698/30000 | Total reward = 42.38
2022-01-26 14:17:31.951 | DEBUG    | __main__:trials:24 - Trial = 13699/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.953 | DEBUG    | __main__:trials:29 - Trial = 13699/30000 | Total reward = 38.66
2022-01-26 14:17:31.956 | DEBUG    | __main__:trials:24 - Trial = 13700/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.958 | DEBUG    | __main__:trials:29 - Trial = 13700/30000 | Total reward = 38.86
2022-01-26 14:17:31.962 | DEBUG    | __main__:trials:24 - Trial = 13701/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.963 | DEBUG    | __main__:trials:29 - Trial = 13701/30000 | Total reward = 52.11
2022-01-26 14:17:31.966 | DEBUG    | __main__:trials:24 - Trial = 13702/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.968 | DEBUG    | __main__:trials:29 - Trial = 13702/30000 | Total reward = 47.05
2022-01-26 14:17:31.972 | DEBUG    | __main__:trials:24 - Trial = 13703/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.974 | DEBUG    | __main__:trials:29 - Trial = 13703/30000 | Total reward = 45.50
2022-01-26 14:17:31.978 | DEBUG    | __main__:trials:24 - Trial = 13704/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.979 | DEBUG    | __main__:trials:29 - Trial = 13704/30000 | Total reward = 41.79
2022-01-26 14:17:31.983 | DEBUG    | __main__:trials:24 - Trial = 13705/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.985 | DEBUG    | __main__:trials:29 - Trial = 13705/30000 | Total reward = 47.02
2022-01-26 14:17:31.988 | DEBUG    | __main__:trials:24 - Trial = 13706/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.990 | DEBUG    | __main__:trials:29 - Trial = 13706/30000 | Total reward = 45.88
2022-01-26 14:17:31.994 | DEBUG    | __main__:trials:24 - Trial = 13707/30000 | Max number of steps (20) reached
2022-01-26 14:17:31.995 | DEBUG    | __main__:trials:29 - Trial = 13707/30000 | Total reward = 41.27
2022-01-26 14:17:31.999 | DEBUG    | __main__:trials:24 - Trial = 13708/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.001 | DEBUG    | __main__:trials:29 - Trial = 13708/30000 | Total reward = 36.70
2022-01-26 14:17:32.004 | DEBUG    | __main__:trials:24 - Trial = 13709/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.005 | DEBUG    | __main__:trials:29 - Trial = 13709/30000 | Total reward = 47.46
2022-01-26 14:17:32.008 | DEBUG    | __main__:trials:24 - Trial = 13710/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.010 | DEBUG    | __main__:trials:29 - Trial = 13710/30000 | Total reward = 53.84
2022-01-26 14:17:32.014 | DEBUG    | __main__:trials:24 - Trial = 13711/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.015 | DEBUG    | __main__:trials:29 - Trial = 13711/30000 | Total reward = 53.05
2022-01-26 14:17:32.019 | DEBUG    | __main__:trials:24 - Trial = 13712/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.020 | DEBUG    | __main__:trials:29 - Trial = 13712/30000 | Total reward = 42.77
2022-01-26 14:17:32.024 | DEBUG    | __main__:trials:24 - Trial = 13713/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.026 | DEBUG    | __main__:trials:29 - Trial = 13713/30000 | Total reward = 41.64
2022-01-26 14:17:32.030 | DEBUG    | __main__:trials:24 - Trial = 13714/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.032 | DEBUG    | __main__:trials:29 - Trial = 13714/30000 | Total reward = 49.09
2022-01-26 14:17:32.036 | DEBUG    | __main__:trials:24 - Trial = 13715/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.037 | DEBUG    | __main__:trials:29 - Trial = 13715/30000 | Total reward = 41.74
2022-01-26 14:17:32.041 | DEBUG    | __main__:trials:24 - Trial = 13716/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.043 | DEBUG    | __main__:trials:29 - Trial = 13716/30000 | Total reward = 43.11
2022-01-26 14:17:32.047 | DEBUG    | __main__:trials:24 - Trial = 13717/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.048 | DEBUG    | __main__:trials:29 - Trial = 13717/30000 | Total reward = 40.48
2022-01-26 14:17:32.052 | DEBUG    | __main__:trials:24 - Trial = 13718/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.054 | DEBUG    | __main__:trials:29 - Trial = 13718/30000 | Total reward = 51.10
2022-01-26 14:17:32.057 | DEBUG    | __main__:trials:24 - Trial = 13719/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.059 | DEBUG    | __main__:trials:29 - Trial = 13719/30000 | Total reward = 39.75
2022-01-26 14:17:32.063 | DEBUG    | __main__:trials:24 - Trial = 13720/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.064 | DEBUG    | __main__:trials:29 - Trial = 13720/30000 | Total reward = 38.64
2022-01-26 14:17:32.068 | DEBUG    | __main__:trials:24 - Trial = 13721/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.069 | DEBUG    | __main__:trials:29 - Trial = 13721/30000 | Total reward = 50.27
2022-01-26 14:17:32.072 | DEBUG    | __main__:trials:24 - Trial = 13722/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.074 | DEBUG    | __main__:trials:29 - Trial = 13722/30000 | Total reward = 38.28
2022-01-26 14:17:32.078 | DEBUG    | __main__:trials:24 - Trial = 13723/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.079 | DEBUG    | __main__:trials:29 - Trial = 13723/30000 | Total reward = 47.05
2022-01-26 14:17:32.083 | DEBUG    | __main__:trials:24 - Trial = 13724/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.084 | DEBUG    | __main__:trials:29 - Trial = 13724/30000 | Total reward = 46.83
2022-01-26 14:17:32.087 | DEBUG    | __main__:trials:24 - Trial = 13725/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.089 | DEBUG    | __main__:trials:29 - Trial = 13725/30000 | Total reward = 39.28
2022-01-26 14:17:32.093 | DEBUG    | __main__:trials:24 - Trial = 13726/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.095 | DEBUG    | __main__:trials:29 - Trial = 13726/30000 | Total reward = 47.20
2022-01-26 14:17:32.099 | DEBUG    | __main__:trials:24 - Trial = 13727/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.100 | DEBUG    | __main__:trials:29 - Trial = 13727/30000 | Total reward = 51.66
2022-01-26 14:17:32.104 | DEBUG    | __main__:trials:24 - Trial = 13728/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.105 | DEBUG    | __main__:trials:29 - Trial = 13728/30000 | Total reward = 46.87
2022-01-26 14:17:32.109 | DEBUG    | __main__:trials:24 - Trial = 13729/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.110 | DEBUG    | __main__:trials:29 - Trial = 13729/30000 | Total reward = 36.51
2022-01-26 14:17:32.114 | DEBUG    | __main__:trials:24 - Trial = 13730/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.116 | DEBUG    | __main__:trials:29 - Trial = 13730/30000 | Total reward = 46.52
2022-01-26 14:17:32.119 | DEBUG    | __main__:trials:24 - Trial = 13731/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.121 | DEBUG    | __main__:trials:29 - Trial = 13731/30000 | Total reward = 43.13
2022-01-26 14:17:32.124 | DEBUG    | __main__:trials:24 - Trial = 13732/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.126 | DEBUG    | __main__:trials:29 - Trial = 13732/30000 | Total reward = 44.42
2022-01-26 14:17:32.129 | DEBUG    | __main__:trials:24 - Trial = 13733/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.130 | DEBUG    | __main__:trials:29 - Trial = 13733/30000 | Total reward = 48.33
2022-01-26 14:17:32.133 | DEBUG    | __main__:trials:24 - Trial = 13734/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.134 | DEBUG    | __main__:trials:29 - Trial = 13734/30000 | Total reward = 37.69
2022-01-26 14:17:32.138 | DEBUG    | __main__:trials:24 - Trial = 13735/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.140 | DEBUG    | __main__:trials:29 - Trial = 13735/30000 | Total reward = 43.39
2022-01-26 14:17:32.144 | DEBUG    | __main__:trials:24 - Trial = 13736/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.145 | DEBUG    | __main__:trials:29 - Trial = 13736/30000 | Total reward = 40.57
2022-01-26 14:17:32.149 | DEBUG    | __main__:trials:24 - Trial = 13737/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.150 | DEBUG    | __main__:trials:29 - Trial = 13737/30000 | Total reward = 47.73
2022-01-26 14:17:32.153 | DEBUG    | __main__:trials:24 - Trial = 13738/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.154 | DEBUG    | __main__:trials:29 - Trial = 13738/30000 | Total reward = 44.18
2022-01-26 14:17:32.157 | DEBUG    | __main__:trials:24 - Trial = 13739/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.158 | DEBUG    | __main__:trials:29 - Trial = 13739/30000 | Total reward = 65.65
2022-01-26 14:17:32.161 | DEBUG    | __main__:trials:24 - Trial = 13740/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.162 | DEBUG    | __main__:trials:29 - Trial = 13740/30000 | Total reward = 49.46
2022-01-26 14:17:32.165 | DEBUG    | __main__:trials:24 - Trial = 13741/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.167 | DEBUG    | __main__:trials:29 - Trial = 13741/30000 | Total reward = 56.97
2022-01-26 14:17:32.171 | DEBUG    | __main__:trials:24 - Trial = 13742/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.172 | DEBUG    | __main__:trials:29 - Trial = 13742/30000 | Total reward = 48.43
2022-01-26 14:17:32.176 | DEBUG    | __main__:trials:24 - Trial = 13743/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.178 | DEBUG    | __main__:trials:29 - Trial = 13743/30000 | Total reward = 40.40
2022-01-26 14:17:32.182 | DEBUG    | __main__:trials:24 - Trial = 13744/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.183 | DEBUG    | __main__:trials:29 - Trial = 13744/30000 | Total reward = 39.97
2022-01-26 14:17:32.187 | DEBUG    | __main__:trials:24 - Trial = 13745/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.189 | DEBUG    | __main__:trials:29 - Trial = 13745/30000 | Total reward = 42.26
2022-01-26 14:17:32.192 | DEBUG    | __main__:trials:24 - Trial = 13746/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.193 | DEBUG    | __main__:trials:29 - Trial = 13746/30000 | Total reward = 55.85
2022-01-26 14:17:32.197 | DEBUG    | __main__:trials:24 - Trial = 13747/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.199 | DEBUG    | __main__:trials:29 - Trial = 13747/30000 | Total reward = 33.34
2022-01-26 14:17:32.202 | DEBUG    | __main__:trials:24 - Trial = 13748/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.204 | DEBUG    | __main__:trials:29 - Trial = 13748/30000 | Total reward = 44.41
2022-01-26 14:17:32.207 | DEBUG    | __main__:trials:24 - Trial = 13749/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.210 | DEBUG    | __main__:trials:29 - Trial = 13749/30000 | Total reward = 47.46
2022-01-26 14:17:32.213 | DEBUG    | __main__:trials:24 - Trial = 13750/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.215 | DEBUG    | __main__:trials:29 - Trial = 13750/30000 | Total reward = 46.23
2022-01-26 14:17:32.219 | DEBUG    | __main__:trials:24 - Trial = 13751/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.220 | DEBUG    | __main__:trials:29 - Trial = 13751/30000 | Total reward = 53.95
2022-01-26 14:17:32.224 | DEBUG    | __main__:trials:24 - Trial = 13752/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.224 | DEBUG    | __main__:trials:29 - Trial = 13752/30000 | Total reward = 44.14
2022-01-26 14:17:32.229 | DEBUG    | __main__:trials:24 - Trial = 13753/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.229 | DEBUG    | __main__:trials:29 - Trial = 13753/30000 | Total reward = 43.25
2022-01-26 14:17:32.233 | DEBUG    | __main__:trials:24 - Trial = 13754/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.234 | DEBUG    | __main__:trials:29 - Trial = 13754/30000 | Total reward = 47.20
2022-01-26 14:17:32.238 | DEBUG    | __main__:trials:24 - Trial = 13755/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.240 | DEBUG    | __main__:trials:29 - Trial = 13755/30000 | Total reward = 46.82
2022-01-26 14:17:32.243 | DEBUG    | __main__:trials:24 - Trial = 13756/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.245 | DEBUG    | __main__:trials:29 - Trial = 13756/30000 | Total reward = 34.94
2022-01-26 14:17:32.249 | DEBUG    | __main__:trials:24 - Trial = 13757/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.250 | DEBUG    | __main__:trials:29 - Trial = 13757/30000 | Total reward = 39.50
2022-01-26 14:17:32.254 | DEBUG    | __main__:trials:24 - Trial = 13758/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.256 | DEBUG    | __main__:trials:29 - Trial = 13758/30000 | Total reward = 38.59
2022-01-26 14:17:32.260 | DEBUG    | __main__:trials:24 - Trial = 13759/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.261 | DEBUG    | __main__:trials:29 - Trial = 13759/30000 | Total reward = 48.47
2022-01-26 14:17:32.265 | DEBUG    | __main__:trials:24 - Trial = 13760/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.267 | DEBUG    | __main__:trials:29 - Trial = 13760/30000 | Total reward = 44.74
2022-01-26 14:17:32.271 | DEBUG    | __main__:trials:24 - Trial = 13761/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.273 | DEBUG    | __main__:trials:29 - Trial = 13761/30000 | Total reward = 61.50
2022-01-26 14:17:32.276 | DEBUG    | __main__:trials:24 - Trial = 13762/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.278 | DEBUG    | __main__:trials:29 - Trial = 13762/30000 | Total reward = 57.04
2022-01-26 14:17:32.282 | DEBUG    | __main__:trials:24 - Trial = 13763/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.283 | DEBUG    | __main__:trials:29 - Trial = 13763/30000 | Total reward = 56.55
2022-01-26 14:17:32.286 | DEBUG    | __main__:trials:24 - Trial = 13764/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.288 | DEBUG    | __main__:trials:29 - Trial = 13764/30000 | Total reward = 39.98
2022-01-26 14:17:32.292 | DEBUG    | __main__:trials:24 - Trial = 13765/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.294 | DEBUG    | __main__:trials:29 - Trial = 13765/30000 | Total reward = 49.11
2022-01-26 14:17:32.297 | DEBUG    | __main__:trials:24 - Trial = 13766/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.298 | DEBUG    | __main__:trials:29 - Trial = 13766/30000 | Total reward = 46.70
2022-01-26 14:17:32.301 | DEBUG    | __main__:trials:24 - Trial = 13767/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.303 | DEBUG    | __main__:trials:29 - Trial = 13767/30000 | Total reward = 34.50
2022-01-26 14:17:32.306 | DEBUG    | __main__:trials:24 - Trial = 13768/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.308 | DEBUG    | __main__:trials:29 - Trial = 13768/30000 | Total reward = 50.62
2022-01-26 14:17:32.312 | DEBUG    | __main__:trials:24 - Trial = 13769/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.313 | DEBUG    | __main__:trials:29 - Trial = 13769/30000 | Total reward = 46.26
2022-01-26 14:17:32.317 | DEBUG    | __main__:trials:24 - Trial = 13770/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.319 | DEBUG    | __main__:trials:29 - Trial = 13770/30000 | Total reward = 47.11
2022-01-26 14:17:32.322 | DEBUG    | __main__:trials:24 - Trial = 13771/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.324 | DEBUG    | __main__:trials:29 - Trial = 13771/30000 | Total reward = 50.95
2022-01-26 14:17:32.327 | DEBUG    | __main__:trials:24 - Trial = 13772/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.328 | DEBUG    | __main__:trials:29 - Trial = 13772/30000 | Total reward = 49.46
2022-01-26 14:17:32.332 | DEBUG    | __main__:trials:24 - Trial = 13773/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.334 | DEBUG    | __main__:trials:29 - Trial = 13773/30000 | Total reward = 49.93
2022-01-26 14:17:32.338 | DEBUG    | __main__:trials:24 - Trial = 13774/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.339 | DEBUG    | __main__:trials:29 - Trial = 13774/30000 | Total reward = 47.51
2022-01-26 14:17:32.343 | DEBUG    | __main__:trials:24 - Trial = 13775/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.344 | DEBUG    | __main__:trials:29 - Trial = 13775/30000 | Total reward = 45.50
2022-01-26 14:17:32.348 | DEBUG    | __main__:trials:24 - Trial = 13776/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.349 | DEBUG    | __main__:trials:29 - Trial = 13776/30000 | Total reward = 44.65
2022-01-26 14:17:32.353 | DEBUG    | __main__:trials:24 - Trial = 13777/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.355 | DEBUG    | __main__:trials:29 - Trial = 13777/30000 | Total reward = 48.93
2022-01-26 14:17:32.358 | DEBUG    | __main__:trials:24 - Trial = 13778/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.359 | DEBUG    | __main__:trials:29 - Trial = 13778/30000 | Total reward = 46.21
2022-01-26 14:17:32.364 | DEBUG    | __main__:trials:24 - Trial = 13779/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.365 | DEBUG    | __main__:trials:29 - Trial = 13779/30000 | Total reward = 47.54
2022-01-26 14:17:32.369 | DEBUG    | __main__:trials:24 - Trial = 13780/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.371 | DEBUG    | __main__:trials:29 - Trial = 13780/30000 | Total reward = 44.91
2022-01-26 14:17:32.375 | DEBUG    | __main__:trials:24 - Trial = 13781/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.375 | DEBUG    | __main__:trials:29 - Trial = 13781/30000 | Total reward = 47.76
2022-01-26 14:17:32.380 | DEBUG    | __main__:trials:24 - Trial = 13782/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.381 | DEBUG    | __main__:trials:29 - Trial = 13782/30000 | Total reward = 48.98
2022-01-26 14:17:32.384 | DEBUG    | __main__:trials:24 - Trial = 13783/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.386 | DEBUG    | __main__:trials:29 - Trial = 13783/30000 | Total reward = 44.49
2022-01-26 14:17:32.390 | DEBUG    | __main__:trials:24 - Trial = 13784/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.392 | DEBUG    | __main__:trials:29 - Trial = 13784/30000 | Total reward = 62.25
2022-01-26 14:17:32.394 | DEBUG    | __main__:trials:24 - Trial = 13785/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.396 | DEBUG    | __main__:trials:29 - Trial = 13785/30000 | Total reward = 51.41
2022-01-26 14:17:32.399 | DEBUG    | __main__:trials:24 - Trial = 13786/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.401 | DEBUG    | __main__:trials:29 - Trial = 13786/30000 | Total reward = 38.48
2022-01-26 14:17:32.404 | DEBUG    | __main__:trials:24 - Trial = 13787/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.406 | DEBUG    | __main__:trials:29 - Trial = 13787/30000 | Total reward = 53.41
2022-01-26 14:17:32.409 | DEBUG    | __main__:trials:24 - Trial = 13788/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.410 | DEBUG    | __main__:trials:29 - Trial = 13788/30000 | Total reward = 54.41
2022-01-26 14:17:32.414 | DEBUG    | __main__:trials:24 - Trial = 13789/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.416 | DEBUG    | __main__:trials:29 - Trial = 13789/30000 | Total reward = 43.26
2022-01-26 14:17:32.420 | DEBUG    | __main__:trials:24 - Trial = 13790/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.421 | DEBUG    | __main__:trials:29 - Trial = 13790/30000 | Total reward = 33.75
2022-01-26 14:17:32.425 | DEBUG    | __main__:trials:24 - Trial = 13791/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.427 | DEBUG    | __main__:trials:29 - Trial = 13791/30000 | Total reward = 41.72
2022-01-26 14:17:32.431 | DEBUG    | __main__:trials:24 - Trial = 13792/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.432 | DEBUG    | __main__:trials:29 - Trial = 13792/30000 | Total reward = 51.47
2022-01-26 14:17:32.436 | DEBUG    | __main__:trials:24 - Trial = 13793/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.438 | DEBUG    | __main__:trials:29 - Trial = 13793/30000 | Total reward = 47.65
2022-01-26 14:17:32.441 | DEBUG    | __main__:trials:24 - Trial = 13794/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.443 | DEBUG    | __main__:trials:29 - Trial = 13794/30000 | Total reward = 63.33
2022-01-26 14:17:32.447 | DEBUG    | __main__:trials:24 - Trial = 13795/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.449 | DEBUG    | __main__:trials:29 - Trial = 13795/30000 | Total reward = 45.62
2022-01-26 14:17:32.453 | DEBUG    | __main__:trials:24 - Trial = 13796/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.453 | DEBUG    | __main__:trials:29 - Trial = 13796/30000 | Total reward = 47.40
2022-01-26 14:17:32.458 | DEBUG    | __main__:trials:24 - Trial = 13797/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.459 | DEBUG    | __main__:trials:29 - Trial = 13797/30000 | Total reward = 64.47
2022-01-26 14:17:32.463 | DEBUG    | __main__:trials:24 - Trial = 13798/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.464 | DEBUG    | __main__:trials:29 - Trial = 13798/30000 | Total reward = 41.79
2022-01-26 14:17:32.468 | DEBUG    | __main__:trials:24 - Trial = 13799/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.470 | DEBUG    | __main__:trials:29 - Trial = 13799/30000 | Total reward = 47.11
2022-01-26 14:17:32.474 | DEBUG    | __main__:trials:24 - Trial = 13800/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.475 | DEBUG    | __main__:trials:29 - Trial = 13800/30000 | Total reward = 47.02
2022-01-26 14:17:32.479 | DEBUG    | __main__:trials:24 - Trial = 13801/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.480 | DEBUG    | __main__:trials:29 - Trial = 13801/30000 | Total reward = 40.76
2022-01-26 14:17:32.484 | DEBUG    | __main__:trials:24 - Trial = 13802/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.486 | DEBUG    | __main__:trials:29 - Trial = 13802/30000 | Total reward = 47.60
2022-01-26 14:17:32.489 | DEBUG    | __main__:trials:24 - Trial = 13803/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.491 | DEBUG    | __main__:trials:29 - Trial = 13803/30000 | Total reward = 39.50
2022-01-26 14:17:32.495 | DEBUG    | __main__:trials:24 - Trial = 13804/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.496 | DEBUG    | __main__:trials:29 - Trial = 13804/30000 | Total reward = 43.66
2022-01-26 14:17:32.500 | DEBUG    | __main__:trials:24 - Trial = 13805/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.502 | DEBUG    | __main__:trials:29 - Trial = 13805/30000 | Total reward = 46.73
2022-01-26 14:17:32.506 | DEBUG    | __main__:trials:24 - Trial = 13806/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.508 | DEBUG    | __main__:trials:29 - Trial = 13806/30000 | Total reward = 46.41
2022-01-26 14:17:32.511 | DEBUG    | __main__:trials:24 - Trial = 13807/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.513 | DEBUG    | __main__:trials:29 - Trial = 13807/30000 | Total reward = 38.02
2022-01-26 14:17:32.517 | DEBUG    | __main__:trials:24 - Trial = 13808/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.517 | DEBUG    | __main__:trials:29 - Trial = 13808/30000 | Total reward = 45.80
2022-01-26 14:17:32.520 | DEBUG    | __main__:trials:24 - Trial = 13809/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.522 | DEBUG    | __main__:trials:29 - Trial = 13809/30000 | Total reward = 45.66
2022-01-26 14:17:32.526 | DEBUG    | __main__:trials:24 - Trial = 13810/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.527 | DEBUG    | __main__:trials:29 - Trial = 13810/30000 | Total reward = 39.53
2022-01-26 14:17:32.531 | DEBUG    | __main__:trials:24 - Trial = 13811/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.532 | DEBUG    | __main__:trials:29 - Trial = 13811/30000 | Total reward = 49.76
2022-01-26 14:17:32.535 | DEBUG    | __main__:trials:24 - Trial = 13812/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.537 | DEBUG    | __main__:trials:29 - Trial = 13812/30000 | Total reward = 45.04
2022-01-26 14:17:32.541 | DEBUG    | __main__:trials:24 - Trial = 13813/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.543 | DEBUG    | __main__:trials:29 - Trial = 13813/30000 | Total reward = 42.45
2022-01-26 14:17:32.546 | DEBUG    | __main__:trials:24 - Trial = 13814/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.548 | DEBUG    | __main__:trials:29 - Trial = 13814/30000 | Total reward = 43.59
2022-01-26 14:17:32.551 | DEBUG    | __main__:trials:24 - Trial = 13815/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.553 | DEBUG    | __main__:trials:29 - Trial = 13815/30000 | Total reward = 48.65
2022-01-26 14:17:32.556 | DEBUG    | __main__:trials:24 - Trial = 13816/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.558 | DEBUG    | __main__:trials:29 - Trial = 13816/30000 | Total reward = 40.04
2022-01-26 14:17:32.562 | DEBUG    | __main__:trials:24 - Trial = 13817/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.563 | DEBUG    | __main__:trials:29 - Trial = 13817/30000 | Total reward = 45.83
2022-01-26 14:17:32.567 | DEBUG    | __main__:trials:24 - Trial = 13818/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.569 | DEBUG    | __main__:trials:29 - Trial = 13818/30000 | Total reward = 44.11
2022-01-26 14:17:32.572 | DEBUG    | __main__:trials:24 - Trial = 13819/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.573 | DEBUG    | __main__:trials:29 - Trial = 13819/30000 | Total reward = 39.91
2022-01-26 14:17:32.576 | DEBUG    | __main__:trials:24 - Trial = 13820/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.577 | DEBUG    | __main__:trials:29 - Trial = 13820/30000 | Total reward = 47.49
2022-01-26 14:17:32.580 | DEBUG    | __main__:trials:24 - Trial = 13821/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.581 | DEBUG    | __main__:trials:29 - Trial = 13821/30000 | Total reward = 50.23
2022-01-26 14:17:32.585 | DEBUG    | __main__:trials:24 - Trial = 13822/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.587 | DEBUG    | __main__:trials:29 - Trial = 13822/30000 | Total reward = 43.17
2022-01-26 14:17:32.590 | DEBUG    | __main__:trials:24 - Trial = 13823/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.592 | DEBUG    | __main__:trials:29 - Trial = 13823/30000 | Total reward = 46.79
2022-01-26 14:17:32.596 | DEBUG    | __main__:trials:24 - Trial = 13824/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.598 | DEBUG    | __main__:trials:29 - Trial = 13824/30000 | Total reward = 48.64
2022-01-26 14:17:32.601 | DEBUG    | __main__:trials:24 - Trial = 13825/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.603 | DEBUG    | __main__:trials:29 - Trial = 13825/30000 | Total reward = 47.20
2022-01-26 14:17:32.607 | DEBUG    | __main__:trials:24 - Trial = 13826/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.608 | DEBUG    | __main__:trials:29 - Trial = 13826/30000 | Total reward = 47.05
2022-01-26 14:17:32.612 | DEBUG    | __main__:trials:24 - Trial = 13827/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.613 | DEBUG    | __main__:trials:29 - Trial = 13827/30000 | Total reward = 43.87
2022-01-26 14:17:32.617 | DEBUG    | __main__:trials:24 - Trial = 13828/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.619 | DEBUG    | __main__:trials:29 - Trial = 13828/30000 | Total reward = 48.26
2022-01-26 14:17:32.622 | DEBUG    | __main__:trials:24 - Trial = 13829/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.623 | DEBUG    | __main__:trials:29 - Trial = 13829/30000 | Total reward = 42.28
2022-01-26 14:17:32.627 | DEBUG    | __main__:trials:24 - Trial = 13830/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.629 | DEBUG    | __main__:trials:29 - Trial = 13830/30000 | Total reward = 51.96
2022-01-26 14:17:32.632 | DEBUG    | __main__:trials:24 - Trial = 13831/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.634 | DEBUG    | __main__:trials:29 - Trial = 13831/30000 | Total reward = 46.92
2022-01-26 14:17:32.638 | DEBUG    | __main__:trials:24 - Trial = 13832/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.640 | DEBUG    | __main__:trials:29 - Trial = 13832/30000 | Total reward = 49.43
2022-01-26 14:17:32.643 | DEBUG    | __main__:trials:24 - Trial = 13833/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.645 | DEBUG    | __main__:trials:29 - Trial = 13833/30000 | Total reward = 43.21
2022-01-26 14:17:32.648 | DEBUG    | __main__:trials:24 - Trial = 13834/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.650 | DEBUG    | __main__:trials:29 - Trial = 13834/30000 | Total reward = 41.40
2022-01-26 14:17:32.654 | DEBUG    | __main__:trials:24 - Trial = 13835/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.655 | DEBUG    | __main__:trials:29 - Trial = 13835/30000 | Total reward = 46.72
2022-01-26 14:17:32.659 | DEBUG    | __main__:trials:24 - Trial = 13836/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.661 | DEBUG    | __main__:trials:29 - Trial = 13836/30000 | Total reward = 39.04
2022-01-26 14:17:32.664 | DEBUG    | __main__:trials:24 - Trial = 13837/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.666 | DEBUG    | __main__:trials:29 - Trial = 13837/30000 | Total reward = 43.91
2022-01-26 14:17:32.669 | DEBUG    | __main__:trials:24 - Trial = 13838/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.671 | DEBUG    | __main__:trials:29 - Trial = 13838/30000 | Total reward = 58.16
2022-01-26 14:17:32.675 | DEBUG    | __main__:trials:24 - Trial = 13839/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.677 | DEBUG    | __main__:trials:29 - Trial = 13839/30000 | Total reward = 40.49
2022-01-26 14:17:32.680 | DEBUG    | __main__:trials:24 - Trial = 13840/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.682 | DEBUG    | __main__:trials:29 - Trial = 13840/30000 | Total reward = 42.75
2022-01-26 14:17:32.686 | DEBUG    | __main__:trials:24 - Trial = 13841/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.687 | DEBUG    | __main__:trials:29 - Trial = 13841/30000 | Total reward = 54.13
2022-01-26 14:17:32.690 | DEBUG    | __main__:trials:24 - Trial = 13842/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.692 | DEBUG    | __main__:trials:29 - Trial = 13842/30000 | Total reward = 46.61
2022-01-26 14:17:32.696 | DEBUG    | __main__:trials:24 - Trial = 13843/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.698 | DEBUG    | __main__:trials:29 - Trial = 13843/30000 | Total reward = 52.01
2022-01-26 14:17:32.702 | DEBUG    | __main__:trials:24 - Trial = 13844/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.703 | DEBUG    | __main__:trials:29 - Trial = 13844/30000 | Total reward = 39.77
2022-01-26 14:17:32.707 | DEBUG    | __main__:trials:24 - Trial = 13845/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.708 | DEBUG    | __main__:trials:29 - Trial = 13845/30000 | Total reward = 52.98
2022-01-26 14:17:32.712 | DEBUG    | __main__:trials:24 - Trial = 13846/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.714 | DEBUG    | __main__:trials:29 - Trial = 13846/30000 | Total reward = 39.98
2022-01-26 14:17:32.717 | DEBUG    | __main__:trials:24 - Trial = 13847/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.719 | DEBUG    | __main__:trials:29 - Trial = 13847/30000 | Total reward = 37.91
2022-01-26 14:17:32.723 | DEBUG    | __main__:trials:24 - Trial = 13848/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.723 | DEBUG    | __main__:trials:29 - Trial = 13848/30000 | Total reward = 24.76
2022-01-26 14:17:32.727 | DEBUG    | __main__:trials:24 - Trial = 13849/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.729 | DEBUG    | __main__:trials:29 - Trial = 13849/30000 | Total reward = 39.89
2022-01-26 14:17:32.733 | DEBUG    | __main__:trials:24 - Trial = 13850/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.734 | DEBUG    | __main__:trials:29 - Trial = 13850/30000 | Total reward = 43.60
2022-01-26 14:17:32.738 | DEBUG    | __main__:trials:24 - Trial = 13851/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.740 | DEBUG    | __main__:trials:29 - Trial = 13851/30000 | Total reward = 39.55
2022-01-26 14:17:32.744 | DEBUG    | __main__:trials:24 - Trial = 13852/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.746 | DEBUG    | __main__:trials:29 - Trial = 13852/30000 | Total reward = 39.32
2022-01-26 14:17:32.748 | DEBUG    | __main__:trials:24 - Trial = 13853/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.751 | DEBUG    | __main__:trials:29 - Trial = 13853/30000 | Total reward = 38.92
2022-01-26 14:17:32.755 | DEBUG    | __main__:trials:24 - Trial = 13854/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.756 | DEBUG    | __main__:trials:29 - Trial = 13854/30000 | Total reward = 44.25
2022-01-26 14:17:32.760 | DEBUG    | __main__:trials:24 - Trial = 13855/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.762 | DEBUG    | __main__:trials:29 - Trial = 13855/30000 | Total reward = 52.53
2022-01-26 14:17:32.765 | DEBUG    | __main__:trials:24 - Trial = 13856/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.767 | DEBUG    | __main__:trials:29 - Trial = 13856/30000 | Total reward = 38.90
2022-01-26 14:17:32.770 | DEBUG    | __main__:trials:24 - Trial = 13857/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.772 | DEBUG    | __main__:trials:29 - Trial = 13857/30000 | Total reward = 53.63
2022-01-26 14:17:32.775 | DEBUG    | __main__:trials:24 - Trial = 13858/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.777 | DEBUG    | __main__:trials:29 - Trial = 13858/30000 | Total reward = 40.16
2022-01-26 14:17:32.781 | DEBUG    | __main__:trials:24 - Trial = 13859/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.781 | DEBUG    | __main__:trials:29 - Trial = 13859/30000 | Total reward = 48.77
2022-01-26 14:17:32.785 | DEBUG    | __main__:trials:24 - Trial = 13860/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.785 | DEBUG    | __main__:trials:29 - Trial = 13860/30000 | Total reward = 40.44
2022-01-26 14:17:32.790 | DEBUG    | __main__:trials:24 - Trial = 13861/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.791 | DEBUG    | __main__:trials:29 - Trial = 13861/30000 | Total reward = 40.45
2022-01-26 14:17:32.794 | DEBUG    | __main__:trials:24 - Trial = 13862/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.797 | DEBUG    | __main__:trials:29 - Trial = 13862/30000 | Total reward = 47.36
2022-01-26 14:17:32.800 | DEBUG    | __main__:trials:24 - Trial = 13863/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.802 | DEBUG    | __main__:trials:29 - Trial = 13863/30000 | Total reward = 40.00
2022-01-26 14:17:32.806 | DEBUG    | __main__:trials:24 - Trial = 13864/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.808 | DEBUG    | __main__:trials:29 - Trial = 13864/30000 | Total reward = 47.24
2022-01-26 14:17:32.811 | DEBUG    | __main__:trials:24 - Trial = 13865/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.813 | DEBUG    | __main__:trials:29 - Trial = 13865/30000 | Total reward = 43.02
2022-01-26 14:17:32.816 | DEBUG    | __main__:trials:24 - Trial = 13866/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.818 | DEBUG    | __main__:trials:29 - Trial = 13866/30000 | Total reward = 42.23
2022-01-26 14:17:32.821 | DEBUG    | __main__:trials:24 - Trial = 13867/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.822 | DEBUG    | __main__:trials:29 - Trial = 13867/30000 | Total reward = 59.91
2022-01-26 14:17:32.826 | DEBUG    | __main__:trials:24 - Trial = 13868/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.827 | DEBUG    | __main__:trials:29 - Trial = 13868/30000 | Total reward = 53.41
2022-01-26 14:17:32.831 | DEBUG    | __main__:trials:24 - Trial = 13869/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.833 | DEBUG    | __main__:trials:29 - Trial = 13869/30000 | Total reward = 48.06
2022-01-26 14:17:32.837 | DEBUG    | __main__:trials:24 - Trial = 13870/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.838 | DEBUG    | __main__:trials:29 - Trial = 13870/30000 | Total reward = 39.73
2022-01-26 14:17:32.842 | DEBUG    | __main__:trials:24 - Trial = 13871/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.844 | DEBUG    | __main__:trials:29 - Trial = 13871/30000 | Total reward = 37.33
2022-01-26 14:17:32.847 | DEBUG    | __main__:trials:24 - Trial = 13872/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.849 | DEBUG    | __main__:trials:29 - Trial = 13872/30000 | Total reward = 43.03
2022-01-26 14:17:32.853 | DEBUG    | __main__:trials:24 - Trial = 13873/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.854 | DEBUG    | __main__:trials:29 - Trial = 13873/30000 | Total reward = 40.49
2022-01-26 14:17:32.857 | DEBUG    | __main__:trials:24 - Trial = 13874/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.857 | DEBUG    | __main__:trials:29 - Trial = 13874/30000 | Total reward = 43.58
2022-01-26 14:17:32.861 | DEBUG    | __main__:trials:24 - Trial = 13875/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.862 | DEBUG    | __main__:trials:29 - Trial = 13875/30000 | Total reward = 47.02
2022-01-26 14:17:32.865 | DEBUG    | __main__:trials:24 - Trial = 13876/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.866 | DEBUG    | __main__:trials:29 - Trial = 13876/30000 | Total reward = 55.40
2022-01-26 14:17:32.870 | DEBUG    | __main__:trials:24 - Trial = 13877/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.872 | DEBUG    | __main__:trials:29 - Trial = 13877/30000 | Total reward = 58.93
2022-01-26 14:17:32.876 | DEBUG    | __main__:trials:24 - Trial = 13878/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.877 | DEBUG    | __main__:trials:29 - Trial = 13878/30000 | Total reward = 33.75
2022-01-26 14:17:32.880 | DEBUG    | __main__:trials:24 - Trial = 13879/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.881 | DEBUG    | __main__:trials:29 - Trial = 13879/30000 | Total reward = 42.49
2022-01-26 14:17:32.885 | DEBUG    | __main__:trials:24 - Trial = 13880/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.887 | DEBUG    | __main__:trials:29 - Trial = 13880/30000 | Total reward = 45.34
2022-01-26 14:17:32.891 | DEBUG    | __main__:trials:24 - Trial = 13881/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.892 | DEBUG    | __main__:trials:29 - Trial = 13881/30000 | Total reward = 44.17
2022-01-26 14:17:32.896 | DEBUG    | __main__:trials:24 - Trial = 13882/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.897 | DEBUG    | __main__:trials:29 - Trial = 13882/30000 | Total reward = 43.00
2022-01-26 14:17:32.901 | DEBUG    | __main__:trials:24 - Trial = 13883/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.903 | DEBUG    | __main__:trials:29 - Trial = 13883/30000 | Total reward = 51.56
2022-01-26 14:17:32.906 | DEBUG    | __main__:trials:24 - Trial = 13884/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.908 | DEBUG    | __main__:trials:29 - Trial = 13884/30000 | Total reward = 48.37
2022-01-26 14:17:32.912 | DEBUG    | __main__:trials:24 - Trial = 13885/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.914 | DEBUG    | __main__:trials:29 - Trial = 13885/30000 | Total reward = 46.94
2022-01-26 14:17:32.918 | DEBUG    | __main__:trials:24 - Trial = 13886/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.919 | DEBUG    | __main__:trials:29 - Trial = 13886/30000 | Total reward = 47.55
2022-01-26 14:17:32.923 | DEBUG    | __main__:trials:24 - Trial = 13887/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.925 | DEBUG    | __main__:trials:29 - Trial = 13887/30000 | Total reward = 44.19
2022-01-26 14:17:32.928 | DEBUG    | __main__:trials:24 - Trial = 13888/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.929 | DEBUG    | __main__:trials:29 - Trial = 13888/30000 | Total reward = 48.60
2022-01-26 14:17:32.932 | DEBUG    | __main__:trials:24 - Trial = 13889/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.934 | DEBUG    | __main__:trials:29 - Trial = 13889/30000 | Total reward = 53.25
2022-01-26 14:17:32.937 | DEBUG    | __main__:trials:24 - Trial = 13890/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.939 | DEBUG    | __main__:trials:29 - Trial = 13890/30000 | Total reward = 57.07
2022-01-26 14:17:32.943 | DEBUG    | __main__:trials:24 - Trial = 13891/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.944 | DEBUG    | __main__:trials:29 - Trial = 13891/30000 | Total reward = 50.97
2022-01-26 14:17:32.948 | DEBUG    | __main__:trials:24 - Trial = 13892/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.949 | DEBUG    | __main__:trials:29 - Trial = 13892/30000 | Total reward = 59.43
2022-01-26 14:17:32.953 | DEBUG    | __main__:trials:24 - Trial = 13893/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.955 | DEBUG    | __main__:trials:29 - Trial = 13893/30000 | Total reward = 42.95
2022-01-26 14:17:32.959 | DEBUG    | __main__:trials:24 - Trial = 13894/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.960 | DEBUG    | __main__:trials:29 - Trial = 13894/30000 | Total reward = 52.57
2022-01-26 14:17:32.963 | DEBUG    | __main__:trials:24 - Trial = 13895/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.966 | DEBUG    | __main__:trials:29 - Trial = 13895/30000 | Total reward = 53.27
2022-01-26 14:17:32.970 | DEBUG    | __main__:trials:24 - Trial = 13896/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.971 | DEBUG    | __main__:trials:29 - Trial = 13896/30000 | Total reward = 42.70
2022-01-26 14:17:32.974 | DEBUG    | __main__:trials:24 - Trial = 13897/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.976 | DEBUG    | __main__:trials:29 - Trial = 13897/30000 | Total reward = 47.54
2022-01-26 14:17:32.980 | DEBUG    | __main__:trials:24 - Trial = 13898/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.981 | DEBUG    | __main__:trials:29 - Trial = 13898/30000 | Total reward = 41.50
2022-01-26 14:17:32.985 | DEBUG    | __main__:trials:24 - Trial = 13899/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.987 | DEBUG    | __main__:trials:29 - Trial = 13899/30000 | Total reward = 55.03
2022-01-26 14:17:32.991 | DEBUG    | __main__:trials:24 - Trial = 13900/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.992 | DEBUG    | __main__:trials:29 - Trial = 13900/30000 | Total reward = 43.48
2022-01-26 14:17:32.996 | DEBUG    | __main__:trials:24 - Trial = 13901/30000 | Max number of steps (20) reached
2022-01-26 14:17:32.998 | DEBUG    | __main__:trials:29 - Trial = 13901/30000 | Total reward = 52.76
2022-01-26 14:17:33.001 | DEBUG    | __main__:trials:24 - Trial = 13902/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.002 | DEBUG    | __main__:trials:29 - Trial = 13902/30000 | Total reward = 45.80
2022-01-26 14:17:33.006 | DEBUG    | __main__:trials:24 - Trial = 13903/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.007 | DEBUG    | __main__:trials:29 - Trial = 13903/30000 | Total reward = 36.95
2022-01-26 14:17:33.011 | DEBUG    | __main__:trials:24 - Trial = 13904/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.013 | DEBUG    | __main__:trials:29 - Trial = 13904/30000 | Total reward = 43.41
2022-01-26 14:17:33.016 | DEBUG    | __main__:trials:24 - Trial = 13905/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.018 | DEBUG    | __main__:trials:29 - Trial = 13905/30000 | Total reward = 39.30
2022-01-26 14:17:33.022 | DEBUG    | __main__:trials:24 - Trial = 13906/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.022 | DEBUG    | __main__:trials:29 - Trial = 13906/30000 | Total reward = 49.75
2022-01-26 14:17:33.026 | DEBUG    | __main__:trials:24 - Trial = 13907/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.028 | DEBUG    | __main__:trials:29 - Trial = 13907/30000 | Total reward = 38.99
2022-01-26 14:17:33.032 | DEBUG    | __main__:trials:24 - Trial = 13908/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.033 | DEBUG    | __main__:trials:29 - Trial = 13908/30000 | Total reward = 51.85
2022-01-26 14:17:33.037 | DEBUG    | __main__:trials:26 - Trial = 13909/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:33.037 | DEBUG    | __main__:trials:29 - Trial = 13909/30000 | Total reward = 20.14
2022-01-26 14:17:33.040 | DEBUG    | __main__:trials:24 - Trial = 13910/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.041 | DEBUG    | __main__:trials:29 - Trial = 13910/30000 | Total reward = 45.84
2022-01-26 14:17:33.044 | DEBUG    | __main__:trials:24 - Trial = 13911/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.045 | DEBUG    | __main__:trials:29 - Trial = 13911/30000 | Total reward = 39.66
2022-01-26 14:17:33.048 | DEBUG    | __main__:trials:24 - Trial = 13912/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.049 | DEBUG    | __main__:trials:29 - Trial = 13912/30000 | Total reward = 38.18
2022-01-26 14:17:33.052 | DEBUG    | __main__:trials:24 - Trial = 13913/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.054 | DEBUG    | __main__:trials:29 - Trial = 13913/30000 | Total reward = 29.48
2022-01-26 14:17:33.058 | DEBUG    | __main__:trials:24 - Trial = 13914/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.060 | DEBUG    | __main__:trials:29 - Trial = 13914/30000 | Total reward = 42.57
2022-01-26 14:17:33.063 | DEBUG    | __main__:trials:24 - Trial = 13915/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.065 | DEBUG    | __main__:trials:29 - Trial = 13915/30000 | Total reward = 35.38
2022-01-26 14:17:33.069 | DEBUG    | __main__:trials:24 - Trial = 13916/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.070 | DEBUG    | __main__:trials:29 - Trial = 13916/30000 | Total reward = 39.20
2022-01-26 14:17:33.073 | DEBUG    | __main__:trials:24 - Trial = 13917/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.075 | DEBUG    | __main__:trials:29 - Trial = 13917/30000 | Total reward = 40.59
2022-01-26 14:17:33.078 | DEBUG    | __main__:trials:24 - Trial = 13918/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.080 | DEBUG    | __main__:trials:29 - Trial = 13918/30000 | Total reward = 39.67
2022-01-26 14:17:33.084 | DEBUG    | __main__:trials:24 - Trial = 13919/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.085 | DEBUG    | __main__:trials:29 - Trial = 13919/30000 | Total reward = 39.51
2022-01-26 14:17:33.088 | DEBUG    | __main__:trials:24 - Trial = 13920/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.090 | DEBUG    | __main__:trials:29 - Trial = 13920/30000 | Total reward = 37.03
2022-01-26 14:17:33.093 | DEBUG    | __main__:trials:24 - Trial = 13921/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.095 | DEBUG    | __main__:trials:29 - Trial = 13921/30000 | Total reward = 35.36
2022-01-26 14:17:33.098 | DEBUG    | __main__:trials:24 - Trial = 13922/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.099 | DEBUG    | __main__:trials:29 - Trial = 13922/30000 | Total reward = 38.89
2022-01-26 14:17:33.103 | DEBUG    | __main__:trials:24 - Trial = 13923/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.104 | DEBUG    | __main__:trials:29 - Trial = 13923/30000 | Total reward = 50.85
2022-01-26 14:17:33.107 | DEBUG    | __main__:trials:24 - Trial = 13924/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.109 | DEBUG    | __main__:trials:29 - Trial = 13924/30000 | Total reward = 40.14
2022-01-26 14:17:33.112 | DEBUG    | __main__:trials:24 - Trial = 13925/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.114 | DEBUG    | __main__:trials:29 - Trial = 13925/30000 | Total reward = 28.22
2022-01-26 14:17:33.118 | DEBUG    | __main__:trials:24 - Trial = 13926/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.120 | DEBUG    | __main__:trials:29 - Trial = 13926/30000 | Total reward = 45.02
2022-01-26 14:17:33.123 | DEBUG    | __main__:trials:24 - Trial = 13927/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.125 | DEBUG    | __main__:trials:29 - Trial = 13927/30000 | Total reward = 40.06
2022-01-26 14:17:33.128 | DEBUG    | __main__:trials:26 - Trial = 13928/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:33.130 | DEBUG    | __main__:trials:29 - Trial = 13928/30000 | Total reward = 30.00
2022-01-26 14:17:33.133 | DEBUG    | __main__:trials:24 - Trial = 13929/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.135 | DEBUG    | __main__:trials:29 - Trial = 13929/30000 | Total reward = 41.15
2022-01-26 14:17:33.139 | DEBUG    | __main__:trials:24 - Trial = 13930/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.141 | DEBUG    | __main__:trials:29 - Trial = 13930/30000 | Total reward = 38.92
2022-01-26 14:17:33.144 | DEBUG    | __main__:trials:24 - Trial = 13931/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.146 | DEBUG    | __main__:trials:29 - Trial = 13931/30000 | Total reward = 44.07
2022-01-26 14:17:33.149 | DEBUG    | __main__:trials:24 - Trial = 13932/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.150 | DEBUG    | __main__:trials:29 - Trial = 13932/30000 | Total reward = 45.36
2022-01-26 14:17:33.154 | DEBUG    | __main__:trials:24 - Trial = 13933/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.156 | DEBUG    | __main__:trials:29 - Trial = 13933/30000 | Total reward = 43.70
2022-01-26 14:17:33.159 | DEBUG    | __main__:trials:24 - Trial = 13934/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.161 | DEBUG    | __main__:trials:29 - Trial = 13934/30000 | Total reward = 36.98
2022-01-26 14:17:33.165 | DEBUG    | __main__:trials:24 - Trial = 13935/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.165 | DEBUG    | __main__:trials:29 - Trial = 13935/30000 | Total reward = 44.84
2022-01-26 14:17:33.169 | DEBUG    | __main__:trials:24 - Trial = 13936/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.171 | DEBUG    | __main__:trials:29 - Trial = 13936/30000 | Total reward = 64.16
2022-01-26 14:17:33.174 | DEBUG    | __main__:trials:24 - Trial = 13937/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.177 | DEBUG    | __main__:trials:29 - Trial = 13937/30000 | Total reward = 47.20
2022-01-26 14:17:33.180 | DEBUG    | __main__:trials:24 - Trial = 13938/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.182 | DEBUG    | __main__:trials:29 - Trial = 13938/30000 | Total reward = 39.61
2022-01-26 14:17:33.186 | DEBUG    | __main__:trials:24 - Trial = 13939/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.187 | DEBUG    | __main__:trials:29 - Trial = 13939/30000 | Total reward = 45.84
2022-01-26 14:17:33.191 | DEBUG    | __main__:trials:24 - Trial = 13940/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.192 | DEBUG    | __main__:trials:29 - Trial = 13940/30000 | Total reward = 46.16
2022-01-26 14:17:33.197 | DEBUG    | __main__:trials:24 - Trial = 13941/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.199 | DEBUG    | __main__:trials:29 - Trial = 13941/30000 | Total reward = 51.12
2022-01-26 14:17:33.203 | DEBUG    | __main__:trials:24 - Trial = 13942/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.204 | DEBUG    | __main__:trials:29 - Trial = 13942/30000 | Total reward = 39.86
2022-01-26 14:17:33.208 | DEBUG    | __main__:trials:24 - Trial = 13943/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.209 | DEBUG    | __main__:trials:29 - Trial = 13943/30000 | Total reward = 47.46
2022-01-26 14:17:33.212 | DEBUG    | __main__:trials:24 - Trial = 13944/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.214 | DEBUG    | __main__:trials:29 - Trial = 13944/30000 | Total reward = 45.28
2022-01-26 14:17:33.218 | DEBUG    | __main__:trials:24 - Trial = 13945/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.219 | DEBUG    | __main__:trials:29 - Trial = 13945/30000 | Total reward = 42.91
2022-01-26 14:17:33.222 | DEBUG    | __main__:trials:24 - Trial = 13946/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.224 | DEBUG    | __main__:trials:29 - Trial = 13946/30000 | Total reward = 41.73
2022-01-26 14:17:33.228 | DEBUG    | __main__:trials:24 - Trial = 13947/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.230 | DEBUG    | __main__:trials:29 - Trial = 13947/30000 | Total reward = 52.89
2022-01-26 14:17:33.233 | DEBUG    | __main__:trials:24 - Trial = 13948/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.235 | DEBUG    | __main__:trials:29 - Trial = 13948/30000 | Total reward = 49.20
2022-01-26 14:17:33.238 | DEBUG    | __main__:trials:24 - Trial = 13949/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.240 | DEBUG    | __main__:trials:29 - Trial = 13949/30000 | Total reward = 53.52
2022-01-26 14:17:33.244 | DEBUG    | __main__:trials:24 - Trial = 13950/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.244 | DEBUG    | __main__:trials:29 - Trial = 13950/30000 | Total reward = 52.19
2022-01-26 14:17:33.248 | DEBUG    | __main__:trials:24 - Trial = 13951/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.249 | DEBUG    | __main__:trials:29 - Trial = 13951/30000 | Total reward = 48.97
2022-01-26 14:17:33.252 | DEBUG    | __main__:trials:24 - Trial = 13952/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.254 | DEBUG    | __main__:trials:29 - Trial = 13952/30000 | Total reward = 45.89
2022-01-26 14:17:33.258 | DEBUG    | __main__:trials:24 - Trial = 13953/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.260 | DEBUG    | __main__:trials:29 - Trial = 13953/30000 | Total reward = 60.51
2022-01-26 14:17:33.263 | DEBUG    | __main__:trials:24 - Trial = 13954/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.265 | DEBUG    | __main__:trials:29 - Trial = 13954/30000 | Total reward = 41.13
2022-01-26 14:17:33.269 | DEBUG    | __main__:trials:24 - Trial = 13955/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.269 | DEBUG    | __main__:trials:29 - Trial = 13955/30000 | Total reward = 46.41
2022-01-26 14:17:33.272 | DEBUG    | __main__:trials:24 - Trial = 13956/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.274 | DEBUG    | __main__:trials:29 - Trial = 13956/30000 | Total reward = 47.72
2022-01-26 14:17:33.278 | DEBUG    | __main__:trials:24 - Trial = 13957/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.278 | DEBUG    | __main__:trials:29 - Trial = 13957/30000 | Total reward = 41.92
2022-01-26 14:17:33.283 | DEBUG    | __main__:trials:24 - Trial = 13958/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.284 | DEBUG    | __main__:trials:29 - Trial = 13958/30000 | Total reward = 47.05
2022-01-26 14:17:33.288 | DEBUG    | __main__:trials:24 - Trial = 13959/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.289 | DEBUG    | __main__:trials:29 - Trial = 13959/30000 | Total reward = 47.48
2022-01-26 14:17:33.293 | DEBUG    | __main__:trials:24 - Trial = 13960/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.294 | DEBUG    | __main__:trials:29 - Trial = 13960/30000 | Total reward = 45.13
2022-01-26 14:17:33.299 | DEBUG    | __main__:trials:24 - Trial = 13961/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.300 | DEBUG    | __main__:trials:29 - Trial = 13961/30000 | Total reward = 51.56
2022-01-26 14:17:33.304 | DEBUG    | __main__:trials:24 - Trial = 13962/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.306 | DEBUG    | __main__:trials:29 - Trial = 13962/30000 | Total reward = 45.72
2022-01-26 14:17:33.310 | DEBUG    | __main__:trials:24 - Trial = 13963/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.311 | DEBUG    | __main__:trials:29 - Trial = 13963/30000 | Total reward = 47.92
2022-01-26 14:17:33.315 | DEBUG    | __main__:trials:24 - Trial = 13964/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.317 | DEBUG    | __main__:trials:29 - Trial = 13964/30000 | Total reward = 43.02
2022-01-26 14:17:33.320 | DEBUG    | __main__:trials:24 - Trial = 13965/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.322 | DEBUG    | __main__:trials:29 - Trial = 13965/30000 | Total reward = 47.05
2022-01-26 14:17:33.326 | DEBUG    | __main__:trials:24 - Trial = 13966/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.328 | DEBUG    | __main__:trials:29 - Trial = 13966/30000 | Total reward = 42.24
2022-01-26 14:17:33.331 | DEBUG    | __main__:trials:24 - Trial = 13967/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.333 | DEBUG    | __main__:trials:29 - Trial = 13967/30000 | Total reward = 40.45
2022-01-26 14:17:33.336 | DEBUG    | __main__:trials:24 - Trial = 13968/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.338 | DEBUG    | __main__:trials:29 - Trial = 13968/30000 | Total reward = 43.94
2022-01-26 14:17:33.342 | DEBUG    | __main__:trials:24 - Trial = 13969/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.344 | DEBUG    | __main__:trials:29 - Trial = 13969/30000 | Total reward = 31.39
2022-01-26 14:17:33.348 | DEBUG    | __main__:trials:24 - Trial = 13970/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.350 | DEBUG    | __main__:trials:29 - Trial = 13970/30000 | Total reward = 42.58
2022-01-26 14:17:33.353 | DEBUG    | __main__:trials:24 - Trial = 13971/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.355 | DEBUG    | __main__:trials:29 - Trial = 13971/30000 | Total reward = 45.52
2022-01-26 14:17:33.359 | DEBUG    | __main__:trials:24 - Trial = 13972/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.361 | DEBUG    | __main__:trials:29 - Trial = 13972/30000 | Total reward = 43.05
2022-01-26 14:17:33.364 | DEBUG    | __main__:trials:24 - Trial = 13973/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.366 | DEBUG    | __main__:trials:29 - Trial = 13973/30000 | Total reward = 39.10
2022-01-26 14:17:33.370 | DEBUG    | __main__:trials:24 - Trial = 13974/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.371 | DEBUG    | __main__:trials:29 - Trial = 13974/30000 | Total reward = 49.65
2022-01-26 14:17:33.375 | DEBUG    | __main__:trials:24 - Trial = 13975/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.377 | DEBUG    | __main__:trials:29 - Trial = 13975/30000 | Total reward = 38.66
2022-01-26 14:17:33.380 | DEBUG    | __main__:trials:24 - Trial = 13976/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.382 | DEBUG    | __main__:trials:29 - Trial = 13976/30000 | Total reward = 42.48
2022-01-26 14:17:33.385 | DEBUG    | __main__:trials:24 - Trial = 13977/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.386 | DEBUG    | __main__:trials:29 - Trial = 13977/30000 | Total reward = 53.33
2022-01-26 14:17:33.389 | DEBUG    | __main__:trials:24 - Trial = 13978/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.391 | DEBUG    | __main__:trials:29 - Trial = 13978/30000 | Total reward = 53.13
2022-01-26 14:17:33.395 | DEBUG    | __main__:trials:24 - Trial = 13979/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.396 | DEBUG    | __main__:trials:29 - Trial = 13979/30000 | Total reward = 39.42
2022-01-26 14:17:33.399 | DEBUG    | __main__:trials:24 - Trial = 13980/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.401 | DEBUG    | __main__:trials:29 - Trial = 13980/30000 | Total reward = 41.76
2022-01-26 14:17:33.405 | DEBUG    | __main__:trials:24 - Trial = 13981/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.406 | DEBUG    | __main__:trials:29 - Trial = 13981/30000 | Total reward = 42.07
2022-01-26 14:17:33.409 | DEBUG    | __main__:trials:24 - Trial = 13982/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.410 | DEBUG    | __main__:trials:29 - Trial = 13982/30000 | Total reward = 45.38
2022-01-26 14:17:33.413 | DEBUG    | __main__:trials:24 - Trial = 13983/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.415 | DEBUG    | __main__:trials:29 - Trial = 13983/30000 | Total reward = 46.87
2022-01-26 14:17:33.418 | DEBUG    | __main__:trials:24 - Trial = 13984/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.420 | DEBUG    | __main__:trials:29 - Trial = 13984/30000 | Total reward = 38.91
2022-01-26 14:17:33.423 | DEBUG    | __main__:trials:24 - Trial = 13985/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.425 | DEBUG    | __main__:trials:29 - Trial = 13985/30000 | Total reward = 49.33
2022-01-26 14:17:33.428 | DEBUG    | __main__:trials:24 - Trial = 13986/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.430 | DEBUG    | __main__:trials:29 - Trial = 13986/30000 | Total reward = 44.03
2022-01-26 14:17:33.434 | DEBUG    | __main__:trials:24 - Trial = 13987/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.434 | DEBUG    | __main__:trials:29 - Trial = 13987/30000 | Total reward = 50.95
2022-01-26 14:17:33.438 | DEBUG    | __main__:trials:24 - Trial = 13988/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.440 | DEBUG    | __main__:trials:29 - Trial = 13988/30000 | Total reward = 43.04
2022-01-26 14:17:33.444 | DEBUG    | __main__:trials:24 - Trial = 13989/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.446 | DEBUG    | __main__:trials:29 - Trial = 13989/30000 | Total reward = 45.87
2022-01-26 14:17:33.449 | DEBUG    | __main__:trials:24 - Trial = 13990/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.450 | DEBUG    | __main__:trials:29 - Trial = 13990/30000 | Total reward = 42.00
2022-01-26 14:17:33.454 | DEBUG    | __main__:trials:24 - Trial = 13991/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.456 | DEBUG    | __main__:trials:29 - Trial = 13991/30000 | Total reward = 41.97
2022-01-26 14:17:33.459 | DEBUG    | __main__:trials:24 - Trial = 13992/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.461 | DEBUG    | __main__:trials:29 - Trial = 13992/30000 | Total reward = 43.86
2022-01-26 14:17:33.464 | DEBUG    | __main__:trials:24 - Trial = 13993/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.466 | DEBUG    | __main__:trials:29 - Trial = 13993/30000 | Total reward = 47.05
2022-01-26 14:17:33.470 | DEBUG    | __main__:trials:24 - Trial = 13994/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.470 | DEBUG    | __main__:trials:29 - Trial = 13994/30000 | Total reward = 56.37
2022-01-26 14:17:33.475 | DEBUG    | __main__:trials:24 - Trial = 13995/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.476 | DEBUG    | __main__:trials:29 - Trial = 13995/30000 | Total reward = 45.55
2022-01-26 14:17:33.480 | DEBUG    | __main__:trials:24 - Trial = 13996/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.482 | DEBUG    | __main__:trials:29 - Trial = 13996/30000 | Total reward = 46.31
2022-01-26 14:17:33.486 | DEBUG    | __main__:trials:24 - Trial = 13997/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.487 | DEBUG    | __main__:trials:29 - Trial = 13997/30000 | Total reward = 44.01
2022-01-26 14:17:33.490 | DEBUG    | __main__:trials:24 - Trial = 13998/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.492 | DEBUG    | __main__:trials:29 - Trial = 13998/30000 | Total reward = 48.19
2022-01-26 14:17:33.496 | DEBUG    | __main__:trials:24 - Trial = 13999/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.498 | DEBUG    | __main__:trials:29 - Trial = 13999/30000 | Total reward = 50.45
2022-01-26 14:17:33.501 | DEBUG    | __main__:trials:24 - Trial = 14000/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.503 | DEBUG    | __main__:trials:29 - Trial = 14000/30000 | Total reward = 48.30
2022-01-26 14:17:33.507 | DEBUG    | __main__:trials:24 - Trial = 14001/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.508 | DEBUG    | __main__:trials:29 - Trial = 14001/30000 | Total reward = 40.00
2022-01-26 14:17:33.512 | DEBUG    | __main__:trials:24 - Trial = 14002/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.513 | DEBUG    | __main__:trials:29 - Trial = 14002/30000 | Total reward = 49.95
2022-01-26 14:17:33.517 | DEBUG    | __main__:trials:24 - Trial = 14003/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.519 | DEBUG    | __main__:trials:29 - Trial = 14003/30000 | Total reward = 43.78
2022-01-26 14:17:33.522 | DEBUG    | __main__:trials:24 - Trial = 14004/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.524 | DEBUG    | __main__:trials:29 - Trial = 14004/30000 | Total reward = 41.13
2022-01-26 14:17:33.527 | DEBUG    | __main__:trials:24 - Trial = 14005/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.529 | DEBUG    | __main__:trials:29 - Trial = 14005/30000 | Total reward = 44.78
2022-01-26 14:17:33.532 | DEBUG    | __main__:trials:24 - Trial = 14006/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.534 | DEBUG    | __main__:trials:29 - Trial = 14006/30000 | Total reward = 47.05
2022-01-26 14:17:33.537 | DEBUG    | __main__:trials:24 - Trial = 14007/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.538 | DEBUG    | __main__:trials:29 - Trial = 14007/30000 | Total reward = 46.41
2022-01-26 14:17:33.542 | DEBUG    | __main__:trials:24 - Trial = 14008/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.544 | DEBUG    | __main__:trials:29 - Trial = 14008/30000 | Total reward = 47.05
2022-01-26 14:17:33.547 | DEBUG    | __main__:trials:24 - Trial = 14009/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.549 | DEBUG    | __main__:trials:29 - Trial = 14009/30000 | Total reward = 47.05
2022-01-26 14:17:33.553 | DEBUG    | __main__:trials:24 - Trial = 14010/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.554 | DEBUG    | __main__:trials:29 - Trial = 14010/30000 | Total reward = 46.06
2022-01-26 14:17:33.558 | DEBUG    | __main__:trials:24 - Trial = 14011/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.560 | DEBUG    | __main__:trials:29 - Trial = 14011/30000 | Total reward = 40.77
2022-01-26 14:17:33.563 | DEBUG    | __main__:trials:24 - Trial = 14012/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.565 | DEBUG    | __main__:trials:29 - Trial = 14012/30000 | Total reward = 43.33
2022-01-26 14:17:33.569 | DEBUG    | __main__:trials:24 - Trial = 14013/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.570 | DEBUG    | __main__:trials:29 - Trial = 14013/30000 | Total reward = 46.94
2022-01-26 14:17:33.574 | DEBUG    | __main__:trials:24 - Trial = 14014/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.576 | DEBUG    | __main__:trials:29 - Trial = 14014/30000 | Total reward = 40.92
2022-01-26 14:17:33.579 | DEBUG    | __main__:trials:26 - Trial = 14015/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:33.581 | DEBUG    | __main__:trials:29 - Trial = 14015/30000 | Total reward = 36.86
2022-01-26 14:17:33.584 | DEBUG    | __main__:trials:24 - Trial = 14016/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.586 | DEBUG    | __main__:trials:29 - Trial = 14016/30000 | Total reward = 45.67
2022-01-26 14:17:33.590 | DEBUG    | __main__:trials:24 - Trial = 14017/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.591 | DEBUG    | __main__:trials:29 - Trial = 14017/30000 | Total reward = 46.78
2022-01-26 14:17:33.595 | DEBUG    | __main__:trials:24 - Trial = 14018/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.596 | DEBUG    | __main__:trials:29 - Trial = 14018/30000 | Total reward = 44.07
2022-01-26 14:17:33.599 | DEBUG    | __main__:trials:24 - Trial = 14019/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.601 | DEBUG    | __main__:trials:29 - Trial = 14019/30000 | Total reward = 50.91
2022-01-26 14:17:33.604 | DEBUG    | __main__:trials:24 - Trial = 14020/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.607 | DEBUG    | __main__:trials:29 - Trial = 14020/30000 | Total reward = 44.15
2022-01-26 14:17:33.609 | DEBUG    | __main__:trials:24 - Trial = 14021/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.611 | DEBUG    | __main__:trials:29 - Trial = 14021/30000 | Total reward = 46.57
2022-01-26 14:17:33.614 | DEBUG    | __main__:trials:24 - Trial = 14022/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.616 | DEBUG    | __main__:trials:29 - Trial = 14022/30000 | Total reward = 43.83
2022-01-26 14:17:33.620 | DEBUG    | __main__:trials:24 - Trial = 14023/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.622 | DEBUG    | __main__:trials:29 - Trial = 14023/30000 | Total reward = 41.80
2022-01-26 14:17:33.626 | DEBUG    | __main__:trials:24 - Trial = 14024/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.627 | DEBUG    | __main__:trials:29 - Trial = 14024/30000 | Total reward = 45.10
2022-01-26 14:17:33.631 | DEBUG    | __main__:trials:24 - Trial = 14025/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.633 | DEBUG    | __main__:trials:29 - Trial = 14025/30000 | Total reward = 49.36
2022-01-26 14:17:33.636 | DEBUG    | __main__:trials:24 - Trial = 14026/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.637 | DEBUG    | __main__:trials:29 - Trial = 14026/30000 | Total reward = 49.42
2022-01-26 14:17:33.641 | DEBUG    | __main__:trials:24 - Trial = 14027/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.643 | DEBUG    | __main__:trials:29 - Trial = 14027/30000 | Total reward = 45.93
2022-01-26 14:17:33.647 | DEBUG    | __main__:trials:24 - Trial = 14028/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.648 | DEBUG    | __main__:trials:29 - Trial = 14028/30000 | Total reward = 39.57
2022-01-26 14:17:33.652 | DEBUG    | __main__:trials:24 - Trial = 14029/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.653 | DEBUG    | __main__:trials:29 - Trial = 14029/30000 | Total reward = 39.62
2022-01-26 14:17:33.657 | DEBUG    | __main__:trials:24 - Trial = 14030/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.658 | DEBUG    | __main__:trials:29 - Trial = 14030/30000 | Total reward = 48.04
2022-01-26 14:17:33.662 | DEBUG    | __main__:trials:24 - Trial = 14031/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.664 | DEBUG    | __main__:trials:29 - Trial = 14031/30000 | Total reward = 43.29
2022-01-26 14:17:33.667 | DEBUG    | __main__:trials:24 - Trial = 14032/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.668 | DEBUG    | __main__:trials:29 - Trial = 14032/30000 | Total reward = 47.20
2022-01-26 14:17:33.671 | DEBUG    | __main__:trials:24 - Trial = 14033/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.673 | DEBUG    | __main__:trials:29 - Trial = 14033/30000 | Total reward = 49.81
2022-01-26 14:17:33.676 | DEBUG    | __main__:trials:24 - Trial = 14034/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.678 | DEBUG    | __main__:trials:29 - Trial = 14034/30000 | Total reward = 53.20
2022-01-26 14:17:33.682 | DEBUG    | __main__:trials:24 - Trial = 14035/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.684 | DEBUG    | __main__:trials:29 - Trial = 14035/30000 | Total reward = 46.69
2022-01-26 14:17:33.687 | DEBUG    | __main__:trials:24 - Trial = 14036/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.689 | DEBUG    | __main__:trials:29 - Trial = 14036/30000 | Total reward = 40.10
2022-01-26 14:17:33.692 | DEBUG    | __main__:trials:24 - Trial = 14037/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.694 | DEBUG    | __main__:trials:29 - Trial = 14037/30000 | Total reward = 42.15
2022-01-26 14:17:33.697 | DEBUG    | __main__:trials:24 - Trial = 14038/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.699 | DEBUG    | __main__:trials:29 - Trial = 14038/30000 | Total reward = 40.08
2022-01-26 14:17:33.703 | DEBUG    | __main__:trials:24 - Trial = 14039/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.704 | DEBUG    | __main__:trials:29 - Trial = 14039/30000 | Total reward = 47.63
2022-01-26 14:17:33.708 | DEBUG    | __main__:trials:24 - Trial = 14040/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.709 | DEBUG    | __main__:trials:29 - Trial = 14040/30000 | Total reward = 43.00
2022-01-26 14:17:33.713 | DEBUG    | __main__:trials:24 - Trial = 14041/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.714 | DEBUG    | __main__:trials:29 - Trial = 14041/30000 | Total reward = 47.20
2022-01-26 14:17:33.718 | DEBUG    | __main__:trials:24 - Trial = 14042/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.719 | DEBUG    | __main__:trials:29 - Trial = 14042/30000 | Total reward = 50.80
2022-01-26 14:17:33.723 | DEBUG    | __main__:trials:24 - Trial = 14043/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.725 | DEBUG    | __main__:trials:29 - Trial = 14043/30000 | Total reward = 39.27
2022-01-26 14:17:33.728 | DEBUG    | __main__:trials:26 - Trial = 14044/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:33.730 | DEBUG    | __main__:trials:29 - Trial = 14044/30000 | Total reward = 32.41
2022-01-26 14:17:33.733 | DEBUG    | __main__:trials:24 - Trial = 14045/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.734 | DEBUG    | __main__:trials:29 - Trial = 14045/30000 | Total reward = 51.92
2022-01-26 14:17:33.738 | DEBUG    | __main__:trials:24 - Trial = 14046/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.739 | DEBUG    | __main__:trials:29 - Trial = 14046/30000 | Total reward = 59.38
2022-01-26 14:17:33.744 | DEBUG    | __main__:trials:24 - Trial = 14047/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.746 | DEBUG    | __main__:trials:29 - Trial = 14047/30000 | Total reward = 46.51
2022-01-26 14:17:33.749 | DEBUG    | __main__:trials:24 - Trial = 14048/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.751 | DEBUG    | __main__:trials:29 - Trial = 14048/30000 | Total reward = 47.05
2022-01-26 14:17:33.754 | DEBUG    | __main__:trials:24 - Trial = 14049/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.756 | DEBUG    | __main__:trials:29 - Trial = 14049/30000 | Total reward = 48.12
2022-01-26 14:17:33.759 | DEBUG    | __main__:trials:24 - Trial = 14050/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.760 | DEBUG    | __main__:trials:29 - Trial = 14050/30000 | Total reward = 50.28
2022-01-26 14:17:33.764 | DEBUG    | __main__:trials:24 - Trial = 14051/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.765 | DEBUG    | __main__:trials:29 - Trial = 14051/30000 | Total reward = 51.65
2022-01-26 14:17:33.769 | DEBUG    | __main__:trials:24 - Trial = 14052/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.770 | DEBUG    | __main__:trials:29 - Trial = 14052/30000 | Total reward = 49.11
2022-01-26 14:17:33.774 | DEBUG    | __main__:trials:24 - Trial = 14053/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.775 | DEBUG    | __main__:trials:29 - Trial = 14053/30000 | Total reward = 41.82
2022-01-26 14:17:33.779 | DEBUG    | __main__:trials:24 - Trial = 14054/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.781 | DEBUG    | __main__:trials:29 - Trial = 14054/30000 | Total reward = 48.82
2022-01-26 14:17:33.784 | DEBUG    | __main__:trials:24 - Trial = 14055/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.786 | DEBUG    | __main__:trials:29 - Trial = 14055/30000 | Total reward = 47.83
2022-01-26 14:17:33.789 | DEBUG    | __main__:trials:24 - Trial = 14056/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.790 | DEBUG    | __main__:trials:29 - Trial = 14056/30000 | Total reward = 47.46
2022-01-26 14:17:33.793 | DEBUG    | __main__:trials:24 - Trial = 14057/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.794 | DEBUG    | __main__:trials:29 - Trial = 14057/30000 | Total reward = 48.19
2022-01-26 14:17:33.797 | DEBUG    | __main__:trials:24 - Trial = 14058/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.799 | DEBUG    | __main__:trials:29 - Trial = 14058/30000 | Total reward = 52.03
2022-01-26 14:17:33.803 | DEBUG    | __main__:trials:24 - Trial = 14059/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.804 | DEBUG    | __main__:trials:29 - Trial = 14059/30000 | Total reward = 47.38
2022-01-26 14:17:33.808 | DEBUG    | __main__:trials:24 - Trial = 14060/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.809 | DEBUG    | __main__:trials:29 - Trial = 14060/30000 | Total reward = 52.72
2022-01-26 14:17:33.813 | DEBUG    | __main__:trials:24 - Trial = 14061/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.814 | DEBUG    | __main__:trials:29 - Trial = 14061/30000 | Total reward = 47.09
2022-01-26 14:17:33.818 | DEBUG    | __main__:trials:24 - Trial = 14062/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.819 | DEBUG    | __main__:trials:29 - Trial = 14062/30000 | Total reward = 47.79
2022-01-26 14:17:33.824 | DEBUG    | __main__:trials:24 - Trial = 14063/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.825 | DEBUG    | __main__:trials:29 - Trial = 14063/30000 | Total reward = 56.57
2022-01-26 14:17:33.829 | DEBUG    | __main__:trials:24 - Trial = 14064/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.830 | DEBUG    | __main__:trials:29 - Trial = 14064/30000 | Total reward = 48.98
2022-01-26 14:17:33.833 | DEBUG    | __main__:trials:24 - Trial = 14065/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.834 | DEBUG    | __main__:trials:29 - Trial = 14065/30000 | Total reward = 51.65
2022-01-26 14:17:33.838 | DEBUG    | __main__:trials:24 - Trial = 14066/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.839 | DEBUG    | __main__:trials:29 - Trial = 14066/30000 | Total reward = 49.50
2022-01-26 14:17:33.843 | DEBUG    | __main__:trials:24 - Trial = 14067/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.844 | DEBUG    | __main__:trials:29 - Trial = 14067/30000 | Total reward = 47.10
2022-01-26 14:17:33.848 | DEBUG    | __main__:trials:24 - Trial = 14068/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.850 | DEBUG    | __main__:trials:29 - Trial = 14068/30000 | Total reward = 45.73
2022-01-26 14:17:33.853 | DEBUG    | __main__:trials:24 - Trial = 14069/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.855 | DEBUG    | __main__:trials:29 - Trial = 14069/30000 | Total reward = 44.33
2022-01-26 14:17:33.858 | DEBUG    | __main__:trials:24 - Trial = 14070/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.860 | DEBUG    | __main__:trials:29 - Trial = 14070/30000 | Total reward = 53.42
2022-01-26 14:17:33.863 | DEBUG    | __main__:trials:24 - Trial = 14071/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.864 | DEBUG    | __main__:trials:29 - Trial = 14071/30000 | Total reward = 39.17
2022-01-26 14:17:33.868 | DEBUG    | __main__:trials:24 - Trial = 14072/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.869 | DEBUG    | __main__:trials:29 - Trial = 14072/30000 | Total reward = 36.73
2022-01-26 14:17:33.872 | DEBUG    | __main__:trials:24 - Trial = 14073/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.873 | DEBUG    | __main__:trials:29 - Trial = 14073/30000 | Total reward = 41.58
2022-01-26 14:17:33.877 | DEBUG    | __main__:trials:24 - Trial = 14074/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.877 | DEBUG    | __main__:trials:29 - Trial = 14074/30000 | Total reward = 42.97
2022-01-26 14:17:33.882 | DEBUG    | __main__:trials:24 - Trial = 14075/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.883 | DEBUG    | __main__:trials:29 - Trial = 14075/30000 | Total reward = 30.23
2022-01-26 14:17:33.887 | DEBUG    | __main__:trials:24 - Trial = 14076/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.888 | DEBUG    | __main__:trials:29 - Trial = 14076/30000 | Total reward = 39.93
2022-01-26 14:17:33.893 | DEBUG    | __main__:trials:24 - Trial = 14077/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.894 | DEBUG    | __main__:trials:29 - Trial = 14077/30000 | Total reward = 57.70
2022-01-26 14:17:33.898 | DEBUG    | __main__:trials:24 - Trial = 14078/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.899 | DEBUG    | __main__:trials:29 - Trial = 14078/30000 | Total reward = 47.38
2022-01-26 14:17:33.903 | DEBUG    | __main__:trials:24 - Trial = 14079/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.903 | DEBUG    | __main__:trials:29 - Trial = 14079/30000 | Total reward = 47.05
2022-01-26 14:17:33.908 | DEBUG    | __main__:trials:24 - Trial = 14080/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.908 | DEBUG    | __main__:trials:29 - Trial = 14080/30000 | Total reward = 42.90
2022-01-26 14:17:33.912 | DEBUG    | __main__:trials:24 - Trial = 14081/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.914 | DEBUG    | __main__:trials:29 - Trial = 14081/30000 | Total reward = 35.84
2022-01-26 14:17:33.917 | DEBUG    | __main__:trials:24 - Trial = 14082/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.919 | DEBUG    | __main__:trials:29 - Trial = 14082/30000 | Total reward = 50.12
2022-01-26 14:17:33.923 | DEBUG    | __main__:trials:24 - Trial = 14083/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.924 | DEBUG    | __main__:trials:29 - Trial = 14083/30000 | Total reward = 55.36
2022-01-26 14:17:33.928 | DEBUG    | __main__:trials:24 - Trial = 14084/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.929 | DEBUG    | __main__:trials:29 - Trial = 14084/30000 | Total reward = 45.59
2022-01-26 14:17:33.932 | DEBUG    | __main__:trials:24 - Trial = 14085/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.933 | DEBUG    | __main__:trials:29 - Trial = 14085/30000 | Total reward = 49.01
2022-01-26 14:17:33.937 | DEBUG    | __main__:trials:24 - Trial = 14086/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.937 | DEBUG    | __main__:trials:29 - Trial = 14086/30000 | Total reward = 48.50
2022-01-26 14:17:33.941 | DEBUG    | __main__:trials:24 - Trial = 14087/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.942 | DEBUG    | __main__:trials:29 - Trial = 14087/30000 | Total reward = 45.82
2022-01-26 14:17:33.946 | DEBUG    | __main__:trials:24 - Trial = 14088/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.947 | DEBUG    | __main__:trials:29 - Trial = 14088/30000 | Total reward = 39.72
2022-01-26 14:17:33.951 | DEBUG    | __main__:trials:24 - Trial = 14089/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.952 | DEBUG    | __main__:trials:29 - Trial = 14089/30000 | Total reward = 43.07
2022-01-26 14:17:33.956 | DEBUG    | __main__:trials:24 - Trial = 14090/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.958 | DEBUG    | __main__:trials:29 - Trial = 14090/30000 | Total reward = 30.61
2022-01-26 14:17:33.961 | DEBUG    | __main__:trials:24 - Trial = 14091/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.963 | DEBUG    | __main__:trials:29 - Trial = 14091/30000 | Total reward = 43.96
2022-01-26 14:17:33.967 | DEBUG    | __main__:trials:24 - Trial = 14092/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.968 | DEBUG    | __main__:trials:29 - Trial = 14092/30000 | Total reward = 43.53
2022-01-26 14:17:33.971 | DEBUG    | __main__:trials:24 - Trial = 14093/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.973 | DEBUG    | __main__:trials:29 - Trial = 14093/30000 | Total reward = 48.31
2022-01-26 14:17:33.976 | DEBUG    | __main__:trials:24 - Trial = 14094/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.978 | DEBUG    | __main__:trials:29 - Trial = 14094/30000 | Total reward = 52.25
2022-01-26 14:17:33.982 | DEBUG    | __main__:trials:24 - Trial = 14095/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.982 | DEBUG    | __main__:trials:29 - Trial = 14095/30000 | Total reward = 47.05
2022-01-26 14:17:33.986 | DEBUG    | __main__:trials:24 - Trial = 14096/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.988 | DEBUG    | __main__:trials:29 - Trial = 14096/30000 | Total reward = 47.08
2022-01-26 14:17:33.992 | DEBUG    | __main__:trials:24 - Trial = 14097/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.992 | DEBUG    | __main__:trials:29 - Trial = 14097/30000 | Total reward = 45.98
2022-01-26 14:17:33.997 | DEBUG    | __main__:trials:24 - Trial = 14098/30000 | Max number of steps (20) reached
2022-01-26 14:17:33.999 | DEBUG    | __main__:trials:29 - Trial = 14098/30000 | Total reward = 47.73
2022-01-26 14:17:34.002 | DEBUG    | __main__:trials:24 - Trial = 14099/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.003 | DEBUG    | __main__:trials:29 - Trial = 14099/30000 | Total reward = 45.59
2022-01-26 14:17:34.007 | DEBUG    | __main__:trials:24 - Trial = 14100/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.008 | DEBUG    | __main__:trials:29 - Trial = 14100/30000 | Total reward = 46.61
2022-01-26 14:17:34.012 | DEBUG    | __main__:trials:24 - Trial = 14101/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.013 | DEBUG    | __main__:trials:29 - Trial = 14101/30000 | Total reward = 45.14
2022-01-26 14:17:34.017 | DEBUG    | __main__:trials:24 - Trial = 14102/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.019 | DEBUG    | __main__:trials:29 - Trial = 14102/30000 | Total reward = 47.16
2022-01-26 14:17:34.022 | DEBUG    | __main__:trials:24 - Trial = 14103/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.024 | DEBUG    | __main__:trials:29 - Trial = 14103/30000 | Total reward = 52.04
2022-01-26 14:17:34.027 | DEBUG    | __main__:trials:24 - Trial = 14104/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.029 | DEBUG    | __main__:trials:29 - Trial = 14104/30000 | Total reward = 33.98
2022-01-26 14:17:34.032 | DEBUG    | __main__:trials:24 - Trial = 14105/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.033 | DEBUG    | __main__:trials:29 - Trial = 14105/30000 | Total reward = 40.73
2022-01-26 14:17:34.036 | DEBUG    | __main__:trials:24 - Trial = 14106/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.038 | DEBUG    | __main__:trials:29 - Trial = 14106/30000 | Total reward = 41.09
2022-01-26 14:17:34.041 | DEBUG    | __main__:trials:24 - Trial = 14107/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.042 | DEBUG    | __main__:trials:29 - Trial = 14107/30000 | Total reward = 38.75
2022-01-26 14:17:34.045 | DEBUG    | __main__:trials:24 - Trial = 14108/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.046 | DEBUG    | __main__:trials:29 - Trial = 14108/30000 | Total reward = 39.50
2022-01-26 14:17:34.049 | DEBUG    | __main__:trials:24 - Trial = 14109/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.051 | DEBUG    | __main__:trials:29 - Trial = 14109/30000 | Total reward = 36.60
2022-01-26 14:17:34.054 | DEBUG    | __main__:trials:24 - Trial = 14110/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.055 | DEBUG    | __main__:trials:29 - Trial = 14110/30000 | Total reward = 52.82
2022-01-26 14:17:34.059 | DEBUG    | __main__:trials:24 - Trial = 14111/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.060 | DEBUG    | __main__:trials:29 - Trial = 14111/30000 | Total reward = 35.64
2022-01-26 14:17:34.064 | DEBUG    | __main__:trials:24 - Trial = 14112/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.065 | DEBUG    | __main__:trials:29 - Trial = 14112/30000 | Total reward = 38.14
2022-01-26 14:17:34.069 | DEBUG    | __main__:trials:24 - Trial = 14113/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.071 | DEBUG    | __main__:trials:29 - Trial = 14113/30000 | Total reward = 37.42
2022-01-26 14:17:34.075 | DEBUG    | __main__:trials:24 - Trial = 14114/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.076 | DEBUG    | __main__:trials:29 - Trial = 14114/30000 | Total reward = 37.14
2022-01-26 14:17:34.079 | DEBUG    | __main__:trials:24 - Trial = 14115/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.081 | DEBUG    | __main__:trials:29 - Trial = 14115/30000 | Total reward = 52.05
2022-01-26 14:17:34.084 | DEBUG    | __main__:trials:24 - Trial = 14116/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.086 | DEBUG    | __main__:trials:29 - Trial = 14116/30000 | Total reward = 47.91
2022-01-26 14:17:34.090 | DEBUG    | __main__:trials:24 - Trial = 14117/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.092 | DEBUG    | __main__:trials:29 - Trial = 14117/30000 | Total reward = 44.31
2022-01-26 14:17:34.095 | DEBUG    | __main__:trials:24 - Trial = 14118/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.096 | DEBUG    | __main__:trials:29 - Trial = 14118/30000 | Total reward = 50.58
2022-01-26 14:17:34.100 | DEBUG    | __main__:trials:24 - Trial = 14119/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.102 | DEBUG    | __main__:trials:29 - Trial = 14119/30000 | Total reward = 49.27
2022-01-26 14:17:34.106 | DEBUG    | __main__:trials:24 - Trial = 14120/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.106 | DEBUG    | __main__:trials:29 - Trial = 14120/30000 | Total reward = 44.82
2022-01-26 14:17:34.111 | DEBUG    | __main__:trials:24 - Trial = 14121/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.112 | DEBUG    | __main__:trials:29 - Trial = 14121/30000 | Total reward = 40.23
2022-01-26 14:17:34.116 | DEBUG    | __main__:trials:26 - Trial = 14122/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:34.118 | DEBUG    | __main__:trials:29 - Trial = 14122/30000 | Total reward = 33.94
2022-01-26 14:17:34.121 | DEBUG    | __main__:trials:24 - Trial = 14123/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.123 | DEBUG    | __main__:trials:29 - Trial = 14123/30000 | Total reward = 44.39
2022-01-26 14:17:34.127 | DEBUG    | __main__:trials:24 - Trial = 14124/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.128 | DEBUG    | __main__:trials:29 - Trial = 14124/30000 | Total reward = 41.41
2022-01-26 14:17:34.132 | DEBUG    | __main__:trials:24 - Trial = 14125/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.133 | DEBUG    | __main__:trials:29 - Trial = 14125/30000 | Total reward = 39.77
2022-01-26 14:17:34.137 | DEBUG    | __main__:trials:24 - Trial = 14126/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.138 | DEBUG    | __main__:trials:29 - Trial = 14126/30000 | Total reward = 51.74
2022-01-26 14:17:34.141 | DEBUG    | __main__:trials:24 - Trial = 14127/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.142 | DEBUG    | __main__:trials:29 - Trial = 14127/30000 | Total reward = 65.27
2022-01-26 14:17:34.147 | DEBUG    | __main__:trials:24 - Trial = 14128/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.148 | DEBUG    | __main__:trials:29 - Trial = 14128/30000 | Total reward = 44.38
2022-01-26 14:17:34.151 | DEBUG    | __main__:trials:24 - Trial = 14129/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.152 | DEBUG    | __main__:trials:29 - Trial = 14129/30000 | Total reward = 49.78
2022-01-26 14:17:34.156 | DEBUG    | __main__:trials:24 - Trial = 14130/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.157 | DEBUG    | __main__:trials:29 - Trial = 14130/30000 | Total reward = 57.28
2022-01-26 14:17:34.160 | DEBUG    | __main__:trials:24 - Trial = 14131/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.162 | DEBUG    | __main__:trials:29 - Trial = 14131/30000 | Total reward = 41.91
2022-01-26 14:17:34.165 | DEBUG    | __main__:trials:24 - Trial = 14132/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.166 | DEBUG    | __main__:trials:29 - Trial = 14132/30000 | Total reward = 46.97
2022-01-26 14:17:34.170 | DEBUG    | __main__:trials:24 - Trial = 14133/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.170 | DEBUG    | __main__:trials:29 - Trial = 14133/30000 | Total reward = 52.27
2022-01-26 14:17:34.174 | DEBUG    | __main__:trials:24 - Trial = 14134/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.176 | DEBUG    | __main__:trials:29 - Trial = 14134/30000 | Total reward = 47.60
2022-01-26 14:17:34.180 | DEBUG    | __main__:trials:24 - Trial = 14135/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.182 | DEBUG    | __main__:trials:29 - Trial = 14135/30000 | Total reward = 56.62
2022-01-26 14:17:34.185 | DEBUG    | __main__:trials:24 - Trial = 14136/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.187 | DEBUG    | __main__:trials:29 - Trial = 14136/30000 | Total reward = 48.00
2022-01-26 14:17:34.191 | DEBUG    | __main__:trials:24 - Trial = 14137/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.192 | DEBUG    | __main__:trials:29 - Trial = 14137/30000 | Total reward = 48.15
2022-01-26 14:17:34.196 | DEBUG    | __main__:trials:24 - Trial = 14138/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.197 | DEBUG    | __main__:trials:29 - Trial = 14138/30000 | Total reward = 50.70
2022-01-26 14:17:34.201 | DEBUG    | __main__:trials:24 - Trial = 14139/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.202 | DEBUG    | __main__:trials:29 - Trial = 14139/30000 | Total reward = 37.49
2022-01-26 14:17:34.205 | DEBUG    | __main__:trials:24 - Trial = 14140/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.206 | DEBUG    | __main__:trials:29 - Trial = 14140/30000 | Total reward = 41.73
2022-01-26 14:17:34.210 | DEBUG    | __main__:trials:24 - Trial = 14141/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.211 | DEBUG    | __main__:trials:29 - Trial = 14141/30000 | Total reward = 58.30
2022-01-26 14:17:34.215 | DEBUG    | __main__:trials:24 - Trial = 14142/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.216 | DEBUG    | __main__:trials:29 - Trial = 14142/30000 | Total reward = 37.21
2022-01-26 14:17:34.219 | DEBUG    | __main__:trials:24 - Trial = 14143/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.221 | DEBUG    | __main__:trials:29 - Trial = 14143/30000 | Total reward = 50.56
2022-01-26 14:17:34.224 | DEBUG    | __main__:trials:26 - Trial = 14144/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:34.225 | DEBUG    | __main__:trials:29 - Trial = 14144/30000 | Total reward = 26.77
2022-01-26 14:17:34.228 | DEBUG    | __main__:trials:24 - Trial = 14145/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.230 | DEBUG    | __main__:trials:29 - Trial = 14145/30000 | Total reward = 61.53
2022-01-26 14:17:34.233 | DEBUG    | __main__:trials:24 - Trial = 14146/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.235 | DEBUG    | __main__:trials:29 - Trial = 14146/30000 | Total reward = 50.05
2022-01-26 14:17:34.237 | DEBUG    | __main__:trials:24 - Trial = 14147/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.238 | DEBUG    | __main__:trials:29 - Trial = 14147/30000 | Total reward = 56.82
2022-01-26 14:17:34.242 | DEBUG    | __main__:trials:24 - Trial = 14148/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.243 | DEBUG    | __main__:trials:29 - Trial = 14148/30000 | Total reward = 38.27
2022-01-26 14:17:34.246 | DEBUG    | __main__:trials:24 - Trial = 14149/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.248 | DEBUG    | __main__:trials:29 - Trial = 14149/30000 | Total reward = 59.74
2022-01-26 14:17:34.251 | DEBUG    | __main__:trials:24 - Trial = 14150/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.253 | DEBUG    | __main__:trials:29 - Trial = 14150/30000 | Total reward = 41.52
2022-01-26 14:17:34.256 | DEBUG    | __main__:trials:24 - Trial = 14151/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.257 | DEBUG    | __main__:trials:29 - Trial = 14151/30000 | Total reward = 44.98
2022-01-26 14:17:34.260 | DEBUG    | __main__:trials:24 - Trial = 14152/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.262 | DEBUG    | __main__:trials:29 - Trial = 14152/30000 | Total reward = 40.81
2022-01-26 14:17:34.266 | DEBUG    | __main__:trials:24 - Trial = 14153/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.267 | DEBUG    | __main__:trials:29 - Trial = 14153/30000 | Total reward = 51.25
2022-01-26 14:17:34.271 | DEBUG    | __main__:trials:24 - Trial = 14154/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.272 | DEBUG    | __main__:trials:29 - Trial = 14154/30000 | Total reward = 47.53
2022-01-26 14:17:34.276 | DEBUG    | __main__:trials:24 - Trial = 14155/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.276 | DEBUG    | __main__:trials:29 - Trial = 14155/30000 | Total reward = 39.55
2022-01-26 14:17:34.281 | DEBUG    | __main__:trials:24 - Trial = 14156/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.282 | DEBUG    | __main__:trials:29 - Trial = 14156/30000 | Total reward = 46.06
2022-01-26 14:17:34.285 | DEBUG    | __main__:trials:24 - Trial = 14157/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.286 | DEBUG    | __main__:trials:29 - Trial = 14157/30000 | Total reward = 38.84
2022-01-26 14:17:34.289 | DEBUG    | __main__:trials:24 - Trial = 14158/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.291 | DEBUG    | __main__:trials:29 - Trial = 14158/30000 | Total reward = 42.39
2022-01-26 14:17:34.294 | DEBUG    | __main__:trials:24 - Trial = 14159/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.295 | DEBUG    | __main__:trials:29 - Trial = 14159/30000 | Total reward = 47.84
2022-01-26 14:17:34.298 | DEBUG    | __main__:trials:24 - Trial = 14160/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.300 | DEBUG    | __main__:trials:29 - Trial = 14160/30000 | Total reward = 47.27
2022-01-26 14:17:34.303 | DEBUG    | __main__:trials:24 - Trial = 14161/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.305 | DEBUG    | __main__:trials:29 - Trial = 14161/30000 | Total reward = 48.96
2022-01-26 14:17:34.308 | DEBUG    | __main__:trials:24 - Trial = 14162/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.309 | DEBUG    | __main__:trials:29 - Trial = 14162/30000 | Total reward = 51.35
2022-01-26 14:17:34.313 | DEBUG    | __main__:trials:24 - Trial = 14163/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.314 | DEBUG    | __main__:trials:29 - Trial = 14163/30000 | Total reward = 64.57
2022-01-26 14:17:34.319 | DEBUG    | __main__:trials:24 - Trial = 14164/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.319 | DEBUG    | __main__:trials:29 - Trial = 14164/30000 | Total reward = 50.53
2022-01-26 14:17:34.324 | DEBUG    | __main__:trials:24 - Trial = 14165/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.324 | DEBUG    | __main__:trials:29 - Trial = 14165/30000 | Total reward = 40.55
2022-01-26 14:17:34.328 | DEBUG    | __main__:trials:24 - Trial = 14166/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.329 | DEBUG    | __main__:trials:29 - Trial = 14166/30000 | Total reward = 62.71
2022-01-26 14:17:34.334 | DEBUG    | __main__:trials:24 - Trial = 14167/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.335 | DEBUG    | __main__:trials:29 - Trial = 14167/30000 | Total reward = 47.73
2022-01-26 14:17:34.339 | DEBUG    | __main__:trials:24 - Trial = 14168/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.341 | DEBUG    | __main__:trials:29 - Trial = 14168/30000 | Total reward = 46.54
2022-01-26 14:17:34.344 | DEBUG    | __main__:trials:24 - Trial = 14169/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.346 | DEBUG    | __main__:trials:29 - Trial = 14169/30000 | Total reward = 49.89
2022-01-26 14:17:34.349 | DEBUG    | __main__:trials:24 - Trial = 14170/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.350 | DEBUG    | __main__:trials:29 - Trial = 14170/30000 | Total reward = 51.38
2022-01-26 14:17:34.355 | DEBUG    | __main__:trials:24 - Trial = 14171/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.356 | DEBUG    | __main__:trials:29 - Trial = 14171/30000 | Total reward = 48.72
2022-01-26 14:17:34.360 | DEBUG    | __main__:trials:24 - Trial = 14172/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.360 | DEBUG    | __main__:trials:29 - Trial = 14172/30000 | Total reward = 58.17
2022-01-26 14:17:34.365 | DEBUG    | __main__:trials:24 - Trial = 14173/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.366 | DEBUG    | __main__:trials:29 - Trial = 14173/30000 | Total reward = 51.30
2022-01-26 14:17:34.370 | DEBUG    | __main__:trials:24 - Trial = 14174/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.371 | DEBUG    | __main__:trials:29 - Trial = 14174/30000 | Total reward = 55.07
2022-01-26 14:17:34.375 | DEBUG    | __main__:trials:24 - Trial = 14175/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.376 | DEBUG    | __main__:trials:29 - Trial = 14175/30000 | Total reward = 53.36
2022-01-26 14:17:34.380 | DEBUG    | __main__:trials:24 - Trial = 14176/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.381 | DEBUG    | __main__:trials:29 - Trial = 14176/30000 | Total reward = 53.36
2022-01-26 14:17:34.386 | DEBUG    | __main__:trials:24 - Trial = 14177/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.387 | DEBUG    | __main__:trials:29 - Trial = 14177/30000 | Total reward = 44.57
2022-01-26 14:17:34.391 | DEBUG    | __main__:trials:24 - Trial = 14178/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.392 | DEBUG    | __main__:trials:29 - Trial = 14178/30000 | Total reward = 40.37
2022-01-26 14:17:34.395 | DEBUG    | __main__:trials:24 - Trial = 14179/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.397 | DEBUG    | __main__:trials:29 - Trial = 14179/30000 | Total reward = 53.56
2022-01-26 14:17:34.401 | DEBUG    | __main__:trials:24 - Trial = 14180/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.401 | DEBUG    | __main__:trials:29 - Trial = 14180/30000 | Total reward = 52.82
2022-01-26 14:17:34.405 | DEBUG    | __main__:trials:24 - Trial = 14181/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.406 | DEBUG    | __main__:trials:29 - Trial = 14181/30000 | Total reward = 61.89
2022-01-26 14:17:34.410 | DEBUG    | __main__:trials:24 - Trial = 14182/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.411 | DEBUG    | __main__:trials:29 - Trial = 14182/30000 | Total reward = 36.53
2022-01-26 14:17:34.416 | DEBUG    | __main__:trials:24 - Trial = 14183/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.417 | DEBUG    | __main__:trials:29 - Trial = 14183/30000 | Total reward = 42.18
2022-01-26 14:17:34.421 | DEBUG    | __main__:trials:24 - Trial = 14184/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.422 | DEBUG    | __main__:trials:29 - Trial = 14184/30000 | Total reward = 41.67
2022-01-26 14:17:34.426 | DEBUG    | __main__:trials:24 - Trial = 14185/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.428 | DEBUG    | __main__:trials:29 - Trial = 14185/30000 | Total reward = 38.41
2022-01-26 14:17:34.431 | DEBUG    | __main__:trials:24 - Trial = 14186/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.432 | DEBUG    | __main__:trials:29 - Trial = 14186/30000 | Total reward = 44.71
2022-01-26 14:17:34.436 | DEBUG    | __main__:trials:24 - Trial = 14187/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.438 | DEBUG    | __main__:trials:29 - Trial = 14187/30000 | Total reward = 37.29
2022-01-26 14:17:34.441 | DEBUG    | __main__:trials:24 - Trial = 14188/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.443 | DEBUG    | __main__:trials:29 - Trial = 14188/30000 | Total reward = 36.58
2022-01-26 14:17:34.446 | DEBUG    | __main__:trials:24 - Trial = 14189/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.447 | DEBUG    | __main__:trials:29 - Trial = 14189/30000 | Total reward = 39.44
2022-01-26 14:17:34.451 | DEBUG    | __main__:trials:24 - Trial = 14190/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.452 | DEBUG    | __main__:trials:29 - Trial = 14190/30000 | Total reward = 39.44
2022-01-26 14:17:34.455 | DEBUG    | __main__:trials:24 - Trial = 14191/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.457 | DEBUG    | __main__:trials:29 - Trial = 14191/30000 | Total reward = 37.78
2022-01-26 14:17:34.460 | DEBUG    | __main__:trials:24 - Trial = 14192/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.462 | DEBUG    | __main__:trials:29 - Trial = 14192/30000 | Total reward = 48.79
2022-01-26 14:17:34.465 | DEBUG    | __main__:trials:24 - Trial = 14193/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.466 | DEBUG    | __main__:trials:29 - Trial = 14193/30000 | Total reward = 38.99
2022-01-26 14:17:34.470 | DEBUG    | __main__:trials:24 - Trial = 14194/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.471 | DEBUG    | __main__:trials:29 - Trial = 14194/30000 | Total reward = 32.17
2022-01-26 14:17:34.475 | DEBUG    | __main__:trials:24 - Trial = 14195/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.476 | DEBUG    | __main__:trials:29 - Trial = 14195/30000 | Total reward = 38.99
2022-01-26 14:17:34.480 | DEBUG    | __main__:trials:24 - Trial = 14196/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.482 | DEBUG    | __main__:trials:29 - Trial = 14196/30000 | Total reward = 39.67
2022-01-26 14:17:34.486 | DEBUG    | __main__:trials:24 - Trial = 14197/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.487 | DEBUG    | __main__:trials:29 - Trial = 14197/30000 | Total reward = 45.85
2022-01-26 14:17:34.491 | DEBUG    | __main__:trials:24 - Trial = 14198/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.492 | DEBUG    | __main__:trials:29 - Trial = 14198/30000 | Total reward = 46.16
2022-01-26 14:17:34.495 | DEBUG    | __main__:trials:24 - Trial = 14199/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.497 | DEBUG    | __main__:trials:29 - Trial = 14199/30000 | Total reward = 47.05
2022-01-26 14:17:34.500 | DEBUG    | __main__:trials:24 - Trial = 14200/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.502 | DEBUG    | __main__:trials:29 - Trial = 14200/30000 | Total reward = 45.42
2022-01-26 14:17:34.505 | DEBUG    | __main__:trials:24 - Trial = 14201/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.506 | DEBUG    | __main__:trials:29 - Trial = 14201/30000 | Total reward = 49.46
2022-01-26 14:17:34.509 | DEBUG    | __main__:trials:24 - Trial = 14202/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.511 | DEBUG    | __main__:trials:29 - Trial = 14202/30000 | Total reward = 44.48
2022-01-26 14:17:34.514 | DEBUG    | __main__:trials:24 - Trial = 14203/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.515 | DEBUG    | __main__:trials:29 - Trial = 14203/30000 | Total reward = 54.53
2022-01-26 14:17:34.519 | DEBUG    | __main__:trials:24 - Trial = 14204/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.520 | DEBUG    | __main__:trials:29 - Trial = 14204/30000 | Total reward = 50.84
2022-01-26 14:17:34.523 | DEBUG    | __main__:trials:26 - Trial = 14205/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:34.524 | DEBUG    | __main__:trials:29 - Trial = 14205/30000 | Total reward = 18.80
2022-01-26 14:17:34.528 | DEBUG    | __main__:trials:24 - Trial = 14206/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.529 | DEBUG    | __main__:trials:29 - Trial = 14206/30000 | Total reward = 38.67
2022-01-26 14:17:34.533 | DEBUG    | __main__:trials:24 - Trial = 14207/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.533 | DEBUG    | __main__:trials:29 - Trial = 14207/30000 | Total reward = 48.04
2022-01-26 14:17:34.537 | DEBUG    | __main__:trials:24 - Trial = 14208/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.538 | DEBUG    | __main__:trials:29 - Trial = 14208/30000 | Total reward = 62.22
2022-01-26 14:17:34.542 | DEBUG    | __main__:trials:24 - Trial = 14209/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.543 | DEBUG    | __main__:trials:29 - Trial = 14209/30000 | Total reward = 35.13
2022-01-26 14:17:34.546 | DEBUG    | __main__:trials:24 - Trial = 14210/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.548 | DEBUG    | __main__:trials:29 - Trial = 14210/30000 | Total reward = 36.56
2022-01-26 14:17:34.551 | DEBUG    | __main__:trials:24 - Trial = 14211/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.553 | DEBUG    | __main__:trials:29 - Trial = 14211/30000 | Total reward = 48.89
2022-01-26 14:17:34.556 | DEBUG    | __main__:trials:24 - Trial = 14212/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.558 | DEBUG    | __main__:trials:29 - Trial = 14212/30000 | Total reward = 24.85
2022-01-26 14:17:34.562 | DEBUG    | __main__:trials:24 - Trial = 14213/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.563 | DEBUG    | __main__:trials:29 - Trial = 14213/30000 | Total reward = 43.92
2022-01-26 14:17:34.567 | DEBUG    | __main__:trials:24 - Trial = 14214/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.568 | DEBUG    | __main__:trials:29 - Trial = 14214/30000 | Total reward = 46.36
2022-01-26 14:17:34.572 | DEBUG    | __main__:trials:24 - Trial = 14215/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.573 | DEBUG    | __main__:trials:29 - Trial = 14215/30000 | Total reward = 35.61
2022-01-26 14:17:34.576 | DEBUG    | __main__:trials:24 - Trial = 14216/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.577 | DEBUG    | __main__:trials:29 - Trial = 14216/30000 | Total reward = 37.83
2022-01-26 14:17:34.581 | DEBUG    | __main__:trials:24 - Trial = 14217/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.581 | DEBUG    | __main__:trials:29 - Trial = 14217/30000 | Total reward = 33.18
2022-01-26 14:17:34.585 | DEBUG    | __main__:trials:24 - Trial = 14218/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.586 | DEBUG    | __main__:trials:29 - Trial = 14218/30000 | Total reward = 44.24
2022-01-26 14:17:34.589 | DEBUG    | __main__:trials:24 - Trial = 14219/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.590 | DEBUG    | __main__:trials:29 - Trial = 14219/30000 | Total reward = 38.92
2022-01-26 14:17:34.593 | DEBUG    | __main__:trials:24 - Trial = 14220/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.595 | DEBUG    | __main__:trials:29 - Trial = 14220/30000 | Total reward = 38.68
2022-01-26 14:17:34.598 | DEBUG    | __main__:trials:24 - Trial = 14221/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.599 | DEBUG    | __main__:trials:29 - Trial = 14221/30000 | Total reward = 38.43
2022-01-26 14:17:34.602 | DEBUG    | __main__:trials:24 - Trial = 14222/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.604 | DEBUG    | __main__:trials:29 - Trial = 14222/30000 | Total reward = 33.71
2022-01-26 14:17:34.608 | DEBUG    | __main__:trials:24 - Trial = 14223/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.609 | DEBUG    | __main__:trials:29 - Trial = 14223/30000 | Total reward = 40.93
2022-01-26 14:17:34.613 | DEBUG    | __main__:trials:24 - Trial = 14224/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.614 | DEBUG    | __main__:trials:29 - Trial = 14224/30000 | Total reward = 45.94
2022-01-26 14:17:34.618 | DEBUG    | __main__:trials:24 - Trial = 14225/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.619 | DEBUG    | __main__:trials:29 - Trial = 14225/30000 | Total reward = 46.20
2022-01-26 14:17:34.623 | DEBUG    | __main__:trials:24 - Trial = 14226/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.625 | DEBUG    | __main__:trials:29 - Trial = 14226/30000 | Total reward = 39.86
2022-01-26 14:17:34.628 | DEBUG    | __main__:trials:24 - Trial = 14227/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.629 | DEBUG    | __main__:trials:29 - Trial = 14227/30000 | Total reward = 39.31
2022-01-26 14:17:34.633 | DEBUG    | __main__:trials:24 - Trial = 14228/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.634 | DEBUG    | __main__:trials:29 - Trial = 14228/30000 | Total reward = 41.35
2022-01-26 14:17:34.637 | DEBUG    | __main__:trials:24 - Trial = 14229/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.638 | DEBUG    | __main__:trials:29 - Trial = 14229/30000 | Total reward = 38.38
2022-01-26 14:17:34.641 | DEBUG    | __main__:trials:24 - Trial = 14230/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.643 | DEBUG    | __main__:trials:29 - Trial = 14230/30000 | Total reward = 40.81
2022-01-26 14:17:34.645 | DEBUG    | __main__:trials:24 - Trial = 14231/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.647 | DEBUG    | __main__:trials:29 - Trial = 14231/30000 | Total reward = 66.09
2022-01-26 14:17:34.650 | DEBUG    | __main__:trials:24 - Trial = 14232/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.651 | DEBUG    | __main__:trials:29 - Trial = 14232/30000 | Total reward = 53.61
2022-01-26 14:17:34.655 | DEBUG    | __main__:trials:24 - Trial = 14233/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.657 | DEBUG    | __main__:trials:29 - Trial = 14233/30000 | Total reward = 33.77
2022-01-26 14:17:34.660 | DEBUG    | __main__:trials:24 - Trial = 14234/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.661 | DEBUG    | __main__:trials:29 - Trial = 14234/30000 | Total reward = 65.86
2022-01-26 14:17:34.665 | DEBUG    | __main__:trials:24 - Trial = 14235/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.666 | DEBUG    | __main__:trials:29 - Trial = 14235/30000 | Total reward = 45.53
2022-01-26 14:17:34.671 | DEBUG    | __main__:trials:24 - Trial = 14236/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.672 | DEBUG    | __main__:trials:29 - Trial = 14236/30000 | Total reward = 57.11
2022-01-26 14:17:34.676 | DEBUG    | __main__:trials:24 - Trial = 14237/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.678 | DEBUG    | __main__:trials:29 - Trial = 14237/30000 | Total reward = 49.43
2022-01-26 14:17:34.681 | DEBUG    | __main__:trials:24 - Trial = 14238/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.683 | DEBUG    | __main__:trials:29 - Trial = 14238/30000 | Total reward = 42.54
2022-01-26 14:17:34.686 | DEBUG    | __main__:trials:24 - Trial = 14239/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.687 | DEBUG    | __main__:trials:29 - Trial = 14239/30000 | Total reward = 46.73
2022-01-26 14:17:34.691 | DEBUG    | __main__:trials:24 - Trial = 14240/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.692 | DEBUG    | __main__:trials:29 - Trial = 14240/30000 | Total reward = 57.60
2022-01-26 14:17:34.695 | DEBUG    | __main__:trials:24 - Trial = 14241/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.697 | DEBUG    | __main__:trials:29 - Trial = 14241/30000 | Total reward = 50.07
2022-01-26 14:17:34.700 | DEBUG    | __main__:trials:24 - Trial = 14242/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.702 | DEBUG    | __main__:trials:29 - Trial = 14242/30000 | Total reward = 53.33
2022-01-26 14:17:34.705 | DEBUG    | __main__:trials:24 - Trial = 14243/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.706 | DEBUG    | __main__:trials:29 - Trial = 14243/30000 | Total reward = 53.33
2022-01-26 14:17:34.711 | DEBUG    | __main__:trials:24 - Trial = 14244/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.712 | DEBUG    | __main__:trials:29 - Trial = 14244/30000 | Total reward = 52.74
2022-01-26 14:17:34.716 | DEBUG    | __main__:trials:24 - Trial = 14245/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.717 | DEBUG    | __main__:trials:29 - Trial = 14245/30000 | Total reward = 60.59
2022-01-26 14:17:34.722 | DEBUG    | __main__:trials:24 - Trial = 14246/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.723 | DEBUG    | __main__:trials:29 - Trial = 14246/30000 | Total reward = 54.16
2022-01-26 14:17:34.727 | DEBUG    | __main__:trials:24 - Trial = 14247/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.728 | DEBUG    | __main__:trials:29 - Trial = 14247/30000 | Total reward = 62.13
2022-01-26 14:17:34.733 | DEBUG    | __main__:trials:24 - Trial = 14248/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.733 | DEBUG    | __main__:trials:29 - Trial = 14248/30000 | Total reward = 54.26
2022-01-26 14:17:34.738 | DEBUG    | __main__:trials:24 - Trial = 14249/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.739 | DEBUG    | __main__:trials:29 - Trial = 14249/30000 | Total reward = 54.98
2022-01-26 14:17:34.742 | DEBUG    | __main__:trials:24 - Trial = 14250/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.744 | DEBUG    | __main__:trials:29 - Trial = 14250/30000 | Total reward = 57.57
2022-01-26 14:17:34.748 | DEBUG    | __main__:trials:24 - Trial = 14251/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.749 | DEBUG    | __main__:trials:29 - Trial = 14251/30000 | Total reward = 45.05
2022-01-26 14:17:34.753 | DEBUG    | __main__:trials:26 - Trial = 14252/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:34.754 | DEBUG    | __main__:trials:29 - Trial = 14252/30000 | Total reward = 23.22
2022-01-26 14:17:34.758 | DEBUG    | __main__:trials:24 - Trial = 14253/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.759 | DEBUG    | __main__:trials:29 - Trial = 14253/30000 | Total reward = 36.95
2022-01-26 14:17:34.764 | DEBUG    | __main__:trials:24 - Trial = 14254/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.765 | DEBUG    | __main__:trials:29 - Trial = 14254/30000 | Total reward = 40.16
2022-01-26 14:17:34.768 | DEBUG    | __main__:trials:24 - Trial = 14255/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.770 | DEBUG    | __main__:trials:29 - Trial = 14255/30000 | Total reward = 45.93
2022-01-26 14:17:34.773 | DEBUG    | __main__:trials:24 - Trial = 14256/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.774 | DEBUG    | __main__:trials:29 - Trial = 14256/30000 | Total reward = 34.10
2022-01-26 14:17:34.777 | DEBUG    | __main__:trials:24 - Trial = 14257/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.779 | DEBUG    | __main__:trials:29 - Trial = 14257/30000 | Total reward = 62.21
2022-01-26 14:17:34.782 | DEBUG    | __main__:trials:24 - Trial = 14258/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.784 | DEBUG    | __main__:trials:29 - Trial = 14258/30000 | Total reward = 47.48
2022-01-26 14:17:34.788 | DEBUG    | __main__:trials:24 - Trial = 14259/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.789 | DEBUG    | __main__:trials:29 - Trial = 14259/30000 | Total reward = 47.20
2022-01-26 14:17:34.793 | DEBUG    | __main__:trials:24 - Trial = 14260/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.794 | DEBUG    | __main__:trials:29 - Trial = 14260/30000 | Total reward = 47.20
2022-01-26 14:17:34.798 | DEBUG    | __main__:trials:24 - Trial = 14261/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.800 | DEBUG    | __main__:trials:29 - Trial = 14261/30000 | Total reward = 42.48
2022-01-26 14:17:34.803 | DEBUG    | __main__:trials:24 - Trial = 14262/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.804 | DEBUG    | __main__:trials:29 - Trial = 14262/30000 | Total reward = 46.00
2022-01-26 14:17:34.807 | DEBUG    | __main__:trials:24 - Trial = 14263/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.807 | DEBUG    | __main__:trials:29 - Trial = 14263/30000 | Total reward = 35.22
2022-01-26 14:17:34.811 | DEBUG    | __main__:trials:24 - Trial = 14264/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.812 | DEBUG    | __main__:trials:29 - Trial = 14264/30000 | Total reward = 47.20
2022-01-26 14:17:34.815 | DEBUG    | __main__:trials:24 - Trial = 14265/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.817 | DEBUG    | __main__:trials:29 - Trial = 14265/30000 | Total reward = 25.75
2022-01-26 14:17:34.820 | DEBUG    | __main__:trials:24 - Trial = 14266/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.822 | DEBUG    | __main__:trials:29 - Trial = 14266/30000 | Total reward = 47.68
2022-01-26 14:17:34.826 | DEBUG    | __main__:trials:24 - Trial = 14267/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.826 | DEBUG    | __main__:trials:29 - Trial = 14267/30000 | Total reward = 54.50
2022-01-26 14:17:34.831 | DEBUG    | __main__:trials:24 - Trial = 14268/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.832 | DEBUG    | __main__:trials:29 - Trial = 14268/30000 | Total reward = 46.63
2022-01-26 14:17:34.836 | DEBUG    | __main__:trials:24 - Trial = 14269/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.838 | DEBUG    | __main__:trials:29 - Trial = 14269/30000 | Total reward = 43.97
2022-01-26 14:17:34.842 | DEBUG    | __main__:trials:24 - Trial = 14270/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.843 | DEBUG    | __main__:trials:29 - Trial = 14270/30000 | Total reward = 48.28
2022-01-26 14:17:34.847 | DEBUG    | __main__:trials:24 - Trial = 14271/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.848 | DEBUG    | __main__:trials:29 - Trial = 14271/30000 | Total reward = 66.47
2022-01-26 14:17:34.852 | DEBUG    | __main__:trials:24 - Trial = 14272/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.853 | DEBUG    | __main__:trials:29 - Trial = 14272/30000 | Total reward = 64.62
2022-01-26 14:17:34.856 | DEBUG    | __main__:trials:24 - Trial = 14273/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.858 | DEBUG    | __main__:trials:29 - Trial = 14273/30000 | Total reward = 47.66
2022-01-26 14:17:34.861 | DEBUG    | __main__:trials:24 - Trial = 14274/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.862 | DEBUG    | __main__:trials:29 - Trial = 14274/30000 | Total reward = 40.82
2022-01-26 14:17:34.865 | DEBUG    | __main__:trials:24 - Trial = 14275/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.866 | DEBUG    | __main__:trials:29 - Trial = 14275/30000 | Total reward = 46.93
2022-01-26 14:17:34.869 | DEBUG    | __main__:trials:24 - Trial = 14276/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.871 | DEBUG    | __main__:trials:29 - Trial = 14276/30000 | Total reward = 42.83
2022-01-26 14:17:34.874 | DEBUG    | __main__:trials:24 - Trial = 14277/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.875 | DEBUG    | __main__:trials:29 - Trial = 14277/30000 | Total reward = 49.27
2022-01-26 14:17:34.879 | DEBUG    | __main__:trials:24 - Trial = 14278/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.881 | DEBUG    | __main__:trials:29 - Trial = 14278/30000 | Total reward = 50.39
2022-01-26 14:17:34.884 | DEBUG    | __main__:trials:24 - Trial = 14279/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.885 | DEBUG    | __main__:trials:29 - Trial = 14279/30000 | Total reward = 42.84
2022-01-26 14:17:34.888 | DEBUG    | __main__:trials:24 - Trial = 14280/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.889 | DEBUG    | __main__:trials:29 - Trial = 14280/30000 | Total reward = 31.83
2022-01-26 14:17:34.892 | DEBUG    | __main__:trials:24 - Trial = 14281/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.893 | DEBUG    | __main__:trials:29 - Trial = 14281/30000 | Total reward = 63.05
2022-01-26 14:17:34.897 | DEBUG    | __main__:trials:24 - Trial = 14282/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.897 | DEBUG    | __main__:trials:29 - Trial = 14282/30000 | Total reward = 65.17
2022-01-26 14:17:34.901 | DEBUG    | __main__:trials:24 - Trial = 14283/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.901 | DEBUG    | __main__:trials:29 - Trial = 14283/30000 | Total reward = 47.05
2022-01-26 14:17:34.905 | DEBUG    | __main__:trials:24 - Trial = 14284/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.906 | DEBUG    | __main__:trials:29 - Trial = 14284/30000 | Total reward = 42.64
2022-01-26 14:17:34.909 | DEBUG    | __main__:trials:24 - Trial = 14285/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.910 | DEBUG    | __main__:trials:29 - Trial = 14285/30000 | Total reward = 45.80
2022-01-26 14:17:34.912 | DEBUG    | __main__:trials:26 - Trial = 14286/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:34.913 | DEBUG    | __main__:trials:29 - Trial = 14286/30000 | Total reward = 19.80
2022-01-26 14:17:34.918 | DEBUG    | __main__:trials:24 - Trial = 14287/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.919 | DEBUG    | __main__:trials:29 - Trial = 14287/30000 | Total reward = 45.83
2022-01-26 14:17:34.923 | DEBUG    | __main__:trials:24 - Trial = 14288/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.924 | DEBUG    | __main__:trials:29 - Trial = 14288/30000 | Total reward = 60.16
2022-01-26 14:17:34.928 | DEBUG    | __main__:trials:24 - Trial = 14289/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.929 | DEBUG    | __main__:trials:29 - Trial = 14289/30000 | Total reward = 38.75
2022-01-26 14:17:34.933 | DEBUG    | __main__:trials:24 - Trial = 14290/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.933 | DEBUG    | __main__:trials:29 - Trial = 14290/30000 | Total reward = 44.33
2022-01-26 14:17:34.938 | DEBUG    | __main__:trials:24 - Trial = 14291/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.938 | DEBUG    | __main__:trials:29 - Trial = 14291/30000 | Total reward = 44.00
2022-01-26 14:17:34.943 | DEBUG    | __main__:trials:24 - Trial = 14292/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.944 | DEBUG    | __main__:trials:29 - Trial = 14292/30000 | Total reward = 40.45
2022-01-26 14:17:34.948 | DEBUG    | __main__:trials:24 - Trial = 14293/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.949 | DEBUG    | __main__:trials:29 - Trial = 14293/30000 | Total reward = 44.91
2022-01-26 14:17:34.953 | DEBUG    | __main__:trials:24 - Trial = 14294/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.955 | DEBUG    | __main__:trials:29 - Trial = 14294/30000 | Total reward = 48.57
2022-01-26 14:17:34.958 | DEBUG    | __main__:trials:24 - Trial = 14295/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.960 | DEBUG    | __main__:trials:29 - Trial = 14295/30000 | Total reward = 48.54
2022-01-26 14:17:34.963 | DEBUG    | __main__:trials:24 - Trial = 14296/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.964 | DEBUG    | __main__:trials:29 - Trial = 14296/30000 | Total reward = 45.91
2022-01-26 14:17:34.968 | DEBUG    | __main__:trials:24 - Trial = 14297/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.970 | DEBUG    | __main__:trials:29 - Trial = 14297/30000 | Total reward = 44.05
2022-01-26 14:17:34.973 | DEBUG    | __main__:trials:24 - Trial = 14298/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.975 | DEBUG    | __main__:trials:29 - Trial = 14298/30000 | Total reward = 34.80
2022-01-26 14:17:34.978 | DEBUG    | __main__:trials:24 - Trial = 14299/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.980 | DEBUG    | __main__:trials:29 - Trial = 14299/30000 | Total reward = 42.20
2022-01-26 14:17:34.984 | DEBUG    | __main__:trials:24 - Trial = 14300/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.985 | DEBUG    | __main__:trials:29 - Trial = 14300/30000 | Total reward = 44.06
2022-01-26 14:17:34.988 | DEBUG    | __main__:trials:24 - Trial = 14301/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.990 | DEBUG    | __main__:trials:29 - Trial = 14301/30000 | Total reward = 53.48
2022-01-26 14:17:34.993 | DEBUG    | __main__:trials:26 - Trial = 14302/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:34.994 | DEBUG    | __main__:trials:29 - Trial = 14302/30000 | Total reward = 17.06
2022-01-26 14:17:34.998 | DEBUG    | __main__:trials:24 - Trial = 14303/30000 | Max number of steps (20) reached
2022-01-26 14:17:34.999 | DEBUG    | __main__:trials:29 - Trial = 14303/30000 | Total reward = 36.06
2022-01-26 14:17:35.004 | DEBUG    | __main__:trials:24 - Trial = 14304/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.004 | DEBUG    | __main__:trials:29 - Trial = 14304/30000 | Total reward = 49.25
2022-01-26 14:17:35.009 | DEBUG    | __main__:trials:24 - Trial = 14305/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.011 | DEBUG    | __main__:trials:29 - Trial = 14305/30000 | Total reward = 45.28
2022-01-26 14:17:35.014 | DEBUG    | __main__:trials:24 - Trial = 14306/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.016 | DEBUG    | __main__:trials:29 - Trial = 14306/30000 | Total reward = 61.68
2022-01-26 14:17:35.019 | DEBUG    | __main__:trials:24 - Trial = 14307/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.021 | DEBUG    | __main__:trials:29 - Trial = 14307/30000 | Total reward = 44.58
2022-01-26 14:17:35.024 | DEBUG    | __main__:trials:24 - Trial = 14308/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.026 | DEBUG    | __main__:trials:29 - Trial = 14308/30000 | Total reward = 49.62
2022-01-26 14:17:35.030 | DEBUG    | __main__:trials:24 - Trial = 14309/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.030 | DEBUG    | __main__:trials:29 - Trial = 14309/30000 | Total reward = 48.07
2022-01-26 14:17:35.035 | DEBUG    | __main__:trials:24 - Trial = 14310/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.037 | DEBUG    | __main__:trials:29 - Trial = 14310/30000 | Total reward = 52.06
2022-01-26 14:17:35.040 | DEBUG    | __main__:trials:24 - Trial = 14311/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.041 | DEBUG    | __main__:trials:29 - Trial = 14311/30000 | Total reward = 49.48
2022-01-26 14:17:35.046 | DEBUG    | __main__:trials:24 - Trial = 14312/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.047 | DEBUG    | __main__:trials:29 - Trial = 14312/30000 | Total reward = 41.91
2022-01-26 14:17:35.050 | DEBUG    | __main__:trials:24 - Trial = 14313/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.052 | DEBUG    | __main__:trials:29 - Trial = 14313/30000 | Total reward = 41.22
2022-01-26 14:17:35.056 | DEBUG    | __main__:trials:24 - Trial = 14314/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.057 | DEBUG    | __main__:trials:29 - Trial = 14314/30000 | Total reward = 54.61
2022-01-26 14:17:35.062 | DEBUG    | __main__:trials:24 - Trial = 14315/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.063 | DEBUG    | __main__:trials:29 - Trial = 14315/30000 | Total reward = 48.17
2022-01-26 14:17:35.067 | DEBUG    | __main__:trials:24 - Trial = 14316/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.069 | DEBUG    | __main__:trials:29 - Trial = 14316/30000 | Total reward = 43.78
2022-01-26 14:17:35.072 | DEBUG    | __main__:trials:24 - Trial = 14317/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.073 | DEBUG    | __main__:trials:29 - Trial = 14317/30000 | Total reward = 48.70
2022-01-26 14:17:35.076 | DEBUG    | __main__:trials:24 - Trial = 14318/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.078 | DEBUG    | __main__:trials:29 - Trial = 14318/30000 | Total reward = 42.46
2022-01-26 14:17:35.081 | DEBUG    | __main__:trials:24 - Trial = 14319/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.083 | DEBUG    | __main__:trials:29 - Trial = 14319/30000 | Total reward = 47.06
2022-01-26 14:17:35.086 | DEBUG    | __main__:trials:24 - Trial = 14320/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.088 | DEBUG    | __main__:trials:29 - Trial = 14320/30000 | Total reward = 43.03
2022-01-26 14:17:35.091 | DEBUG    | __main__:trials:24 - Trial = 14321/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.092 | DEBUG    | __main__:trials:29 - Trial = 14321/30000 | Total reward = 50.64
2022-01-26 14:17:35.096 | DEBUG    | __main__:trials:24 - Trial = 14322/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.097 | DEBUG    | __main__:trials:29 - Trial = 14322/30000 | Total reward = 60.66
2022-01-26 14:17:35.101 | DEBUG    | __main__:trials:24 - Trial = 14323/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.102 | DEBUG    | __main__:trials:29 - Trial = 14323/30000 | Total reward = 47.05
2022-01-26 14:17:35.106 | DEBUG    | __main__:trials:24 - Trial = 14324/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.107 | DEBUG    | __main__:trials:29 - Trial = 14324/30000 | Total reward = 38.07
2022-01-26 14:17:35.110 | DEBUG    | __main__:trials:24 - Trial = 14325/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.112 | DEBUG    | __main__:trials:29 - Trial = 14325/30000 | Total reward = 44.54
2022-01-26 14:17:35.115 | DEBUG    | __main__:trials:24 - Trial = 14326/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.117 | DEBUG    | __main__:trials:29 - Trial = 14326/30000 | Total reward = 47.51
2022-01-26 14:17:35.121 | DEBUG    | __main__:trials:24 - Trial = 14327/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.122 | DEBUG    | __main__:trials:29 - Trial = 14327/30000 | Total reward = 42.28
2022-01-26 14:17:35.125 | DEBUG    | __main__:trials:24 - Trial = 14328/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.126 | DEBUG    | __main__:trials:29 - Trial = 14328/30000 | Total reward = 46.87
2022-01-26 14:17:35.129 | DEBUG    | __main__:trials:24 - Trial = 14329/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.131 | DEBUG    | __main__:trials:29 - Trial = 14329/30000 | Total reward = 37.40
2022-01-26 14:17:35.134 | DEBUG    | __main__:trials:24 - Trial = 14330/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.135 | DEBUG    | __main__:trials:29 - Trial = 14330/30000 | Total reward = 44.39
2022-01-26 14:17:35.139 | DEBUG    | __main__:trials:24 - Trial = 14331/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.140 | DEBUG    | __main__:trials:29 - Trial = 14331/30000 | Total reward = 39.31
2022-01-26 14:17:35.144 | DEBUG    | __main__:trials:24 - Trial = 14332/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.145 | DEBUG    | __main__:trials:29 - Trial = 14332/30000 | Total reward = 35.32
2022-01-26 14:17:35.150 | DEBUG    | __main__:trials:24 - Trial = 14333/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.151 | DEBUG    | __main__:trials:29 - Trial = 14333/30000 | Total reward = 47.20
2022-01-26 14:17:35.155 | DEBUG    | __main__:trials:24 - Trial = 14334/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.156 | DEBUG    | __main__:trials:29 - Trial = 14334/30000 | Total reward = 40.75
2022-01-26 14:17:35.159 | DEBUG    | __main__:trials:24 - Trial = 14335/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.161 | DEBUG    | __main__:trials:29 - Trial = 14335/30000 | Total reward = 41.56
2022-01-26 14:17:35.164 | DEBUG    | __main__:trials:24 - Trial = 14336/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.166 | DEBUG    | __main__:trials:29 - Trial = 14336/30000 | Total reward = 41.47
2022-01-26 14:17:35.169 | DEBUG    | __main__:trials:24 - Trial = 14337/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.171 | DEBUG    | __main__:trials:29 - Trial = 14337/30000 | Total reward = 47.85
2022-01-26 14:17:35.174 | DEBUG    | __main__:trials:24 - Trial = 14338/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.176 | DEBUG    | __main__:trials:29 - Trial = 14338/30000 | Total reward = 46.61
2022-01-26 14:17:35.180 | DEBUG    | __main__:trials:24 - Trial = 14339/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.180 | DEBUG    | __main__:trials:29 - Trial = 14339/30000 | Total reward = 46.26
2022-01-26 14:17:35.185 | DEBUG    | __main__:trials:24 - Trial = 14340/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.186 | DEBUG    | __main__:trials:29 - Trial = 14340/30000 | Total reward = 30.02
2022-01-26 14:17:35.189 | DEBUG    | __main__:trials:24 - Trial = 14341/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.191 | DEBUG    | __main__:trials:29 - Trial = 14341/30000 | Total reward = 44.00
2022-01-26 14:17:35.195 | DEBUG    | __main__:trials:24 - Trial = 14342/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.196 | DEBUG    | __main__:trials:29 - Trial = 14342/30000 | Total reward = 48.85
2022-01-26 14:17:35.200 | DEBUG    | __main__:trials:24 - Trial = 14343/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.201 | DEBUG    | __main__:trials:29 - Trial = 14343/30000 | Total reward = 36.42
2022-01-26 14:17:35.205 | DEBUG    | __main__:trials:24 - Trial = 14344/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.207 | DEBUG    | __main__:trials:29 - Trial = 14344/30000 | Total reward = 43.22
2022-01-26 14:17:35.210 | DEBUG    | __main__:trials:24 - Trial = 14345/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.211 | DEBUG    | __main__:trials:29 - Trial = 14345/30000 | Total reward = 38.27
2022-01-26 14:17:35.216 | DEBUG    | __main__:trials:24 - Trial = 14346/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.217 | DEBUG    | __main__:trials:29 - Trial = 14346/30000 | Total reward = 44.87
2022-01-26 14:17:35.221 | DEBUG    | __main__:trials:24 - Trial = 14347/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.222 | DEBUG    | __main__:trials:29 - Trial = 14347/30000 | Total reward = 53.45
2022-01-26 14:17:35.226 | DEBUG    | __main__:trials:24 - Trial = 14348/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.227 | DEBUG    | __main__:trials:29 - Trial = 14348/30000 | Total reward = 54.31
2022-01-26 14:17:35.231 | DEBUG    | __main__:trials:24 - Trial = 14349/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.234 | DEBUG    | __main__:trials:29 - Trial = 14349/30000 | Total reward = 46.26
2022-01-26 14:17:35.237 | DEBUG    | __main__:trials:24 - Trial = 14350/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.238 | DEBUG    | __main__:trials:29 - Trial = 14350/30000 | Total reward = 43.79
2022-01-26 14:17:35.243 | DEBUG    | __main__:trials:24 - Trial = 14351/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.244 | DEBUG    | __main__:trials:29 - Trial = 14351/30000 | Total reward = 41.31
2022-01-26 14:17:35.248 | DEBUG    | __main__:trials:24 - Trial = 14352/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.249 | DEBUG    | __main__:trials:29 - Trial = 14352/30000 | Total reward = 47.05
2022-01-26 14:17:35.253 | DEBUG    | __main__:trials:24 - Trial = 14353/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.254 | DEBUG    | __main__:trials:29 - Trial = 14353/30000 | Total reward = 44.20
2022-01-26 14:17:35.257 | DEBUG    | __main__:trials:24 - Trial = 14354/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.258 | DEBUG    | __main__:trials:29 - Trial = 14354/30000 | Total reward = 45.92
2022-01-26 14:17:35.261 | DEBUG    | __main__:trials:26 - Trial = 14355/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:35.263 | DEBUG    | __main__:trials:29 - Trial = 14355/30000 | Total reward = 40.41
2022-01-26 14:17:35.266 | DEBUG    | __main__:trials:24 - Trial = 14356/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.268 | DEBUG    | __main__:trials:29 - Trial = 14356/30000 | Total reward = 54.23
2022-01-26 14:17:35.272 | DEBUG    | __main__:trials:24 - Trial = 14357/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.272 | DEBUG    | __main__:trials:29 - Trial = 14357/30000 | Total reward = 55.37
2022-01-26 14:17:35.277 | DEBUG    | __main__:trials:24 - Trial = 14358/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.278 | DEBUG    | __main__:trials:29 - Trial = 14358/30000 | Total reward = 47.05
2022-01-26 14:17:35.281 | DEBUG    | __main__:trials:24 - Trial = 14359/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.282 | DEBUG    | __main__:trials:29 - Trial = 14359/30000 | Total reward = 51.18
2022-01-26 14:17:35.285 | DEBUG    | __main__:trials:26 - Trial = 14360/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:35.286 | DEBUG    | __main__:trials:29 - Trial = 14360/30000 | Total reward = 18.04
2022-01-26 14:17:35.290 | DEBUG    | __main__:trials:24 - Trial = 14361/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.291 | DEBUG    | __main__:trials:29 - Trial = 14361/30000 | Total reward = 48.80
2022-01-26 14:17:35.294 | DEBUG    | __main__:trials:24 - Trial = 14362/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.296 | DEBUG    | __main__:trials:29 - Trial = 14362/30000 | Total reward = 46.87
2022-01-26 14:17:35.299 | DEBUG    | __main__:trials:24 - Trial = 14363/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.301 | DEBUG    | __main__:trials:29 - Trial = 14363/30000 | Total reward = 47.98
2022-01-26 14:17:35.304 | DEBUG    | __main__:trials:24 - Trial = 14364/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.305 | DEBUG    | __main__:trials:29 - Trial = 14364/30000 | Total reward = 48.45
2022-01-26 14:17:35.310 | DEBUG    | __main__:trials:24 - Trial = 14365/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.310 | DEBUG    | __main__:trials:29 - Trial = 14365/30000 | Total reward = 41.07
2022-01-26 14:17:35.315 | DEBUG    | __main__:trials:24 - Trial = 14366/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.315 | DEBUG    | __main__:trials:29 - Trial = 14366/30000 | Total reward = 48.78
2022-01-26 14:17:35.319 | DEBUG    | __main__:trials:24 - Trial = 14367/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.321 | DEBUG    | __main__:trials:29 - Trial = 14367/30000 | Total reward = 47.25
2022-01-26 14:17:35.325 | DEBUG    | __main__:trials:24 - Trial = 14368/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.326 | DEBUG    | __main__:trials:29 - Trial = 14368/30000 | Total reward = 46.72
2022-01-26 14:17:35.330 | DEBUG    | __main__:trials:24 - Trial = 14369/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.330 | DEBUG    | __main__:trials:29 - Trial = 14369/30000 | Total reward = 36.74
2022-01-26 14:17:35.334 | DEBUG    | __main__:trials:24 - Trial = 14370/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.335 | DEBUG    | __main__:trials:29 - Trial = 14370/30000 | Total reward = 47.05
2022-01-26 14:17:35.340 | DEBUG    | __main__:trials:24 - Trial = 14371/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.341 | DEBUG    | __main__:trials:29 - Trial = 14371/30000 | Total reward = 66.06
2022-01-26 14:17:35.345 | DEBUG    | __main__:trials:24 - Trial = 14372/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.347 | DEBUG    | __main__:trials:29 - Trial = 14372/30000 | Total reward = 43.00
2022-01-26 14:17:35.350 | DEBUG    | __main__:trials:24 - Trial = 14373/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.351 | DEBUG    | __main__:trials:29 - Trial = 14373/30000 | Total reward = 47.21
2022-01-26 14:17:35.355 | DEBUG    | __main__:trials:24 - Trial = 14374/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.355 | DEBUG    | __main__:trials:29 - Trial = 14374/30000 | Total reward = 45.22
2022-01-26 14:17:35.359 | DEBUG    | __main__:trials:24 - Trial = 14375/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.361 | DEBUG    | __main__:trials:29 - Trial = 14375/30000 | Total reward = 34.53
2022-01-26 14:17:35.365 | DEBUG    | __main__:trials:24 - Trial = 14376/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.366 | DEBUG    | __main__:trials:29 - Trial = 14376/30000 | Total reward = 42.87
2022-01-26 14:17:35.370 | DEBUG    | __main__:trials:24 - Trial = 14377/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.370 | DEBUG    | __main__:trials:29 - Trial = 14377/30000 | Total reward = 45.28
2022-01-26 14:17:35.374 | DEBUG    | __main__:trials:24 - Trial = 14378/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.376 | DEBUG    | __main__:trials:29 - Trial = 14378/30000 | Total reward = 44.76
2022-01-26 14:17:35.379 | DEBUG    | __main__:trials:24 - Trial = 14379/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.380 | DEBUG    | __main__:trials:29 - Trial = 14379/30000 | Total reward = 42.79
2022-01-26 14:17:35.384 | DEBUG    | __main__:trials:24 - Trial = 14380/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.385 | DEBUG    | __main__:trials:29 - Trial = 14380/30000 | Total reward = 44.99
2022-01-26 14:17:35.389 | DEBUG    | __main__:trials:24 - Trial = 14381/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.390 | DEBUG    | __main__:trials:29 - Trial = 14381/30000 | Total reward = 40.99
2022-01-26 14:17:35.395 | DEBUG    | __main__:trials:24 - Trial = 14382/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.395 | DEBUG    | __main__:trials:29 - Trial = 14382/30000 | Total reward = 46.72
2022-01-26 14:17:35.400 | DEBUG    | __main__:trials:24 - Trial = 14383/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.401 | DEBUG    | __main__:trials:29 - Trial = 14383/30000 | Total reward = 51.38
2022-01-26 14:17:35.404 | DEBUG    | __main__:trials:24 - Trial = 14384/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.406 | DEBUG    | __main__:trials:29 - Trial = 14384/30000 | Total reward = 43.66
2022-01-26 14:17:35.410 | DEBUG    | __main__:trials:24 - Trial = 14385/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.410 | DEBUG    | __main__:trials:29 - Trial = 14385/30000 | Total reward = 48.70
2022-01-26 14:17:35.414 | DEBUG    | __main__:trials:24 - Trial = 14386/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.416 | DEBUG    | __main__:trials:29 - Trial = 14386/30000 | Total reward = 47.05
2022-01-26 14:17:35.420 | DEBUG    | __main__:trials:24 - Trial = 14387/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.421 | DEBUG    | __main__:trials:29 - Trial = 14387/30000 | Total reward = 44.20
2022-01-26 14:17:35.424 | DEBUG    | __main__:trials:24 - Trial = 14388/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.426 | DEBUG    | __main__:trials:29 - Trial = 14388/30000 | Total reward = 53.60
2022-01-26 14:17:35.430 | DEBUG    | __main__:trials:24 - Trial = 14389/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.430 | DEBUG    | __main__:trials:29 - Trial = 14389/30000 | Total reward = 40.34
2022-01-26 14:17:35.435 | DEBUG    | __main__:trials:24 - Trial = 14390/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.437 | DEBUG    | __main__:trials:29 - Trial = 14390/30000 | Total reward = 43.57
2022-01-26 14:17:35.440 | DEBUG    | __main__:trials:24 - Trial = 14391/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.441 | DEBUG    | __main__:trials:29 - Trial = 14391/30000 | Total reward = 58.90
2022-01-26 14:17:35.445 | DEBUG    | __main__:trials:24 - Trial = 14392/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.447 | DEBUG    | __main__:trials:29 - Trial = 14392/30000 | Total reward = 33.61
2022-01-26 14:17:35.450 | DEBUG    | __main__:trials:24 - Trial = 14393/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.452 | DEBUG    | __main__:trials:29 - Trial = 14393/30000 | Total reward = 42.95
2022-01-26 14:17:35.455 | DEBUG    | __main__:trials:24 - Trial = 14394/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.457 | DEBUG    | __main__:trials:29 - Trial = 14394/30000 | Total reward = 48.72
2022-01-26 14:17:35.460 | DEBUG    | __main__:trials:24 - Trial = 14395/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.462 | DEBUG    | __main__:trials:29 - Trial = 14395/30000 | Total reward = 42.36
2022-01-26 14:17:35.465 | DEBUG    | __main__:trials:24 - Trial = 14396/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.466 | DEBUG    | __main__:trials:29 - Trial = 14396/30000 | Total reward = 63.38
2022-01-26 14:17:35.469 | DEBUG    | __main__:trials:24 - Trial = 14397/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.472 | DEBUG    | __main__:trials:29 - Trial = 14397/30000 | Total reward = 44.76
2022-01-26 14:17:35.476 | DEBUG    | __main__:trials:24 - Trial = 14398/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.477 | DEBUG    | __main__:trials:29 - Trial = 14398/30000 | Total reward = 48.81
2022-01-26 14:17:35.480 | DEBUG    | __main__:trials:24 - Trial = 14399/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.482 | DEBUG    | __main__:trials:29 - Trial = 14399/30000 | Total reward = 46.90
2022-01-26 14:17:35.485 | DEBUG    | __main__:trials:24 - Trial = 14400/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.486 | DEBUG    | __main__:trials:29 - Trial = 14400/30000 | Total reward = 41.05
2022-01-26 14:17:35.489 | DEBUG    | __main__:trials:24 - Trial = 14401/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.491 | DEBUG    | __main__:trials:29 - Trial = 14401/30000 | Total reward = 41.16
2022-01-26 14:17:35.495 | DEBUG    | __main__:trials:24 - Trial = 14402/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.497 | DEBUG    | __main__:trials:29 - Trial = 14402/30000 | Total reward = 51.40
2022-01-26 14:17:35.500 | DEBUG    | __main__:trials:24 - Trial = 14403/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.501 | DEBUG    | __main__:trials:29 - Trial = 14403/30000 | Total reward = 57.08
2022-01-26 14:17:35.505 | DEBUG    | __main__:trials:24 - Trial = 14404/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.506 | DEBUG    | __main__:trials:29 - Trial = 14404/30000 | Total reward = 44.58
2022-01-26 14:17:35.510 | DEBUG    | __main__:trials:24 - Trial = 14405/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.510 | DEBUG    | __main__:trials:29 - Trial = 14405/30000 | Total reward = 42.40
2022-01-26 14:17:35.515 | DEBUG    | __main__:trials:24 - Trial = 14406/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.516 | DEBUG    | __main__:trials:29 - Trial = 14406/30000 | Total reward = 52.62
2022-01-26 14:17:35.520 | DEBUG    | __main__:trials:24 - Trial = 14407/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.521 | DEBUG    | __main__:trials:29 - Trial = 14407/30000 | Total reward = 49.15
2022-01-26 14:17:35.525 | DEBUG    | __main__:trials:24 - Trial = 14408/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.526 | DEBUG    | __main__:trials:29 - Trial = 14408/30000 | Total reward = 54.47
2022-01-26 14:17:35.530 | DEBUG    | __main__:trials:24 - Trial = 14409/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.531 | DEBUG    | __main__:trials:29 - Trial = 14409/30000 | Total reward = 43.77
2022-01-26 14:17:35.535 | DEBUG    | __main__:trials:24 - Trial = 14410/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.536 | DEBUG    | __main__:trials:29 - Trial = 14410/30000 | Total reward = 43.06
2022-01-26 14:17:35.539 | DEBUG    | __main__:trials:24 - Trial = 14411/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.541 | DEBUG    | __main__:trials:29 - Trial = 14411/30000 | Total reward = 61.44
2022-01-26 14:17:35.545 | DEBUG    | __main__:trials:24 - Trial = 14412/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.545 | DEBUG    | __main__:trials:29 - Trial = 14412/30000 | Total reward = 55.38
2022-01-26 14:17:35.550 | DEBUG    | __main__:trials:24 - Trial = 14413/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.551 | DEBUG    | __main__:trials:29 - Trial = 14413/30000 | Total reward = 44.88
2022-01-26 14:17:35.555 | DEBUG    | __main__:trials:24 - Trial = 14414/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.556 | DEBUG    | __main__:trials:29 - Trial = 14414/30000 | Total reward = 47.04
2022-01-26 14:17:35.560 | DEBUG    | __main__:trials:24 - Trial = 14415/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.562 | DEBUG    | __main__:trials:29 - Trial = 14415/30000 | Total reward = 46.40
2022-01-26 14:17:35.566 | DEBUG    | __main__:trials:24 - Trial = 14416/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.567 | DEBUG    | __main__:trials:29 - Trial = 14416/30000 | Total reward = 43.52
2022-01-26 14:17:35.570 | DEBUG    | __main__:trials:24 - Trial = 14417/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.572 | DEBUG    | __main__:trials:29 - Trial = 14417/30000 | Total reward = 44.83
2022-01-26 14:17:35.575 | DEBUG    | __main__:trials:24 - Trial = 14418/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.577 | DEBUG    | __main__:trials:29 - Trial = 14418/30000 | Total reward = 54.78
2022-01-26 14:17:35.580 | DEBUG    | __main__:trials:24 - Trial = 14419/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.581 | DEBUG    | __main__:trials:29 - Trial = 14419/30000 | Total reward = 54.06
2022-01-26 14:17:35.585 | DEBUG    | __main__:trials:24 - Trial = 14420/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.587 | DEBUG    | __main__:trials:29 - Trial = 14420/30000 | Total reward = 44.66
2022-01-26 14:17:35.590 | DEBUG    | __main__:trials:24 - Trial = 14421/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.592 | DEBUG    | __main__:trials:29 - Trial = 14421/30000 | Total reward = 46.61
2022-01-26 14:17:35.595 | DEBUG    | __main__:trials:24 - Trial = 14422/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.597 | DEBUG    | __main__:trials:29 - Trial = 14422/30000 | Total reward = 47.61
2022-01-26 14:17:35.600 | DEBUG    | __main__:trials:24 - Trial = 14423/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.601 | DEBUG    | __main__:trials:29 - Trial = 14423/30000 | Total reward = 50.36
2022-01-26 14:17:35.604 | DEBUG    | __main__:trials:24 - Trial = 14424/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.606 | DEBUG    | __main__:trials:29 - Trial = 14424/30000 | Total reward = 46.20
2022-01-26 14:17:35.609 | DEBUG    | __main__:trials:24 - Trial = 14425/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.609 | DEBUG    | __main__:trials:29 - Trial = 14425/30000 | Total reward = 33.24
2022-01-26 14:17:35.614 | DEBUG    | __main__:trials:24 - Trial = 14426/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.615 | DEBUG    | __main__:trials:29 - Trial = 14426/30000 | Total reward = 42.52
2022-01-26 14:17:35.619 | DEBUG    | __main__:trials:24 - Trial = 14427/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.620 | DEBUG    | __main__:trials:29 - Trial = 14427/30000 | Total reward = 35.37
2022-01-26 14:17:35.624 | DEBUG    | __main__:trials:24 - Trial = 14428/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.625 | DEBUG    | __main__:trials:29 - Trial = 14428/30000 | Total reward = 50.07
2022-01-26 14:17:35.629 | DEBUG    | __main__:trials:24 - Trial = 14429/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.630 | DEBUG    | __main__:trials:29 - Trial = 14429/30000 | Total reward = 45.73
2022-01-26 14:17:35.633 | DEBUG    | __main__:trials:24 - Trial = 14430/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.635 | DEBUG    | __main__:trials:29 - Trial = 14430/30000 | Total reward = 56.45
2022-01-26 14:17:35.638 | DEBUG    | __main__:trials:24 - Trial = 14431/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.639 | DEBUG    | __main__:trials:29 - Trial = 14431/30000 | Total reward = 43.30
2022-01-26 14:17:35.643 | DEBUG    | __main__:trials:24 - Trial = 14432/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.644 | DEBUG    | __main__:trials:29 - Trial = 14432/30000 | Total reward = 43.31
2022-01-26 14:17:35.648 | DEBUG    | __main__:trials:24 - Trial = 14433/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.650 | DEBUG    | __main__:trials:29 - Trial = 14433/30000 | Total reward = 66.72
2022-01-26 14:17:35.653 | DEBUG    | __main__:trials:24 - Trial = 14434/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.654 | DEBUG    | __main__:trials:29 - Trial = 14434/30000 | Total reward = 43.98
2022-01-26 14:17:35.659 | DEBUG    | __main__:trials:24 - Trial = 14435/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.659 | DEBUG    | __main__:trials:29 - Trial = 14435/30000 | Total reward = 42.11
2022-01-26 14:17:35.664 | DEBUG    | __main__:trials:24 - Trial = 14436/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.665 | DEBUG    | __main__:trials:29 - Trial = 14436/30000 | Total reward = 60.14
2022-01-26 14:17:35.669 | DEBUG    | __main__:trials:24 - Trial = 14437/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.671 | DEBUG    | __main__:trials:29 - Trial = 14437/30000 | Total reward = 47.48
2022-01-26 14:17:35.674 | DEBUG    | __main__:trials:24 - Trial = 14438/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.676 | DEBUG    | __main__:trials:29 - Trial = 14438/30000 | Total reward = 40.05
2022-01-26 14:17:35.680 | DEBUG    | __main__:trials:24 - Trial = 14439/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.680 | DEBUG    | __main__:trials:29 - Trial = 14439/30000 | Total reward = 45.20
2022-01-26 14:17:35.685 | DEBUG    | __main__:trials:24 - Trial = 14440/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.686 | DEBUG    | __main__:trials:29 - Trial = 14440/30000 | Total reward = 42.41
2022-01-26 14:17:35.690 | DEBUG    | __main__:trials:24 - Trial = 14441/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.692 | DEBUG    | __main__:trials:29 - Trial = 14441/30000 | Total reward = 42.31
2022-01-26 14:17:35.696 | DEBUG    | __main__:trials:24 - Trial = 14442/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.697 | DEBUG    | __main__:trials:29 - Trial = 14442/30000 | Total reward = 58.99
2022-01-26 14:17:35.701 | DEBUG    | __main__:trials:24 - Trial = 14443/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.701 | DEBUG    | __main__:trials:29 - Trial = 14443/30000 | Total reward = 50.39
2022-01-26 14:17:35.705 | DEBUG    | __main__:trials:24 - Trial = 14444/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.706 | DEBUG    | __main__:trials:29 - Trial = 14444/30000 | Total reward = 45.61
2022-01-26 14:17:35.710 | DEBUG    | __main__:trials:24 - Trial = 14445/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.712 | DEBUG    | __main__:trials:29 - Trial = 14445/30000 | Total reward = 47.96
2022-01-26 14:17:35.716 | DEBUG    | __main__:trials:24 - Trial = 14446/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.717 | DEBUG    | __main__:trials:29 - Trial = 14446/30000 | Total reward = 43.31
2022-01-26 14:17:35.721 | DEBUG    | __main__:trials:24 - Trial = 14447/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.722 | DEBUG    | __main__:trials:29 - Trial = 14447/30000 | Total reward = 45.23
2022-01-26 14:17:35.726 | DEBUG    | __main__:trials:24 - Trial = 14448/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.727 | DEBUG    | __main__:trials:29 - Trial = 14448/30000 | Total reward = 46.61
2022-01-26 14:17:35.730 | DEBUG    | __main__:trials:24 - Trial = 14449/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.732 | DEBUG    | __main__:trials:29 - Trial = 14449/30000 | Total reward = 45.78
2022-01-26 14:17:35.735 | DEBUG    | __main__:trials:24 - Trial = 14450/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.737 | DEBUG    | __main__:trials:29 - Trial = 14450/30000 | Total reward = 57.55
2022-01-26 14:17:35.740 | DEBUG    | __main__:trials:24 - Trial = 14451/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.742 | DEBUG    | __main__:trials:29 - Trial = 14451/30000 | Total reward = 44.44
2022-01-26 14:17:35.746 | DEBUG    | __main__:trials:24 - Trial = 14452/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.748 | DEBUG    | __main__:trials:29 - Trial = 14452/30000 | Total reward = 48.97
2022-01-26 14:17:35.753 | DEBUG    | __main__:trials:24 - Trial = 14453/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.755 | DEBUG    | __main__:trials:29 - Trial = 14453/30000 | Total reward = 48.44
2022-01-26 14:17:35.760 | DEBUG    | __main__:trials:24 - Trial = 14454/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.761 | DEBUG    | __main__:trials:29 - Trial = 14454/30000 | Total reward = 36.30
2022-01-26 14:17:35.765 | DEBUG    | __main__:trials:24 - Trial = 14455/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.767 | DEBUG    | __main__:trials:29 - Trial = 14455/30000 | Total reward = 42.49
2022-01-26 14:17:35.770 | DEBUG    | __main__:trials:24 - Trial = 14456/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.771 | DEBUG    | __main__:trials:29 - Trial = 14456/30000 | Total reward = 42.73
2022-01-26 14:17:35.775 | DEBUG    | __main__:trials:24 - Trial = 14457/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.776 | DEBUG    | __main__:trials:29 - Trial = 14457/30000 | Total reward = 58.30
2022-01-26 14:17:35.780 | DEBUG    | __main__:trials:24 - Trial = 14458/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.781 | DEBUG    | __main__:trials:29 - Trial = 14458/30000 | Total reward = 36.98
2022-01-26 14:17:35.784 | DEBUG    | __main__:trials:24 - Trial = 14459/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.785 | DEBUG    | __main__:trials:29 - Trial = 14459/30000 | Total reward = 46.79
2022-01-26 14:17:35.789 | DEBUG    | __main__:trials:24 - Trial = 14460/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.790 | DEBUG    | __main__:trials:29 - Trial = 14460/30000 | Total reward = 52.76
2022-01-26 14:17:35.794 | DEBUG    | __main__:trials:24 - Trial = 14461/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.794 | DEBUG    | __main__:trials:29 - Trial = 14461/30000 | Total reward = 48.39
2022-01-26 14:17:35.798 | DEBUG    | __main__:trials:24 - Trial = 14462/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.800 | DEBUG    | __main__:trials:29 - Trial = 14462/30000 | Total reward = 47.66
2022-01-26 14:17:35.804 | DEBUG    | __main__:trials:24 - Trial = 14463/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.805 | DEBUG    | __main__:trials:29 - Trial = 14463/30000 | Total reward = 40.43
2022-01-26 14:17:35.809 | DEBUG    | __main__:trials:24 - Trial = 14464/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.809 | DEBUG    | __main__:trials:29 - Trial = 14464/30000 | Total reward = 42.23
2022-01-26 14:17:35.813 | DEBUG    | __main__:trials:24 - Trial = 14465/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.815 | DEBUG    | __main__:trials:29 - Trial = 14465/30000 | Total reward = 46.66
2022-01-26 14:17:35.819 | DEBUG    | __main__:trials:24 - Trial = 14466/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.819 | DEBUG    | __main__:trials:29 - Trial = 14466/30000 | Total reward = 51.57
2022-01-26 14:17:35.824 | DEBUG    | __main__:trials:24 - Trial = 14467/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.825 | DEBUG    | __main__:trials:29 - Trial = 14467/30000 | Total reward = 42.53
2022-01-26 14:17:35.829 | DEBUG    | __main__:trials:24 - Trial = 14468/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.830 | DEBUG    | __main__:trials:29 - Trial = 14468/30000 | Total reward = 53.76
2022-01-26 14:17:35.834 | DEBUG    | __main__:trials:24 - Trial = 14469/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.835 | DEBUG    | __main__:trials:29 - Trial = 14469/30000 | Total reward = 57.73
2022-01-26 14:17:35.839 | DEBUG    | __main__:trials:24 - Trial = 14470/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.840 | DEBUG    | __main__:trials:29 - Trial = 14470/30000 | Total reward = 46.06
2022-01-26 14:17:35.844 | DEBUG    | __main__:trials:24 - Trial = 14471/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.846 | DEBUG    | __main__:trials:29 - Trial = 14471/30000 | Total reward = 44.78
2022-01-26 14:17:35.849 | DEBUG    | __main__:trials:24 - Trial = 14472/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.850 | DEBUG    | __main__:trials:29 - Trial = 14472/30000 | Total reward = 46.79
2022-01-26 14:17:35.855 | DEBUG    | __main__:trials:24 - Trial = 14473/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.856 | DEBUG    | __main__:trials:29 - Trial = 14473/30000 | Total reward = 51.14
2022-01-26 14:17:35.860 | DEBUG    | __main__:trials:24 - Trial = 14474/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.862 | DEBUG    | __main__:trials:29 - Trial = 14474/30000 | Total reward = 48.64
2022-01-26 14:17:35.865 | DEBUG    | __main__:trials:24 - Trial = 14475/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.866 | DEBUG    | __main__:trials:29 - Trial = 14475/30000 | Total reward = 47.61
2022-01-26 14:17:35.870 | DEBUG    | __main__:trials:24 - Trial = 14476/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.871 | DEBUG    | __main__:trials:29 - Trial = 14476/30000 | Total reward = 47.72
2022-01-26 14:17:35.875 | DEBUG    | __main__:trials:24 - Trial = 14477/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.876 | DEBUG    | __main__:trials:29 - Trial = 14477/30000 | Total reward = 53.55
2022-01-26 14:17:35.880 | DEBUG    | __main__:trials:24 - Trial = 14478/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.881 | DEBUG    | __main__:trials:29 - Trial = 14478/30000 | Total reward = 48.27
2022-01-26 14:17:35.884 | DEBUG    | __main__:trials:24 - Trial = 14479/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.886 | DEBUG    | __main__:trials:29 - Trial = 14479/30000 | Total reward = 35.55
2022-01-26 14:17:35.889 | DEBUG    | __main__:trials:24 - Trial = 14480/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.890 | DEBUG    | __main__:trials:29 - Trial = 14480/30000 | Total reward = 35.89
2022-01-26 14:17:35.893 | DEBUG    | __main__:trials:24 - Trial = 14481/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.895 | DEBUG    | __main__:trials:29 - Trial = 14481/30000 | Total reward = 38.45
2022-01-26 14:17:35.898 | DEBUG    | __main__:trials:24 - Trial = 14482/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.899 | DEBUG    | __main__:trials:29 - Trial = 14482/30000 | Total reward = 48.43
2022-01-26 14:17:35.903 | DEBUG    | __main__:trials:24 - Trial = 14483/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.904 | DEBUG    | __main__:trials:29 - Trial = 14483/30000 | Total reward = 42.20
2022-01-26 14:17:35.908 | DEBUG    | __main__:trials:24 - Trial = 14484/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.909 | DEBUG    | __main__:trials:29 - Trial = 14484/30000 | Total reward = 47.28
2022-01-26 14:17:35.912 | DEBUG    | __main__:trials:24 - Trial = 14485/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.915 | DEBUG    | __main__:trials:29 - Trial = 14485/30000 | Total reward = 43.09
2022-01-26 14:17:35.918 | DEBUG    | __main__:trials:24 - Trial = 14486/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.919 | DEBUG    | __main__:trials:29 - Trial = 14486/30000 | Total reward = 45.58
2022-01-26 14:17:35.923 | DEBUG    | __main__:trials:24 - Trial = 14487/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.924 | DEBUG    | __main__:trials:29 - Trial = 14487/30000 | Total reward = 42.91
2022-01-26 14:17:35.927 | DEBUG    | __main__:trials:24 - Trial = 14488/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.928 | DEBUG    | __main__:trials:29 - Trial = 14488/30000 | Total reward = 55.26
2022-01-26 14:17:35.931 | DEBUG    | __main__:trials:24 - Trial = 14489/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.933 | DEBUG    | __main__:trials:29 - Trial = 14489/30000 | Total reward = 47.50
2022-01-26 14:17:35.936 | DEBUG    | __main__:trials:24 - Trial = 14490/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.938 | DEBUG    | __main__:trials:29 - Trial = 14490/30000 | Total reward = 47.73
2022-01-26 14:17:35.941 | DEBUG    | __main__:trials:24 - Trial = 14491/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.943 | DEBUG    | __main__:trials:29 - Trial = 14491/30000 | Total reward = 42.70
2022-01-26 14:17:35.947 | DEBUG    | __main__:trials:24 - Trial = 14492/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.948 | DEBUG    | __main__:trials:29 - Trial = 14492/30000 | Total reward = 44.82
2022-01-26 14:17:35.951 | DEBUG    | __main__:trials:24 - Trial = 14493/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.953 | DEBUG    | __main__:trials:29 - Trial = 14493/30000 | Total reward = 47.09
2022-01-26 14:17:35.956 | DEBUG    | __main__:trials:24 - Trial = 14494/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.957 | DEBUG    | __main__:trials:29 - Trial = 14494/30000 | Total reward = 53.10
2022-01-26 14:17:35.962 | DEBUG    | __main__:trials:24 - Trial = 14495/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.962 | DEBUG    | __main__:trials:29 - Trial = 14495/30000 | Total reward = 59.30
2022-01-26 14:17:35.967 | DEBUG    | __main__:trials:24 - Trial = 14496/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.968 | DEBUG    | __main__:trials:29 - Trial = 14496/30000 | Total reward = 37.25
2022-01-26 14:17:35.972 | DEBUG    | __main__:trials:24 - Trial = 14497/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.973 | DEBUG    | __main__:trials:29 - Trial = 14497/30000 | Total reward = 58.94
2022-01-26 14:17:35.976 | DEBUG    | __main__:trials:24 - Trial = 14498/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.978 | DEBUG    | __main__:trials:29 - Trial = 14498/30000 | Total reward = 49.68
2022-01-26 14:17:35.981 | DEBUG    | __main__:trials:24 - Trial = 14499/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.983 | DEBUG    | __main__:trials:29 - Trial = 14499/30000 | Total reward = 46.78
2022-01-26 14:17:35.987 | DEBUG    | __main__:trials:24 - Trial = 14500/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.988 | DEBUG    | __main__:trials:29 - Trial = 14500/30000 | Total reward = 51.36
2022-01-26 14:17:35.992 | DEBUG    | __main__:trials:24 - Trial = 14501/30000 | Max number of steps (20) reached
2022-01-26 14:17:35.993 | DEBUG    | __main__:trials:29 - Trial = 14501/30000 | Total reward = 53.23
2022-01-26 14:17:35.996 | DEBUG    | __main__:trials:26 - Trial = 14502/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:35.998 | DEBUG    | __main__:trials:29 - Trial = 14502/30000 | Total reward = 37.52
2022-01-26 14:17:36.002 | DEBUG    | __main__:trials:24 - Trial = 14503/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.003 | DEBUG    | __main__:trials:29 - Trial = 14503/30000 | Total reward = 57.36
2022-01-26 14:17:36.006 | DEBUG    | __main__:trials:24 - Trial = 14504/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.007 | DEBUG    | __main__:trials:29 - Trial = 14504/30000 | Total reward = 51.26
2022-01-26 14:17:36.011 | DEBUG    | __main__:trials:24 - Trial = 14505/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.012 | DEBUG    | __main__:trials:29 - Trial = 14505/30000 | Total reward = 39.40
2022-01-26 14:17:36.015 | DEBUG    | __main__:trials:24 - Trial = 14506/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.017 | DEBUG    | __main__:trials:29 - Trial = 14506/30000 | Total reward = 53.81
2022-01-26 14:17:36.021 | DEBUG    | __main__:trials:24 - Trial = 14507/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.021 | DEBUG    | __main__:trials:29 - Trial = 14507/30000 | Total reward = 63.30
2022-01-26 14:17:36.026 | DEBUG    | __main__:trials:24 - Trial = 14508/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.026 | DEBUG    | __main__:trials:29 - Trial = 14508/30000 | Total reward = 61.34
2022-01-26 14:17:36.030 | DEBUG    | __main__:trials:24 - Trial = 14509/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.032 | DEBUG    | __main__:trials:29 - Trial = 14509/30000 | Total reward = 47.20
2022-01-26 14:17:36.036 | DEBUG    | __main__:trials:24 - Trial = 14510/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.036 | DEBUG    | __main__:trials:29 - Trial = 14510/30000 | Total reward = 36.10
2022-01-26 14:17:36.041 | DEBUG    | __main__:trials:24 - Trial = 14511/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.043 | DEBUG    | __main__:trials:29 - Trial = 14511/30000 | Total reward = 57.72
2022-01-26 14:17:36.046 | DEBUG    | __main__:trials:24 - Trial = 14512/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.047 | DEBUG    | __main__:trials:29 - Trial = 14512/30000 | Total reward = 56.57
2022-01-26 14:17:36.051 | DEBUG    | __main__:trials:24 - Trial = 14513/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.052 | DEBUG    | __main__:trials:29 - Trial = 14513/30000 | Total reward = 51.97
2022-01-26 14:17:36.055 | DEBUG    | __main__:trials:26 - Trial = 14514/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:36.056 | DEBUG    | __main__:trials:29 - Trial = 14514/30000 | Total reward = 18.24
2022-01-26 14:17:36.060 | DEBUG    | __main__:trials:24 - Trial = 14515/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.061 | DEBUG    | __main__:trials:29 - Trial = 14515/30000 | Total reward = 55.11
2022-01-26 14:17:36.066 | DEBUG    | __main__:trials:24 - Trial = 14516/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.067 | DEBUG    | __main__:trials:29 - Trial = 14516/30000 | Total reward = 43.58
2022-01-26 14:17:36.071 | DEBUG    | __main__:trials:24 - Trial = 14517/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.072 | DEBUG    | __main__:trials:29 - Trial = 14517/30000 | Total reward = 42.71
2022-01-26 14:17:36.076 | DEBUG    | __main__:trials:24 - Trial = 14518/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.078 | DEBUG    | __main__:trials:29 - Trial = 14518/30000 | Total reward = 41.33
2022-01-26 14:17:36.081 | DEBUG    | __main__:trials:24 - Trial = 14519/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.083 | DEBUG    | __main__:trials:29 - Trial = 14519/30000 | Total reward = 61.22
2022-01-26 14:17:36.086 | DEBUG    | __main__:trials:24 - Trial = 14520/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.088 | DEBUG    | __main__:trials:29 - Trial = 14520/30000 | Total reward = 44.72
2022-01-26 14:17:36.091 | DEBUG    | __main__:trials:24 - Trial = 14521/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.093 | DEBUG    | __main__:trials:29 - Trial = 14521/30000 | Total reward = 38.99
2022-01-26 14:17:36.096 | DEBUG    | __main__:trials:24 - Trial = 14522/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.098 | DEBUG    | __main__:trials:29 - Trial = 14522/30000 | Total reward = 57.51
2022-01-26 14:17:36.102 | DEBUG    | __main__:trials:24 - Trial = 14523/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.103 | DEBUG    | __main__:trials:29 - Trial = 14523/30000 | Total reward = 62.09
2022-01-26 14:17:36.106 | DEBUG    | __main__:trials:24 - Trial = 14524/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.108 | DEBUG    | __main__:trials:29 - Trial = 14524/30000 | Total reward = 32.39
2022-01-26 14:17:36.112 | DEBUG    | __main__:trials:24 - Trial = 14525/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.113 | DEBUG    | __main__:trials:29 - Trial = 14525/30000 | Total reward = 60.50
2022-01-26 14:17:36.117 | DEBUG    | __main__:trials:24 - Trial = 14526/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.119 | DEBUG    | __main__:trials:29 - Trial = 14526/30000 | Total reward = 52.60
2022-01-26 14:17:36.122 | DEBUG    | __main__:trials:24 - Trial = 14527/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.124 | DEBUG    | __main__:trials:29 - Trial = 14527/30000 | Total reward = 60.43
2022-01-26 14:17:36.127 | DEBUG    | __main__:trials:24 - Trial = 14528/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.128 | DEBUG    | __main__:trials:29 - Trial = 14528/30000 | Total reward = 49.89
2022-01-26 14:17:36.132 | DEBUG    | __main__:trials:24 - Trial = 14529/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.133 | DEBUG    | __main__:trials:29 - Trial = 14529/30000 | Total reward = 58.89
2022-01-26 14:17:36.137 | DEBUG    | __main__:trials:24 - Trial = 14530/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.139 | DEBUG    | __main__:trials:29 - Trial = 14530/30000 | Total reward = 58.83
2022-01-26 14:17:36.143 | DEBUG    | __main__:trials:24 - Trial = 14531/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.144 | DEBUG    | __main__:trials:29 - Trial = 14531/30000 | Total reward = 45.84
2022-01-26 14:17:36.148 | DEBUG    | __main__:trials:24 - Trial = 14532/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.149 | DEBUG    | __main__:trials:29 - Trial = 14532/30000 | Total reward = 36.93
2022-01-26 14:17:36.153 | DEBUG    | __main__:trials:24 - Trial = 14533/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.155 | DEBUG    | __main__:trials:29 - Trial = 14533/30000 | Total reward = 41.69
2022-01-26 14:17:36.159 | DEBUG    | __main__:trials:24 - Trial = 14534/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.160 | DEBUG    | __main__:trials:29 - Trial = 14534/30000 | Total reward = 51.25
2022-01-26 14:17:36.164 | DEBUG    | __main__:trials:24 - Trial = 14535/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.165 | DEBUG    | __main__:trials:29 - Trial = 14535/30000 | Total reward = 41.17
2022-01-26 14:17:36.169 | DEBUG    | __main__:trials:24 - Trial = 14536/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.170 | DEBUG    | __main__:trials:29 - Trial = 14536/30000 | Total reward = 36.89
2022-01-26 14:17:36.174 | DEBUG    | __main__:trials:24 - Trial = 14537/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.176 | DEBUG    | __main__:trials:29 - Trial = 14537/30000 | Total reward = 66.52
2022-01-26 14:17:36.179 | DEBUG    | __main__:trials:26 - Trial = 14538/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:36.179 | DEBUG    | __main__:trials:29 - Trial = 14538/30000 | Total reward = 19.08
2022-01-26 14:17:36.183 | DEBUG    | __main__:trials:24 - Trial = 14539/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.184 | DEBUG    | __main__:trials:29 - Trial = 14539/30000 | Total reward = 37.12
2022-01-26 14:17:36.188 | DEBUG    | __main__:trials:24 - Trial = 14540/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.190 | DEBUG    | __main__:trials:29 - Trial = 14540/30000 | Total reward = 38.46
2022-01-26 14:17:36.194 | DEBUG    | __main__:trials:24 - Trial = 14541/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.196 | DEBUG    | __main__:trials:29 - Trial = 14541/30000 | Total reward = 40.51
2022-01-26 14:17:36.199 | DEBUG    | __main__:trials:24 - Trial = 14542/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.200 | DEBUG    | __main__:trials:29 - Trial = 14542/30000 | Total reward = 38.64
2022-01-26 14:17:36.204 | DEBUG    | __main__:trials:24 - Trial = 14543/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.206 | DEBUG    | __main__:trials:29 - Trial = 14543/30000 | Total reward = 38.64
2022-01-26 14:17:36.209 | DEBUG    | __main__:trials:24 - Trial = 14544/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.211 | DEBUG    | __main__:trials:29 - Trial = 14544/30000 | Total reward = 41.25
2022-01-26 14:17:36.215 | DEBUG    | __main__:trials:24 - Trial = 14545/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.216 | DEBUG    | __main__:trials:29 - Trial = 14545/30000 | Total reward = 56.07
2022-01-26 14:17:36.220 | DEBUG    | __main__:trials:24 - Trial = 14546/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.220 | DEBUG    | __main__:trials:29 - Trial = 14546/30000 | Total reward = 50.17
2022-01-26 14:17:36.225 | DEBUG    | __main__:trials:24 - Trial = 14547/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.225 | DEBUG    | __main__:trials:29 - Trial = 14547/30000 | Total reward = 60.61
2022-01-26 14:17:36.229 | DEBUG    | __main__:trials:24 - Trial = 14548/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.230 | DEBUG    | __main__:trials:29 - Trial = 14548/30000 | Total reward = 45.41
2022-01-26 14:17:36.235 | DEBUG    | __main__:trials:24 - Trial = 14549/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.236 | DEBUG    | __main__:trials:29 - Trial = 14549/30000 | Total reward = 46.47
2022-01-26 14:17:36.240 | DEBUG    | __main__:trials:24 - Trial = 14550/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.242 | DEBUG    | __main__:trials:29 - Trial = 14550/30000 | Total reward = 46.83
2022-01-26 14:17:36.246 | DEBUG    | __main__:trials:24 - Trial = 14551/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.246 | DEBUG    | __main__:trials:29 - Trial = 14551/30000 | Total reward = 43.00
2022-01-26 14:17:36.251 | DEBUG    | __main__:trials:24 - Trial = 14552/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.252 | DEBUG    | __main__:trials:29 - Trial = 14552/30000 | Total reward = 37.16
2022-01-26 14:17:36.256 | DEBUG    | __main__:trials:24 - Trial = 14553/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.257 | DEBUG    | __main__:trials:29 - Trial = 14553/30000 | Total reward = 24.81
2022-01-26 14:17:36.261 | DEBUG    | __main__:trials:24 - Trial = 14554/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.262 | DEBUG    | __main__:trials:29 - Trial = 14554/30000 | Total reward = 43.39
2022-01-26 14:17:36.266 | DEBUG    | __main__:trials:24 - Trial = 14555/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.268 | DEBUG    | __main__:trials:29 - Trial = 14555/30000 | Total reward = 46.18
2022-01-26 14:17:36.271 | DEBUG    | __main__:trials:24 - Trial = 14556/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.272 | DEBUG    | __main__:trials:29 - Trial = 14556/30000 | Total reward = 56.33
2022-01-26 14:17:36.276 | DEBUG    | __main__:trials:24 - Trial = 14557/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.277 | DEBUG    | __main__:trials:29 - Trial = 14557/30000 | Total reward = 29.05
2022-01-26 14:17:36.281 | DEBUG    | __main__:trials:24 - Trial = 14558/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.282 | DEBUG    | __main__:trials:29 - Trial = 14558/30000 | Total reward = 52.61
2022-01-26 14:17:36.286 | DEBUG    | __main__:trials:24 - Trial = 14559/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.287 | DEBUG    | __main__:trials:29 - Trial = 14559/30000 | Total reward = 44.88
2022-01-26 14:17:36.291 | DEBUG    | __main__:trials:24 - Trial = 14560/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.292 | DEBUG    | __main__:trials:29 - Trial = 14560/30000 | Total reward = 46.79
2022-01-26 14:17:36.296 | DEBUG    | __main__:trials:24 - Trial = 14561/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.297 | DEBUG    | __main__:trials:29 - Trial = 14561/30000 | Total reward = 49.43
2022-01-26 14:17:36.301 | DEBUG    | __main__:trials:24 - Trial = 14562/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.302 | DEBUG    | __main__:trials:29 - Trial = 14562/30000 | Total reward = 61.81
2022-01-26 14:17:36.306 | DEBUG    | __main__:trials:24 - Trial = 14563/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.307 | DEBUG    | __main__:trials:29 - Trial = 14563/30000 | Total reward = 41.47
2022-01-26 14:17:36.311 | DEBUG    | __main__:trials:24 - Trial = 14564/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.313 | DEBUG    | __main__:trials:29 - Trial = 14564/30000 | Total reward = 53.60
2022-01-26 14:17:36.316 | DEBUG    | __main__:trials:24 - Trial = 14565/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.318 | DEBUG    | __main__:trials:29 - Trial = 14565/30000 | Total reward = 52.82
2022-01-26 14:17:36.321 | DEBUG    | __main__:trials:24 - Trial = 14566/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.322 | DEBUG    | __main__:trials:29 - Trial = 14566/30000 | Total reward = 49.64
2022-01-26 14:17:36.326 | DEBUG    | __main__:trials:24 - Trial = 14567/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.328 | DEBUG    | __main__:trials:29 - Trial = 14567/30000 | Total reward = 50.07
2022-01-26 14:17:36.331 | DEBUG    | __main__:trials:24 - Trial = 14568/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.333 | DEBUG    | __main__:trials:29 - Trial = 14568/30000 | Total reward = 38.71
2022-01-26 14:17:36.336 | DEBUG    | __main__:trials:24 - Trial = 14569/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.337 | DEBUG    | __main__:trials:29 - Trial = 14569/30000 | Total reward = 62.12
2022-01-26 14:17:36.340 | DEBUG    | __main__:trials:24 - Trial = 14570/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.342 | DEBUG    | __main__:trials:29 - Trial = 14570/30000 | Total reward = 41.97
2022-01-26 14:17:36.345 | DEBUG    | __main__:trials:24 - Trial = 14571/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.346 | DEBUG    | __main__:trials:29 - Trial = 14571/30000 | Total reward = 49.37
2022-01-26 14:17:36.349 | DEBUG    | __main__:trials:24 - Trial = 14572/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.350 | DEBUG    | __main__:trials:29 - Trial = 14572/30000 | Total reward = 61.52
2022-01-26 14:17:36.353 | DEBUG    | __main__:trials:24 - Trial = 14573/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.353 | DEBUG    | __main__:trials:29 - Trial = 14573/30000 | Total reward = 54.57
2022-01-26 14:17:36.358 | DEBUG    | __main__:trials:24 - Trial = 14574/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.358 | DEBUG    | __main__:trials:29 - Trial = 14574/30000 | Total reward = 39.99
2022-01-26 14:17:36.363 | DEBUG    | __main__:trials:24 - Trial = 14575/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.364 | DEBUG    | __main__:trials:29 - Trial = 14575/30000 | Total reward = 51.28
2022-01-26 14:17:36.368 | DEBUG    | __main__:trials:24 - Trial = 14576/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.369 | DEBUG    | __main__:trials:29 - Trial = 14576/30000 | Total reward = 47.76
2022-01-26 14:17:36.372 | DEBUG    | __main__:trials:24 - Trial = 14577/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.374 | DEBUG    | __main__:trials:29 - Trial = 14577/30000 | Total reward = 44.49
2022-01-26 14:17:36.377 | DEBUG    | __main__:trials:24 - Trial = 14578/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.379 | DEBUG    | __main__:trials:29 - Trial = 14578/30000 | Total reward = 51.91
2022-01-26 14:17:36.382 | DEBUG    | __main__:trials:24 - Trial = 14579/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.383 | DEBUG    | __main__:trials:29 - Trial = 14579/30000 | Total reward = 36.41
2022-01-26 14:17:36.387 | DEBUG    | __main__:trials:24 - Trial = 14580/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.388 | DEBUG    | __main__:trials:29 - Trial = 14580/30000 | Total reward = 35.20
2022-01-26 14:17:36.392 | DEBUG    | __main__:trials:24 - Trial = 14581/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.393 | DEBUG    | __main__:trials:29 - Trial = 14581/30000 | Total reward = 45.75
2022-01-26 14:17:36.396 | DEBUG    | __main__:trials:24 - Trial = 14582/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.398 | DEBUG    | __main__:trials:29 - Trial = 14582/30000 | Total reward = 46.27
2022-01-26 14:17:36.402 | DEBUG    | __main__:trials:24 - Trial = 14583/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.403 | DEBUG    | __main__:trials:29 - Trial = 14583/30000 | Total reward = 45.54
2022-01-26 14:17:36.407 | DEBUG    | __main__:trials:24 - Trial = 14584/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.408 | DEBUG    | __main__:trials:29 - Trial = 14584/30000 | Total reward = 34.10
2022-01-26 14:17:36.412 | DEBUG    | __main__:trials:24 - Trial = 14585/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.414 | DEBUG    | __main__:trials:29 - Trial = 14585/30000 | Total reward = 52.48
2022-01-26 14:17:36.417 | DEBUG    | __main__:trials:24 - Trial = 14586/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.419 | DEBUG    | __main__:trials:29 - Trial = 14586/30000 | Total reward = 65.97
2022-01-26 14:17:36.423 | DEBUG    | __main__:trials:24 - Trial = 14587/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.423 | DEBUG    | __main__:trials:29 - Trial = 14587/30000 | Total reward = 47.67
2022-01-26 14:17:36.427 | DEBUG    | __main__:trials:24 - Trial = 14588/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.429 | DEBUG    | __main__:trials:29 - Trial = 14588/30000 | Total reward = 50.10
2022-01-26 14:17:36.432 | DEBUG    | __main__:trials:24 - Trial = 14589/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.433 | DEBUG    | __main__:trials:29 - Trial = 14589/30000 | Total reward = 55.09
2022-01-26 14:17:36.437 | DEBUG    | __main__:trials:24 - Trial = 14590/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.438 | DEBUG    | __main__:trials:29 - Trial = 14590/30000 | Total reward = 59.28
2022-01-26 14:17:36.441 | DEBUG    | __main__:trials:24 - Trial = 14591/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.443 | DEBUG    | __main__:trials:29 - Trial = 14591/30000 | Total reward = 52.48
2022-01-26 14:17:36.447 | DEBUG    | __main__:trials:24 - Trial = 14592/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.449 | DEBUG    | __main__:trials:29 - Trial = 14592/30000 | Total reward = 37.61
2022-01-26 14:17:36.452 | DEBUG    | __main__:trials:24 - Trial = 14593/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.453 | DEBUG    | __main__:trials:29 - Trial = 14593/30000 | Total reward = 41.13
2022-01-26 14:17:36.457 | DEBUG    | __main__:trials:24 - Trial = 14594/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.459 | DEBUG    | __main__:trials:29 - Trial = 14594/30000 | Total reward = 48.11
2022-01-26 14:17:36.462 | DEBUG    | __main__:trials:24 - Trial = 14595/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.464 | DEBUG    | __main__:trials:29 - Trial = 14595/30000 | Total reward = 33.04
2022-01-26 14:17:36.467 | DEBUG    | __main__:trials:24 - Trial = 14596/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.468 | DEBUG    | __main__:trials:29 - Trial = 14596/30000 | Total reward = 50.46
2022-01-26 14:17:36.472 | DEBUG    | __main__:trials:24 - Trial = 14597/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.473 | DEBUG    | __main__:trials:29 - Trial = 14597/30000 | Total reward = 47.46
2022-01-26 14:17:36.477 | DEBUG    | __main__:trials:24 - Trial = 14598/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.478 | DEBUG    | __main__:trials:29 - Trial = 14598/30000 | Total reward = 48.92
2022-01-26 14:17:36.482 | DEBUG    | __main__:trials:24 - Trial = 14599/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.483 | DEBUG    | __main__:trials:29 - Trial = 14599/30000 | Total reward = 64.98
2022-01-26 14:17:36.488 | DEBUG    | __main__:trials:24 - Trial = 14600/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.489 | DEBUG    | __main__:trials:29 - Trial = 14600/30000 | Total reward = 64.51
2022-01-26 14:17:36.492 | DEBUG    | __main__:trials:24 - Trial = 14601/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.494 | DEBUG    | __main__:trials:29 - Trial = 14601/30000 | Total reward = 51.42
2022-01-26 14:17:36.497 | DEBUG    | __main__:trials:24 - Trial = 14602/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.498 | DEBUG    | __main__:trials:29 - Trial = 14602/30000 | Total reward = 57.03
2022-01-26 14:17:36.502 | DEBUG    | __main__:trials:24 - Trial = 14603/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.503 | DEBUG    | __main__:trials:29 - Trial = 14603/30000 | Total reward = 53.60
2022-01-26 14:17:36.507 | DEBUG    | __main__:trials:24 - Trial = 14604/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.509 | DEBUG    | __main__:trials:29 - Trial = 14604/30000 | Total reward = 47.46
2022-01-26 14:17:36.512 | DEBUG    | __main__:trials:24 - Trial = 14605/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.514 | DEBUG    | __main__:trials:29 - Trial = 14605/30000 | Total reward = 53.60
2022-01-26 14:17:36.518 | DEBUG    | __main__:trials:24 - Trial = 14606/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.519 | DEBUG    | __main__:trials:29 - Trial = 14606/30000 | Total reward = 63.05
2022-01-26 14:17:36.523 | DEBUG    | __main__:trials:24 - Trial = 14607/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.524 | DEBUG    | __main__:trials:29 - Trial = 14607/30000 | Total reward = 51.72
2022-01-26 14:17:36.528 | DEBUG    | __main__:trials:24 - Trial = 14608/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.530 | DEBUG    | __main__:trials:29 - Trial = 14608/30000 | Total reward = 47.42
2022-01-26 14:17:36.533 | DEBUG    | __main__:trials:24 - Trial = 14609/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.535 | DEBUG    | __main__:trials:29 - Trial = 14609/30000 | Total reward = 49.44
2022-01-26 14:17:36.538 | DEBUG    | __main__:trials:24 - Trial = 14610/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.540 | DEBUG    | __main__:trials:29 - Trial = 14610/30000 | Total reward = 52.26
2022-01-26 14:17:36.544 | DEBUG    | __main__:trials:24 - Trial = 14611/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.545 | DEBUG    | __main__:trials:29 - Trial = 14611/30000 | Total reward = 50.94
2022-01-26 14:17:36.549 | DEBUG    | __main__:trials:24 - Trial = 14612/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.551 | DEBUG    | __main__:trials:29 - Trial = 14612/30000 | Total reward = 66.24
2022-01-26 14:17:36.554 | DEBUG    | __main__:trials:24 - Trial = 14613/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.556 | DEBUG    | __main__:trials:29 - Trial = 14613/30000 | Total reward = 49.88
2022-01-26 14:17:36.560 | DEBUG    | __main__:trials:24 - Trial = 14614/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.560 | DEBUG    | __main__:trials:29 - Trial = 14614/30000 | Total reward = 54.00
2022-01-26 14:17:36.565 | DEBUG    | __main__:trials:24 - Trial = 14615/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.566 | DEBUG    | __main__:trials:29 - Trial = 14615/30000 | Total reward = 51.67
2022-01-26 14:17:36.569 | DEBUG    | __main__:trials:24 - Trial = 14616/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.571 | DEBUG    | __main__:trials:29 - Trial = 14616/30000 | Total reward = 51.71
2022-01-26 14:17:36.574 | DEBUG    | __main__:trials:24 - Trial = 14617/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.576 | DEBUG    | __main__:trials:29 - Trial = 14617/30000 | Total reward = 46.88
2022-01-26 14:17:36.579 | DEBUG    | __main__:trials:24 - Trial = 14618/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.581 | DEBUG    | __main__:trials:29 - Trial = 14618/30000 | Total reward = 53.60
2022-01-26 14:17:36.584 | DEBUG    | __main__:trials:24 - Trial = 14619/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.586 | DEBUG    | __main__:trials:29 - Trial = 14619/30000 | Total reward = 53.60
2022-01-26 14:17:36.589 | DEBUG    | __main__:trials:24 - Trial = 14620/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.591 | DEBUG    | __main__:trials:29 - Trial = 14620/30000 | Total reward = 53.23
2022-01-26 14:17:36.594 | DEBUG    | __main__:trials:24 - Trial = 14621/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.596 | DEBUG    | __main__:trials:29 - Trial = 14621/30000 | Total reward = 52.82
2022-01-26 14:17:36.600 | DEBUG    | __main__:trials:24 - Trial = 14622/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.601 | DEBUG    | __main__:trials:29 - Trial = 14622/30000 | Total reward = 56.45
2022-01-26 14:17:36.605 | DEBUG    | __main__:trials:24 - Trial = 14623/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.607 | DEBUG    | __main__:trials:29 - Trial = 14623/30000 | Total reward = 38.61
2022-01-26 14:17:36.610 | DEBUG    | __main__:trials:24 - Trial = 14624/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.612 | DEBUG    | __main__:trials:29 - Trial = 14624/30000 | Total reward = 38.35
2022-01-26 14:17:36.615 | DEBUG    | __main__:trials:24 - Trial = 14625/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.617 | DEBUG    | __main__:trials:29 - Trial = 14625/30000 | Total reward = 35.56
2022-01-26 14:17:36.620 | DEBUG    | __main__:trials:24 - Trial = 14626/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.621 | DEBUG    | __main__:trials:29 - Trial = 14626/30000 | Total reward = 47.95
2022-01-26 14:17:36.624 | DEBUG    | __main__:trials:24 - Trial = 14627/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.626 | DEBUG    | __main__:trials:29 - Trial = 14627/30000 | Total reward = 54.74
2022-01-26 14:17:36.630 | DEBUG    | __main__:trials:24 - Trial = 14628/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.631 | DEBUG    | __main__:trials:29 - Trial = 14628/30000 | Total reward = 53.36
2022-01-26 14:17:36.635 | DEBUG    | __main__:trials:24 - Trial = 14629/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.637 | DEBUG    | __main__:trials:29 - Trial = 14629/30000 | Total reward = 52.55
2022-01-26 14:17:36.639 | DEBUG    | __main__:trials:24 - Trial = 14630/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.641 | DEBUG    | __main__:trials:29 - Trial = 14630/30000 | Total reward = 51.97
2022-01-26 14:17:36.644 | DEBUG    | __main__:trials:24 - Trial = 14631/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.646 | DEBUG    | __main__:trials:29 - Trial = 14631/30000 | Total reward = 45.10
2022-01-26 14:17:36.650 | DEBUG    | __main__:trials:24 - Trial = 14632/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.651 | DEBUG    | __main__:trials:29 - Trial = 14632/30000 | Total reward = 47.35
2022-01-26 14:17:36.655 | DEBUG    | __main__:trials:24 - Trial = 14633/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.656 | DEBUG    | __main__:trials:29 - Trial = 14633/30000 | Total reward = 52.03
2022-01-26 14:17:36.659 | DEBUG    | __main__:trials:24 - Trial = 14634/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.661 | DEBUG    | __main__:trials:29 - Trial = 14634/30000 | Total reward = 48.78
2022-01-26 14:17:36.664 | DEBUG    | __main__:trials:24 - Trial = 14635/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.666 | DEBUG    | __main__:trials:29 - Trial = 14635/30000 | Total reward = 45.17
2022-01-26 14:17:36.670 | DEBUG    | __main__:trials:24 - Trial = 14636/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.671 | DEBUG    | __main__:trials:29 - Trial = 14636/30000 | Total reward = 44.69
2022-01-26 14:17:36.675 | DEBUG    | __main__:trials:24 - Trial = 14637/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.676 | DEBUG    | __main__:trials:29 - Trial = 14637/30000 | Total reward = 46.85
2022-01-26 14:17:36.680 | DEBUG    | __main__:trials:24 - Trial = 14638/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.682 | DEBUG    | __main__:trials:29 - Trial = 14638/30000 | Total reward = 38.59
2022-01-26 14:17:36.685 | DEBUG    | __main__:trials:24 - Trial = 14639/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.687 | DEBUG    | __main__:trials:29 - Trial = 14639/30000 | Total reward = 44.49
2022-01-26 14:17:36.690 | DEBUG    | __main__:trials:24 - Trial = 14640/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.692 | DEBUG    | __main__:trials:29 - Trial = 14640/30000 | Total reward = 36.46
2022-01-26 14:17:36.695 | DEBUG    | __main__:trials:24 - Trial = 14641/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.697 | DEBUG    | __main__:trials:29 - Trial = 14641/30000 | Total reward = 47.75
2022-01-26 14:17:36.700 | DEBUG    | __main__:trials:24 - Trial = 14642/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.701 | DEBUG    | __main__:trials:29 - Trial = 14642/30000 | Total reward = 41.86
2022-01-26 14:17:36.705 | DEBUG    | __main__:trials:24 - Trial = 14643/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.706 | DEBUG    | __main__:trials:29 - Trial = 14643/30000 | Total reward = 48.74
2022-01-26 14:17:36.710 | DEBUG    | __main__:trials:24 - Trial = 14644/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.711 | DEBUG    | __main__:trials:29 - Trial = 14644/30000 | Total reward = 39.67
2022-01-26 14:17:36.714 | DEBUG    | __main__:trials:24 - Trial = 14645/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.716 | DEBUG    | __main__:trials:29 - Trial = 14645/30000 | Total reward = 46.99
2022-01-26 14:17:36.720 | DEBUG    | __main__:trials:24 - Trial = 14646/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.721 | DEBUG    | __main__:trials:29 - Trial = 14646/30000 | Total reward = 46.35
2022-01-26 14:17:36.725 | DEBUG    | __main__:trials:24 - Trial = 14647/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.727 | DEBUG    | __main__:trials:29 - Trial = 14647/30000 | Total reward = 39.35
2022-01-26 14:17:36.730 | DEBUG    | __main__:trials:24 - Trial = 14648/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.731 | DEBUG    | __main__:trials:29 - Trial = 14648/30000 | Total reward = 40.95
2022-01-26 14:17:36.735 | DEBUG    | __main__:trials:24 - Trial = 14649/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.736 | DEBUG    | __main__:trials:29 - Trial = 14649/30000 | Total reward = 33.51
2022-01-26 14:17:36.740 | DEBUG    | __main__:trials:24 - Trial = 14650/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.741 | DEBUG    | __main__:trials:29 - Trial = 14650/30000 | Total reward = 37.57
2022-01-26 14:17:36.744 | DEBUG    | __main__:trials:24 - Trial = 14651/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.745 | DEBUG    | __main__:trials:29 - Trial = 14651/30000 | Total reward = 53.50
2022-01-26 14:17:36.749 | DEBUG    | __main__:trials:24 - Trial = 14652/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.750 | DEBUG    | __main__:trials:29 - Trial = 14652/30000 | Total reward = 46.97
2022-01-26 14:17:36.753 | DEBUG    | __main__:trials:24 - Trial = 14653/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.754 | DEBUG    | __main__:trials:29 - Trial = 14653/30000 | Total reward = 33.62
2022-01-26 14:17:36.757 | DEBUG    | __main__:trials:24 - Trial = 14654/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.757 | DEBUG    | __main__:trials:29 - Trial = 14654/30000 | Total reward = 45.59
2022-01-26 14:17:36.762 | DEBUG    | __main__:trials:24 - Trial = 14655/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.762 | DEBUG    | __main__:trials:29 - Trial = 14655/30000 | Total reward = 46.46
2022-01-26 14:17:36.767 | DEBUG    | __main__:trials:24 - Trial = 14656/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.768 | DEBUG    | __main__:trials:29 - Trial = 14656/30000 | Total reward = 39.60
2022-01-26 14:17:36.772 | DEBUG    | __main__:trials:24 - Trial = 14657/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.773 | DEBUG    | __main__:trials:29 - Trial = 14657/30000 | Total reward = 39.61
2022-01-26 14:17:36.776 | DEBUG    | __main__:trials:24 - Trial = 14658/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.777 | DEBUG    | __main__:trials:29 - Trial = 14658/30000 | Total reward = 42.11
2022-01-26 14:17:36.780 | DEBUG    | __main__:trials:26 - Trial = 14659/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:36.781 | DEBUG    | __main__:trials:29 - Trial = 14659/30000 | Total reward = 20.15
2022-01-26 14:17:36.784 | DEBUG    | __main__:trials:24 - Trial = 14660/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.786 | DEBUG    | __main__:trials:29 - Trial = 14660/30000 | Total reward = 45.36
2022-01-26 14:17:36.790 | DEBUG    | __main__:trials:24 - Trial = 14661/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.791 | DEBUG    | __main__:trials:29 - Trial = 14661/30000 | Total reward = 34.89
2022-01-26 14:17:36.794 | DEBUG    | __main__:trials:24 - Trial = 14662/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.796 | DEBUG    | __main__:trials:29 - Trial = 14662/30000 | Total reward = 45.86
2022-01-26 14:17:36.799 | DEBUG    | __main__:trials:24 - Trial = 14663/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.801 | DEBUG    | __main__:trials:29 - Trial = 14663/30000 | Total reward = 45.98
2022-01-26 14:17:36.804 | DEBUG    | __main__:trials:24 - Trial = 14664/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.806 | DEBUG    | __main__:trials:29 - Trial = 14664/30000 | Total reward = 46.87
2022-01-26 14:17:36.810 | DEBUG    | __main__:trials:24 - Trial = 14665/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.811 | DEBUG    | __main__:trials:29 - Trial = 14665/30000 | Total reward = 43.51
2022-01-26 14:17:36.815 | DEBUG    | __main__:trials:24 - Trial = 14666/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.816 | DEBUG    | __main__:trials:29 - Trial = 14666/30000 | Total reward = 45.28
2022-01-26 14:17:36.820 | DEBUG    | __main__:trials:24 - Trial = 14667/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.821 | DEBUG    | __main__:trials:29 - Trial = 14667/30000 | Total reward = 40.84
2022-01-26 14:17:36.824 | DEBUG    | __main__:trials:24 - Trial = 14668/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.826 | DEBUG    | __main__:trials:29 - Trial = 14668/30000 | Total reward = 37.89
2022-01-26 14:17:36.830 | DEBUG    | __main__:trials:24 - Trial = 14669/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.831 | DEBUG    | __main__:trials:29 - Trial = 14669/30000 | Total reward = 48.40
2022-01-26 14:17:36.835 | DEBUG    | __main__:trials:24 - Trial = 14670/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.837 | DEBUG    | __main__:trials:29 - Trial = 14670/30000 | Total reward = 47.05
2022-01-26 14:17:36.840 | DEBUG    | __main__:trials:24 - Trial = 14671/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.842 | DEBUG    | __main__:trials:29 - Trial = 14671/30000 | Total reward = 41.17
2022-01-26 14:17:36.845 | DEBUG    | __main__:trials:26 - Trial = 14672/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:36.846 | DEBUG    | __main__:trials:29 - Trial = 14672/30000 | Total reward = 35.84
2022-01-26 14:17:36.850 | DEBUG    | __main__:trials:24 - Trial = 14673/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.853 | DEBUG    | __main__:trials:29 - Trial = 14673/30000 | Total reward = 50.93
2022-01-26 14:17:36.856 | DEBUG    | __main__:trials:24 - Trial = 14674/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.858 | DEBUG    | __main__:trials:29 - Trial = 14674/30000 | Total reward = 44.40
2022-01-26 14:17:36.861 | DEBUG    | __main__:trials:24 - Trial = 14675/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.862 | DEBUG    | __main__:trials:29 - Trial = 14675/30000 | Total reward = 42.89
2022-01-26 14:17:36.865 | DEBUG    | __main__:trials:24 - Trial = 14676/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.865 | DEBUG    | __main__:trials:29 - Trial = 14676/30000 | Total reward = 49.59
2022-01-26 14:17:36.870 | DEBUG    | __main__:trials:24 - Trial = 14677/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.870 | DEBUG    | __main__:trials:29 - Trial = 14677/30000 | Total reward = 59.20
2022-01-26 14:17:36.874 | DEBUG    | __main__:trials:24 - Trial = 14678/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.876 | DEBUG    | __main__:trials:29 - Trial = 14678/30000 | Total reward = 43.75
2022-01-26 14:17:36.879 | DEBUG    | __main__:trials:24 - Trial = 14679/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.881 | DEBUG    | __main__:trials:29 - Trial = 14679/30000 | Total reward = 37.17
2022-01-26 14:17:36.884 | DEBUG    | __main__:trials:24 - Trial = 14680/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.886 | DEBUG    | __main__:trials:29 - Trial = 14680/30000 | Total reward = 47.86
2022-01-26 14:17:36.889 | DEBUG    | __main__:trials:24 - Trial = 14681/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.890 | DEBUG    | __main__:trials:29 - Trial = 14681/30000 | Total reward = 43.61
2022-01-26 14:17:36.894 | DEBUG    | __main__:trials:24 - Trial = 14682/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.895 | DEBUG    | __main__:trials:29 - Trial = 14682/30000 | Total reward = 44.07
2022-01-26 14:17:36.898 | DEBUG    | __main__:trials:24 - Trial = 14683/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.900 | DEBUG    | __main__:trials:29 - Trial = 14683/30000 | Total reward = 42.68
2022-01-26 14:17:36.903 | DEBUG    | __main__:trials:24 - Trial = 14684/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.905 | DEBUG    | __main__:trials:29 - Trial = 14684/30000 | Total reward = 52.32
2022-01-26 14:17:36.909 | DEBUG    | __main__:trials:24 - Trial = 14685/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.909 | DEBUG    | __main__:trials:29 - Trial = 14685/30000 | Total reward = 44.56
2022-01-26 14:17:36.912 | DEBUG    | __main__:trials:24 - Trial = 14686/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.913 | DEBUG    | __main__:trials:29 - Trial = 14686/30000 | Total reward = 47.11
2022-01-26 14:17:36.917 | DEBUG    | __main__:trials:24 - Trial = 14687/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.918 | DEBUG    | __main__:trials:29 - Trial = 14687/30000 | Total reward = 47.05
2022-01-26 14:17:36.921 | DEBUG    | __main__:trials:24 - Trial = 14688/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.923 | DEBUG    | __main__:trials:29 - Trial = 14688/30000 | Total reward = 26.41
2022-01-26 14:17:36.927 | DEBUG    | __main__:trials:24 - Trial = 14689/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.927 | DEBUG    | __main__:trials:29 - Trial = 14689/30000 | Total reward = 47.60
2022-01-26 14:17:36.931 | DEBUG    | __main__:trials:24 - Trial = 14690/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.931 | DEBUG    | __main__:trials:29 - Trial = 14690/30000 | Total reward = 47.05
2022-01-26 14:17:36.935 | DEBUG    | __main__:trials:24 - Trial = 14691/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.936 | DEBUG    | __main__:trials:29 - Trial = 14691/30000 | Total reward = 40.86
2022-01-26 14:17:36.940 | DEBUG    | __main__:trials:24 - Trial = 14692/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.941 | DEBUG    | __main__:trials:29 - Trial = 14692/30000 | Total reward = 47.55
2022-01-26 14:17:36.945 | DEBUG    | __main__:trials:24 - Trial = 14693/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.946 | DEBUG    | __main__:trials:29 - Trial = 14693/30000 | Total reward = 48.76
2022-01-26 14:17:36.950 | DEBUG    | __main__:trials:24 - Trial = 14694/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.951 | DEBUG    | __main__:trials:29 - Trial = 14694/30000 | Total reward = 51.38
2022-01-26 14:17:36.955 | DEBUG    | __main__:trials:24 - Trial = 14695/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.956 | DEBUG    | __main__:trials:29 - Trial = 14695/30000 | Total reward = 46.76
2022-01-26 14:17:36.960 | DEBUG    | __main__:trials:24 - Trial = 14696/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.962 | DEBUG    | __main__:trials:29 - Trial = 14696/30000 | Total reward = 65.73
2022-01-26 14:17:36.966 | DEBUG    | __main__:trials:24 - Trial = 14697/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.967 | DEBUG    | __main__:trials:29 - Trial = 14697/30000 | Total reward = 46.08
2022-01-26 14:17:36.971 | DEBUG    | __main__:trials:24 - Trial = 14698/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.971 | DEBUG    | __main__:trials:29 - Trial = 14698/30000 | Total reward = 42.24
2022-01-26 14:17:36.976 | DEBUG    | __main__:trials:24 - Trial = 14699/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.977 | DEBUG    | __main__:trials:29 - Trial = 14699/30000 | Total reward = 47.41
2022-01-26 14:17:36.980 | DEBUG    | __main__:trials:24 - Trial = 14700/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.982 | DEBUG    | __main__:trials:29 - Trial = 14700/30000 | Total reward = 39.79
2022-01-26 14:17:36.986 | DEBUG    | __main__:trials:24 - Trial = 14701/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.987 | DEBUG    | __main__:trials:29 - Trial = 14701/30000 | Total reward = 44.02
2022-01-26 14:17:36.990 | DEBUG    | __main__:trials:24 - Trial = 14702/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.992 | DEBUG    | __main__:trials:29 - Trial = 14702/30000 | Total reward = 46.61
2022-01-26 14:17:36.995 | DEBUG    | __main__:trials:24 - Trial = 14703/30000 | Max number of steps (20) reached
2022-01-26 14:17:36.996 | DEBUG    | __main__:trials:29 - Trial = 14703/30000 | Total reward = 45.92
2022-01-26 14:17:37.000 | DEBUG    | __main__:trials:24 - Trial = 14704/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.002 | DEBUG    | __main__:trials:29 - Trial = 14704/30000 | Total reward = 63.40
2022-01-26 14:17:37.005 | DEBUG    | __main__:trials:24 - Trial = 14705/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.006 | DEBUG    | __main__:trials:29 - Trial = 14705/30000 | Total reward = 47.46
2022-01-26 14:17:37.010 | DEBUG    | __main__:trials:24 - Trial = 14706/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.012 | DEBUG    | __main__:trials:29 - Trial = 14706/30000 | Total reward = 43.25
2022-01-26 14:17:37.015 | DEBUG    | __main__:trials:24 - Trial = 14707/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.016 | DEBUG    | __main__:trials:29 - Trial = 14707/30000 | Total reward = 40.02
2022-01-26 14:17:37.020 | DEBUG    | __main__:trials:24 - Trial = 14708/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.022 | DEBUG    | __main__:trials:29 - Trial = 14708/30000 | Total reward = 51.40
2022-01-26 14:17:37.025 | DEBUG    | __main__:trials:24 - Trial = 14709/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.027 | DEBUG    | __main__:trials:29 - Trial = 14709/30000 | Total reward = 38.99
2022-01-26 14:17:37.030 | DEBUG    | __main__:trials:24 - Trial = 14710/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.032 | DEBUG    | __main__:trials:29 - Trial = 14710/30000 | Total reward = 32.37
2022-01-26 14:17:37.035 | DEBUG    | __main__:trials:24 - Trial = 14711/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.037 | DEBUG    | __main__:trials:29 - Trial = 14711/30000 | Total reward = 29.50
2022-01-26 14:17:37.040 | DEBUG    | __main__:trials:24 - Trial = 14712/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.041 | DEBUG    | __main__:trials:29 - Trial = 14712/30000 | Total reward = 42.69
2022-01-26 14:17:37.045 | DEBUG    | __main__:trials:24 - Trial = 14713/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.045 | DEBUG    | __main__:trials:29 - Trial = 14713/30000 | Total reward = 36.25
2022-01-26 14:17:37.049 | DEBUG    | __main__:trials:24 - Trial = 14714/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.051 | DEBUG    | __main__:trials:29 - Trial = 14714/30000 | Total reward = 39.45
2022-01-26 14:17:37.055 | DEBUG    | __main__:trials:24 - Trial = 14715/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.055 | DEBUG    | __main__:trials:29 - Trial = 14715/30000 | Total reward = 42.68
2022-01-26 14:17:37.060 | DEBUG    | __main__:trials:24 - Trial = 14716/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.060 | DEBUG    | __main__:trials:29 - Trial = 14716/30000 | Total reward = 33.05
2022-01-26 14:17:37.065 | DEBUG    | __main__:trials:24 - Trial = 14717/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.066 | DEBUG    | __main__:trials:29 - Trial = 14717/30000 | Total reward = 44.44
2022-01-26 14:17:37.070 | DEBUG    | __main__:trials:24 - Trial = 14718/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.071 | DEBUG    | __main__:trials:29 - Trial = 14718/30000 | Total reward = 40.92
2022-01-26 14:17:37.074 | DEBUG    | __main__:trials:24 - Trial = 14719/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.075 | DEBUG    | __main__:trials:29 - Trial = 14719/30000 | Total reward = 47.02
2022-01-26 14:17:37.079 | DEBUG    | __main__:trials:24 - Trial = 14720/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.081 | DEBUG    | __main__:trials:29 - Trial = 14720/30000 | Total reward = 39.47
2022-01-26 14:17:37.084 | DEBUG    | __main__:trials:24 - Trial = 14721/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.085 | DEBUG    | __main__:trials:29 - Trial = 14721/30000 | Total reward = 31.27
2022-01-26 14:17:37.089 | DEBUG    | __main__:trials:24 - Trial = 14722/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.090 | DEBUG    | __main__:trials:29 - Trial = 14722/30000 | Total reward = 39.13
2022-01-26 14:17:37.094 | DEBUG    | __main__:trials:24 - Trial = 14723/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.095 | DEBUG    | __main__:trials:29 - Trial = 14723/30000 | Total reward = 39.89
2022-01-26 14:17:37.099 | DEBUG    | __main__:trials:24 - Trial = 14724/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.100 | DEBUG    | __main__:trials:29 - Trial = 14724/30000 | Total reward = 48.24
2022-01-26 14:17:37.104 | DEBUG    | __main__:trials:24 - Trial = 14725/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.106 | DEBUG    | __main__:trials:29 - Trial = 14725/30000 | Total reward = 35.59
2022-01-26 14:17:37.109 | DEBUG    | __main__:trials:24 - Trial = 14726/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.111 | DEBUG    | __main__:trials:29 - Trial = 14726/30000 | Total reward = 40.92
2022-01-26 14:17:37.115 | DEBUG    | __main__:trials:24 - Trial = 14727/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.117 | DEBUG    | __main__:trials:29 - Trial = 14727/30000 | Total reward = 38.92
2022-01-26 14:17:37.120 | DEBUG    | __main__:trials:24 - Trial = 14728/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.121 | DEBUG    | __main__:trials:29 - Trial = 14728/30000 | Total reward = 39.68
2022-01-26 14:17:37.125 | DEBUG    | __main__:trials:24 - Trial = 14729/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.125 | DEBUG    | __main__:trials:29 - Trial = 14729/30000 | Total reward = 42.06
2022-01-26 14:17:37.129 | DEBUG    | __main__:trials:24 - Trial = 14730/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.130 | DEBUG    | __main__:trials:29 - Trial = 14730/30000 | Total reward = 35.47
2022-01-26 14:17:37.134 | DEBUG    | __main__:trials:24 - Trial = 14731/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.135 | DEBUG    | __main__:trials:29 - Trial = 14731/30000 | Total reward = 55.15
2022-01-26 14:17:37.139 | DEBUG    | __main__:trials:24 - Trial = 14732/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.141 | DEBUG    | __main__:trials:29 - Trial = 14732/30000 | Total reward = 32.85
2022-01-26 14:17:37.144 | DEBUG    | __main__:trials:24 - Trial = 14733/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.145 | DEBUG    | __main__:trials:29 - Trial = 14733/30000 | Total reward = 39.97
2022-01-26 14:17:37.149 | DEBUG    | __main__:trials:24 - Trial = 14734/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.151 | DEBUG    | __main__:trials:29 - Trial = 14734/30000 | Total reward = 37.77
2022-01-26 14:17:37.155 | DEBUG    | __main__:trials:24 - Trial = 14735/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.156 | DEBUG    | __main__:trials:29 - Trial = 14735/30000 | Total reward = 47.20
2022-01-26 14:17:37.159 | DEBUG    | __main__:trials:24 - Trial = 14736/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.161 | DEBUG    | __main__:trials:29 - Trial = 14736/30000 | Total reward = 33.43
2022-01-26 14:17:37.164 | DEBUG    | __main__:trials:24 - Trial = 14737/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.166 | DEBUG    | __main__:trials:29 - Trial = 14737/30000 | Total reward = 39.68
2022-01-26 14:17:37.169 | DEBUG    | __main__:trials:24 - Trial = 14738/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.170 | DEBUG    | __main__:trials:29 - Trial = 14738/30000 | Total reward = 46.09
2022-01-26 14:17:37.173 | DEBUG    | __main__:trials:24 - Trial = 14739/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.174 | DEBUG    | __main__:trials:29 - Trial = 14739/30000 | Total reward = 40.63
2022-01-26 14:17:37.177 | DEBUG    | __main__:trials:24 - Trial = 14740/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.178 | DEBUG    | __main__:trials:29 - Trial = 14740/30000 | Total reward = 36.95
2022-01-26 14:17:37.181 | DEBUG    | __main__:trials:24 - Trial = 14741/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.183 | DEBUG    | __main__:trials:29 - Trial = 14741/30000 | Total reward = 35.61
2022-01-26 14:17:37.186 | DEBUG    | __main__:trials:24 - Trial = 14742/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.188 | DEBUG    | __main__:trials:29 - Trial = 14742/30000 | Total reward = 47.45
2022-01-26 14:17:37.192 | DEBUG    | __main__:trials:24 - Trial = 14743/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.193 | DEBUG    | __main__:trials:29 - Trial = 14743/30000 | Total reward = 40.45
2022-01-26 14:17:37.197 | DEBUG    | __main__:trials:24 - Trial = 14744/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.198 | DEBUG    | __main__:trials:29 - Trial = 14744/30000 | Total reward = 30.70
2022-01-26 14:17:37.202 | DEBUG    | __main__:trials:24 - Trial = 14745/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.204 | DEBUG    | __main__:trials:29 - Trial = 14745/30000 | Total reward = 50.54
2022-01-26 14:17:37.208 | DEBUG    | __main__:trials:24 - Trial = 14746/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.208 | DEBUG    | __main__:trials:29 - Trial = 14746/30000 | Total reward = 42.71
2022-01-26 14:17:37.212 | DEBUG    | __main__:trials:24 - Trial = 14747/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.214 | DEBUG    | __main__:trials:29 - Trial = 14747/30000 | Total reward = 38.50
2022-01-26 14:17:37.218 | DEBUG    | __main__:trials:24 - Trial = 14748/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.219 | DEBUG    | __main__:trials:29 - Trial = 14748/30000 | Total reward = 38.92
2022-01-26 14:17:37.223 | DEBUG    | __main__:trials:24 - Trial = 14749/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.225 | DEBUG    | __main__:trials:29 - Trial = 14749/30000 | Total reward = 44.17
2022-01-26 14:17:37.228 | DEBUG    | __main__:trials:24 - Trial = 14750/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.229 | DEBUG    | __main__:trials:29 - Trial = 14750/30000 | Total reward = 46.59
2022-01-26 14:17:37.234 | DEBUG    | __main__:trials:24 - Trial = 14751/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.235 | DEBUG    | __main__:trials:29 - Trial = 14751/30000 | Total reward = 41.26
2022-01-26 14:17:37.239 | DEBUG    | __main__:trials:24 - Trial = 14752/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.241 | DEBUG    | __main__:trials:29 - Trial = 14752/30000 | Total reward = 29.35
2022-01-26 14:17:37.244 | DEBUG    | __main__:trials:24 - Trial = 14753/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.245 | DEBUG    | __main__:trials:29 - Trial = 14753/30000 | Total reward = 42.69
2022-01-26 14:17:37.250 | DEBUG    | __main__:trials:24 - Trial = 14754/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.251 | DEBUG    | __main__:trials:29 - Trial = 14754/30000 | Total reward = 43.55
2022-01-26 14:17:37.255 | DEBUG    | __main__:trials:24 - Trial = 14755/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.256 | DEBUG    | __main__:trials:29 - Trial = 14755/30000 | Total reward = 43.30
2022-01-26 14:17:37.260 | DEBUG    | __main__:trials:24 - Trial = 14756/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.261 | DEBUG    | __main__:trials:29 - Trial = 14756/30000 | Total reward = 46.69
2022-01-26 14:17:37.265 | DEBUG    | __main__:trials:24 - Trial = 14757/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.267 | DEBUG    | __main__:trials:29 - Trial = 14757/30000 | Total reward = 41.43
2022-01-26 14:17:37.272 | DEBUG    | __main__:trials:24 - Trial = 14758/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.274 | DEBUG    | __main__:trials:29 - Trial = 14758/30000 | Total reward = 42.67
2022-01-26 14:17:37.277 | DEBUG    | __main__:trials:24 - Trial = 14759/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.278 | DEBUG    | __main__:trials:29 - Trial = 14759/30000 | Total reward = 38.80
2022-01-26 14:17:37.283 | DEBUG    | __main__:trials:24 - Trial = 14760/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.285 | DEBUG    | __main__:trials:29 - Trial = 14760/30000 | Total reward = 38.45
2022-01-26 14:17:37.288 | DEBUG    | __main__:trials:24 - Trial = 14761/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.289 | DEBUG    | __main__:trials:29 - Trial = 14761/30000 | Total reward = 39.37
2022-01-26 14:17:37.293 | DEBUG    | __main__:trials:24 - Trial = 14762/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.293 | DEBUG    | __main__:trials:29 - Trial = 14762/30000 | Total reward = 35.85
2022-01-26 14:17:37.298 | DEBUG    | __main__:trials:24 - Trial = 14763/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.299 | DEBUG    | __main__:trials:29 - Trial = 14763/30000 | Total reward = 39.12
2022-01-26 14:17:37.303 | DEBUG    | __main__:trials:24 - Trial = 14764/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.304 | DEBUG    | __main__:trials:29 - Trial = 14764/30000 | Total reward = 39.61
2022-01-26 14:17:37.308 | DEBUG    | __main__:trials:24 - Trial = 14765/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.309 | DEBUG    | __main__:trials:29 - Trial = 14765/30000 | Total reward = 39.77
2022-01-26 14:17:37.314 | DEBUG    | __main__:trials:24 - Trial = 14766/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.315 | DEBUG    | __main__:trials:29 - Trial = 14766/30000 | Total reward = 38.54
2022-01-26 14:17:37.319 | DEBUG    | __main__:trials:24 - Trial = 14767/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.321 | DEBUG    | __main__:trials:29 - Trial = 14767/30000 | Total reward = 37.79
2022-01-26 14:17:37.324 | DEBUG    | __main__:trials:24 - Trial = 14768/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.326 | DEBUG    | __main__:trials:29 - Trial = 14768/30000 | Total reward = 35.00
2022-01-26 14:17:37.330 | DEBUG    | __main__:trials:24 - Trial = 14769/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.331 | DEBUG    | __main__:trials:29 - Trial = 14769/30000 | Total reward = 39.40
2022-01-26 14:17:37.335 | DEBUG    | __main__:trials:24 - Trial = 14770/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.336 | DEBUG    | __main__:trials:29 - Trial = 14770/30000 | Total reward = 40.04
2022-01-26 14:17:37.340 | DEBUG    | __main__:trials:24 - Trial = 14771/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.342 | DEBUG    | __main__:trials:29 - Trial = 14771/30000 | Total reward = 40.39
2022-01-26 14:17:37.346 | DEBUG    | __main__:trials:24 - Trial = 14772/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.347 | DEBUG    | __main__:trials:29 - Trial = 14772/30000 | Total reward = 40.14
2022-01-26 14:17:37.351 | DEBUG    | __main__:trials:24 - Trial = 14773/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.352 | DEBUG    | __main__:trials:29 - Trial = 14773/30000 | Total reward = 47.07
2022-01-26 14:17:37.355 | DEBUG    | __main__:trials:24 - Trial = 14774/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.357 | DEBUG    | __main__:trials:29 - Trial = 14774/30000 | Total reward = 46.61
2022-01-26 14:17:37.361 | DEBUG    | __main__:trials:24 - Trial = 14775/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.362 | DEBUG    | __main__:trials:29 - Trial = 14775/30000 | Total reward = 47.92
2022-01-26 14:17:37.366 | DEBUG    | __main__:trials:24 - Trial = 14776/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.367 | DEBUG    | __main__:trials:29 - Trial = 14776/30000 | Total reward = 39.50
2022-01-26 14:17:37.371 | DEBUG    | __main__:trials:24 - Trial = 14777/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.372 | DEBUG    | __main__:trials:29 - Trial = 14777/30000 | Total reward = 47.47
2022-01-26 14:17:37.376 | DEBUG    | __main__:trials:24 - Trial = 14778/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.377 | DEBUG    | __main__:trials:29 - Trial = 14778/30000 | Total reward = 38.15
2022-01-26 14:17:37.380 | DEBUG    | __main__:trials:24 - Trial = 14779/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.382 | DEBUG    | __main__:trials:29 - Trial = 14779/30000 | Total reward = 42.28
2022-01-26 14:17:37.386 | DEBUG    | __main__:trials:24 - Trial = 14780/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.387 | DEBUG    | __main__:trials:29 - Trial = 14780/30000 | Total reward = 47.41
2022-01-26 14:17:37.390 | DEBUG    | __main__:trials:24 - Trial = 14781/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.391 | DEBUG    | __main__:trials:29 - Trial = 14781/30000 | Total reward = 40.73
2022-01-26 14:17:37.394 | DEBUG    | __main__:trials:24 - Trial = 14782/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.396 | DEBUG    | __main__:trials:29 - Trial = 14782/30000 | Total reward = 44.77
2022-01-26 14:17:37.400 | DEBUG    | __main__:trials:24 - Trial = 14783/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.400 | DEBUG    | __main__:trials:29 - Trial = 14783/30000 | Total reward = 55.53
2022-01-26 14:17:37.404 | DEBUG    | __main__:trials:24 - Trial = 14784/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.405 | DEBUG    | __main__:trials:29 - Trial = 14784/30000 | Total reward = 32.25
2022-01-26 14:17:37.408 | DEBUG    | __main__:trials:24 - Trial = 14785/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.410 | DEBUG    | __main__:trials:29 - Trial = 14785/30000 | Total reward = 34.48
2022-01-26 14:17:37.414 | DEBUG    | __main__:trials:24 - Trial = 14786/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.415 | DEBUG    | __main__:trials:29 - Trial = 14786/30000 | Total reward = 37.07
2022-01-26 14:17:37.418 | DEBUG    | __main__:trials:24 - Trial = 14787/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.420 | DEBUG    | __main__:trials:29 - Trial = 14787/30000 | Total reward = 33.04
2022-01-26 14:17:37.423 | DEBUG    | __main__:trials:24 - Trial = 14788/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.424 | DEBUG    | __main__:trials:29 - Trial = 14788/30000 | Total reward = 44.25
2022-01-26 14:17:37.427 | DEBUG    | __main__:trials:24 - Trial = 14789/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.429 | DEBUG    | __main__:trials:29 - Trial = 14789/30000 | Total reward = 41.50
2022-01-26 14:17:37.432 | DEBUG    | __main__:trials:24 - Trial = 14790/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.433 | DEBUG    | __main__:trials:29 - Trial = 14790/30000 | Total reward = 41.84
2022-01-26 14:17:37.436 | DEBUG    | __main__:trials:24 - Trial = 14791/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.438 | DEBUG    | __main__:trials:29 - Trial = 14791/30000 | Total reward = 40.50
2022-01-26 14:17:37.441 | DEBUG    | __main__:trials:24 - Trial = 14792/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.442 | DEBUG    | __main__:trials:29 - Trial = 14792/30000 | Total reward = 38.37
2022-01-26 14:17:37.445 | DEBUG    | __main__:trials:24 - Trial = 14793/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.446 | DEBUG    | __main__:trials:29 - Trial = 14793/30000 | Total reward = 42.36
2022-01-26 14:17:37.449 | DEBUG    | __main__:trials:24 - Trial = 14794/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.450 | DEBUG    | __main__:trials:29 - Trial = 14794/30000 | Total reward = 37.01
2022-01-26 14:17:37.453 | DEBUG    | __main__:trials:24 - Trial = 14795/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.454 | DEBUG    | __main__:trials:29 - Trial = 14795/30000 | Total reward = 38.07
2022-01-26 14:17:37.458 | DEBUG    | __main__:trials:24 - Trial = 14796/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.458 | DEBUG    | __main__:trials:29 - Trial = 14796/30000 | Total reward = 39.99
2022-01-26 14:17:37.462 | DEBUG    | __main__:trials:24 - Trial = 14797/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.463 | DEBUG    | __main__:trials:29 - Trial = 14797/30000 | Total reward = 38.99
2022-01-26 14:17:37.466 | DEBUG    | __main__:trials:24 - Trial = 14798/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.468 | DEBUG    | __main__:trials:29 - Trial = 14798/30000 | Total reward = 36.12
2022-01-26 14:17:37.471 | DEBUG    | __main__:trials:24 - Trial = 14799/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.473 | DEBUG    | __main__:trials:29 - Trial = 14799/30000 | Total reward = 38.67
2022-01-26 14:17:37.476 | DEBUG    | __main__:trials:24 - Trial = 14800/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.477 | DEBUG    | __main__:trials:29 - Trial = 14800/30000 | Total reward = 38.17
2022-01-26 14:17:37.480 | DEBUG    | __main__:trials:24 - Trial = 14801/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.482 | DEBUG    | __main__:trials:29 - Trial = 14801/30000 | Total reward = 38.21
2022-01-26 14:17:37.485 | DEBUG    | __main__:trials:24 - Trial = 14802/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.487 | DEBUG    | __main__:trials:29 - Trial = 14802/30000 | Total reward = 41.77
2022-01-26 14:17:37.490 | DEBUG    | __main__:trials:24 - Trial = 14803/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.490 | DEBUG    | __main__:trials:29 - Trial = 14803/30000 | Total reward = 32.88
2022-01-26 14:17:37.494 | DEBUG    | __main__:trials:24 - Trial = 14804/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.494 | DEBUG    | __main__:trials:29 - Trial = 14804/30000 | Total reward = 36.33
2022-01-26 14:17:37.498 | DEBUG    | __main__:trials:24 - Trial = 14805/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.498 | DEBUG    | __main__:trials:29 - Trial = 14805/30000 | Total reward = 39.26
2022-01-26 14:17:37.502 | DEBUG    | __main__:trials:24 - Trial = 14806/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.504 | DEBUG    | __main__:trials:29 - Trial = 14806/30000 | Total reward = 40.10
2022-01-26 14:17:37.507 | DEBUG    | __main__:trials:24 - Trial = 14807/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.507 | DEBUG    | __main__:trials:29 - Trial = 14807/30000 | Total reward = 24.65
2022-01-26 14:17:37.511 | DEBUG    | __main__:trials:24 - Trial = 14808/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.513 | DEBUG    | __main__:trials:29 - Trial = 14808/30000 | Total reward = 40.61
2022-01-26 14:17:37.516 | DEBUG    | __main__:trials:24 - Trial = 14809/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.517 | DEBUG    | __main__:trials:29 - Trial = 14809/30000 | Total reward = 35.42
2022-01-26 14:17:37.520 | DEBUG    | __main__:trials:24 - Trial = 14810/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.522 | DEBUG    | __main__:trials:29 - Trial = 14810/30000 | Total reward = 41.38
2022-01-26 14:17:37.525 | DEBUG    | __main__:trials:24 - Trial = 14811/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.526 | DEBUG    | __main__:trials:29 - Trial = 14811/30000 | Total reward = 35.19
2022-01-26 14:17:37.529 | DEBUG    | __main__:trials:24 - Trial = 14812/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.530 | DEBUG    | __main__:trials:29 - Trial = 14812/30000 | Total reward = 38.59
2022-01-26 14:17:37.534 | DEBUG    | __main__:trials:24 - Trial = 14813/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.534 | DEBUG    | __main__:trials:29 - Trial = 14813/30000 | Total reward = 38.75
2022-01-26 14:17:37.538 | DEBUG    | __main__:trials:24 - Trial = 14814/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.539 | DEBUG    | __main__:trials:29 - Trial = 14814/30000 | Total reward = 36.25
2022-01-26 14:17:37.542 | DEBUG    | __main__:trials:24 - Trial = 14815/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.544 | DEBUG    | __main__:trials:29 - Trial = 14815/30000 | Total reward = 37.88
2022-01-26 14:17:37.547 | DEBUG    | __main__:trials:24 - Trial = 14816/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.549 | DEBUG    | __main__:trials:29 - Trial = 14816/30000 | Total reward = 32.82
2022-01-26 14:17:37.552 | DEBUG    | __main__:trials:24 - Trial = 14817/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.552 | DEBUG    | __main__:trials:29 - Trial = 14817/30000 | Total reward = 38.90
2022-01-26 14:17:37.556 | DEBUG    | __main__:trials:24 - Trial = 14818/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.556 | DEBUG    | __main__:trials:29 - Trial = 14818/30000 | Total reward = 38.99
2022-01-26 14:17:37.560 | DEBUG    | __main__:trials:24 - Trial = 14819/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.561 | DEBUG    | __main__:trials:29 - Trial = 14819/30000 | Total reward = 50.03
2022-01-26 14:17:37.564 | DEBUG    | __main__:trials:24 - Trial = 14820/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.566 | DEBUG    | __main__:trials:29 - Trial = 14820/30000 | Total reward = 42.78
2022-01-26 14:17:37.569 | DEBUG    | __main__:trials:24 - Trial = 14821/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.570 | DEBUG    | __main__:trials:29 - Trial = 14821/30000 | Total reward = 40.54
2022-01-26 14:17:37.574 | DEBUG    | __main__:trials:24 - Trial = 14822/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.576 | DEBUG    | __main__:trials:29 - Trial = 14822/30000 | Total reward = 40.25
2022-01-26 14:17:37.578 | DEBUG    | __main__:trials:24 - Trial = 14823/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.580 | DEBUG    | __main__:trials:29 - Trial = 14823/30000 | Total reward = 35.18
2022-01-26 14:17:37.583 | DEBUG    | __main__:trials:24 - Trial = 14824/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.585 | DEBUG    | __main__:trials:29 - Trial = 14824/30000 | Total reward = 44.75
2022-01-26 14:17:37.588 | DEBUG    | __main__:trials:24 - Trial = 14825/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.589 | DEBUG    | __main__:trials:29 - Trial = 14825/30000 | Total reward = 39.04
2022-01-26 14:17:37.592 | DEBUG    | __main__:trials:24 - Trial = 14826/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.594 | DEBUG    | __main__:trials:29 - Trial = 14826/30000 | Total reward = 25.73
2022-01-26 14:17:37.597 | DEBUG    | __main__:trials:24 - Trial = 14827/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.597 | DEBUG    | __main__:trials:29 - Trial = 14827/30000 | Total reward = 37.76
2022-01-26 14:17:37.601 | DEBUG    | __main__:trials:24 - Trial = 14828/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.601 | DEBUG    | __main__:trials:29 - Trial = 14828/30000 | Total reward = 51.88
2022-01-26 14:17:37.605 | DEBUG    | __main__:trials:24 - Trial = 14829/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.606 | DEBUG    | __main__:trials:29 - Trial = 14829/30000 | Total reward = 36.88
2022-01-26 14:17:37.610 | DEBUG    | __main__:trials:24 - Trial = 14830/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.610 | DEBUG    | __main__:trials:29 - Trial = 14830/30000 | Total reward = 42.61
2022-01-26 14:17:37.614 | DEBUG    | __main__:trials:24 - Trial = 14831/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.614 | DEBUG    | __main__:trials:29 - Trial = 14831/30000 | Total reward = 38.02
2022-01-26 14:17:37.618 | DEBUG    | __main__:trials:24 - Trial = 14832/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.618 | DEBUG    | __main__:trials:29 - Trial = 14832/30000 | Total reward = 38.60
2022-01-26 14:17:37.622 | DEBUG    | __main__:trials:24 - Trial = 14833/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.624 | DEBUG    | __main__:trials:29 - Trial = 14833/30000 | Total reward = 37.34
2022-01-26 14:17:37.627 | DEBUG    | __main__:trials:26 - Trial = 14834/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:37.628 | DEBUG    | __main__:trials:29 - Trial = 14834/30000 | Total reward = 30.05
2022-01-26 14:17:37.631 | DEBUG    | __main__:trials:24 - Trial = 14835/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.633 | DEBUG    | __main__:trials:29 - Trial = 14835/30000 | Total reward = 38.96
2022-01-26 14:17:37.636 | DEBUG    | __main__:trials:24 - Trial = 14836/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.637 | DEBUG    | __main__:trials:29 - Trial = 14836/30000 | Total reward = 45.68
2022-01-26 14:17:37.640 | DEBUG    | __main__:trials:24 - Trial = 14837/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.642 | DEBUG    | __main__:trials:29 - Trial = 14837/30000 | Total reward = 46.79
2022-01-26 14:17:37.645 | DEBUG    | __main__:trials:24 - Trial = 14838/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.646 | DEBUG    | __main__:trials:29 - Trial = 14838/30000 | Total reward = 44.77
2022-01-26 14:17:37.650 | DEBUG    | __main__:trials:24 - Trial = 14839/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.652 | DEBUG    | __main__:trials:29 - Trial = 14839/30000 | Total reward = 47.45
2022-01-26 14:17:37.654 | DEBUG    | __main__:trials:24 - Trial = 14840/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.656 | DEBUG    | __main__:trials:29 - Trial = 14840/30000 | Total reward = 45.82
2022-01-26 14:17:37.659 | DEBUG    | __main__:trials:24 - Trial = 14841/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.661 | DEBUG    | __main__:trials:29 - Trial = 14841/30000 | Total reward = 41.44
2022-01-26 14:17:37.663 | DEBUG    | __main__:trials:24 - Trial = 14842/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.664 | DEBUG    | __main__:trials:29 - Trial = 14842/30000 | Total reward = 45.78
2022-01-26 14:17:37.667 | DEBUG    | __main__:trials:24 - Trial = 14843/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.669 | DEBUG    | __main__:trials:29 - Trial = 14843/30000 | Total reward = 44.43
2022-01-26 14:17:37.672 | DEBUG    | __main__:trials:24 - Trial = 14844/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.674 | DEBUG    | __main__:trials:29 - Trial = 14844/30000 | Total reward = 47.52
2022-01-26 14:17:37.677 | DEBUG    | __main__:trials:24 - Trial = 14845/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.677 | DEBUG    | __main__:trials:29 - Trial = 14845/30000 | Total reward = 47.05
2022-01-26 14:17:37.680 | DEBUG    | __main__:trials:26 - Trial = 14846/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:37.681 | DEBUG    | __main__:trials:29 - Trial = 14846/30000 | Total reward = 26.13
2022-01-26 14:17:37.684 | DEBUG    | __main__:trials:24 - Trial = 14847/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.685 | DEBUG    | __main__:trials:29 - Trial = 14847/30000 | Total reward = 42.90
2022-01-26 14:17:37.688 | DEBUG    | __main__:trials:24 - Trial = 14848/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.690 | DEBUG    | __main__:trials:29 - Trial = 14848/30000 | Total reward = 44.69
2022-01-26 14:17:37.693 | DEBUG    | __main__:trials:24 - Trial = 14849/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.694 | DEBUG    | __main__:trials:29 - Trial = 14849/30000 | Total reward = 38.23
2022-01-26 14:17:37.697 | DEBUG    | __main__:trials:24 - Trial = 14850/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.698 | DEBUG    | __main__:trials:29 - Trial = 14850/30000 | Total reward = 47.66
2022-01-26 14:17:37.701 | DEBUG    | __main__:trials:24 - Trial = 14851/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.701 | DEBUG    | __main__:trials:29 - Trial = 14851/30000 | Total reward = 47.46
2022-01-26 14:17:37.705 | DEBUG    | __main__:trials:24 - Trial = 14852/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.706 | DEBUG    | __main__:trials:29 - Trial = 14852/30000 | Total reward = 50.08
2022-01-26 14:17:37.709 | DEBUG    | __main__:trials:24 - Trial = 14853/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.710 | DEBUG    | __main__:trials:29 - Trial = 14853/30000 | Total reward = 47.05
2022-01-26 14:17:37.713 | DEBUG    | __main__:trials:24 - Trial = 14854/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.714 | DEBUG    | __main__:trials:29 - Trial = 14854/30000 | Total reward = 47.05
2022-01-26 14:17:37.718 | DEBUG    | __main__:trials:24 - Trial = 14855/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.718 | DEBUG    | __main__:trials:29 - Trial = 14855/30000 | Total reward = 40.69
2022-01-26 14:17:37.722 | DEBUG    | __main__:trials:24 - Trial = 14856/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.724 | DEBUG    | __main__:trials:29 - Trial = 14856/30000 | Total reward = 43.81
2022-01-26 14:17:37.727 | DEBUG    | __main__:trials:24 - Trial = 14857/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.728 | DEBUG    | __main__:trials:29 - Trial = 14857/30000 | Total reward = 40.50
2022-01-26 14:17:37.731 | DEBUG    | __main__:trials:24 - Trial = 14858/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.733 | DEBUG    | __main__:trials:29 - Trial = 14858/30000 | Total reward = 50.63
2022-01-26 14:17:37.736 | DEBUG    | __main__:trials:24 - Trial = 14859/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.738 | DEBUG    | __main__:trials:29 - Trial = 14859/30000 | Total reward = 43.38
2022-01-26 14:17:37.741 | DEBUG    | __main__:trials:24 - Trial = 14860/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.743 | DEBUG    | __main__:trials:29 - Trial = 14860/30000 | Total reward = 48.21
2022-01-26 14:17:37.746 | DEBUG    | __main__:trials:24 - Trial = 14861/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.747 | DEBUG    | __main__:trials:29 - Trial = 14861/30000 | Total reward = 40.05
2022-01-26 14:17:37.751 | DEBUG    | __main__:trials:24 - Trial = 14862/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.753 | DEBUG    | __main__:trials:29 - Trial = 14862/30000 | Total reward = 40.14
2022-01-26 14:17:37.756 | DEBUG    | __main__:trials:24 - Trial = 14863/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.757 | DEBUG    | __main__:trials:29 - Trial = 14863/30000 | Total reward = 45.09
2022-01-26 14:17:37.761 | DEBUG    | __main__:trials:24 - Trial = 14864/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.762 | DEBUG    | __main__:trials:29 - Trial = 14864/30000 | Total reward = 37.07
2022-01-26 14:17:37.766 | DEBUG    | __main__:trials:24 - Trial = 14865/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.767 | DEBUG    | __main__:trials:29 - Trial = 14865/30000 | Total reward = 45.07
2022-01-26 14:17:37.770 | DEBUG    | __main__:trials:24 - Trial = 14866/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.771 | DEBUG    | __main__:trials:29 - Trial = 14866/30000 | Total reward = 44.95
2022-01-26 14:17:37.774 | DEBUG    | __main__:trials:24 - Trial = 14867/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.775 | DEBUG    | __main__:trials:29 - Trial = 14867/30000 | Total reward = 49.00
2022-01-26 14:17:37.778 | DEBUG    | __main__:trials:24 - Trial = 14868/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.779 | DEBUG    | __main__:trials:29 - Trial = 14868/30000 | Total reward = 42.97
2022-01-26 14:17:37.782 | DEBUG    | __main__:trials:24 - Trial = 14869/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.783 | DEBUG    | __main__:trials:29 - Trial = 14869/30000 | Total reward = 52.11
2022-01-26 14:17:37.787 | DEBUG    | __main__:trials:24 - Trial = 14870/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.789 | DEBUG    | __main__:trials:29 - Trial = 14870/30000 | Total reward = 48.36
2022-01-26 14:17:37.792 | DEBUG    | __main__:trials:24 - Trial = 14871/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.794 | DEBUG    | __main__:trials:29 - Trial = 14871/30000 | Total reward = 46.30
2022-01-26 14:17:37.798 | DEBUG    | __main__:trials:24 - Trial = 14872/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.799 | DEBUG    | __main__:trials:29 - Trial = 14872/30000 | Total reward = 43.89
2022-01-26 14:17:37.803 | DEBUG    | __main__:trials:24 - Trial = 14873/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.804 | DEBUG    | __main__:trials:29 - Trial = 14873/30000 | Total reward = 52.26
2022-01-26 14:17:37.808 | DEBUG    | __main__:trials:24 - Trial = 14874/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.810 | DEBUG    | __main__:trials:29 - Trial = 14874/30000 | Total reward = 43.09
2022-01-26 14:17:37.814 | DEBUG    | __main__:trials:24 - Trial = 14875/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.815 | DEBUG    | __main__:trials:29 - Trial = 14875/30000 | Total reward = 39.59
2022-01-26 14:17:37.819 | DEBUG    | __main__:trials:24 - Trial = 14876/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.820 | DEBUG    | __main__:trials:29 - Trial = 14876/30000 | Total reward = 41.88
2022-01-26 14:17:37.823 | DEBUG    | __main__:trials:24 - Trial = 14877/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.825 | DEBUG    | __main__:trials:29 - Trial = 14877/30000 | Total reward = 46.95
2022-01-26 14:17:37.829 | DEBUG    | __main__:trials:24 - Trial = 14878/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.830 | DEBUG    | __main__:trials:29 - Trial = 14878/30000 | Total reward = 36.30
2022-01-26 14:17:37.834 | DEBUG    | __main__:trials:24 - Trial = 14879/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.834 | DEBUG    | __main__:trials:29 - Trial = 14879/30000 | Total reward = 41.92
2022-01-26 14:17:37.839 | DEBUG    | __main__:trials:24 - Trial = 14880/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.840 | DEBUG    | __main__:trials:29 - Trial = 14880/30000 | Total reward = 41.06
2022-01-26 14:17:37.844 | DEBUG    | __main__:trials:24 - Trial = 14881/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.845 | DEBUG    | __main__:trials:29 - Trial = 14881/30000 | Total reward = 47.52
2022-01-26 14:17:37.849 | DEBUG    | __main__:trials:24 - Trial = 14882/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.851 | DEBUG    | __main__:trials:29 - Trial = 14882/30000 | Total reward = 50.81
2022-01-26 14:17:37.855 | DEBUG    | __main__:trials:24 - Trial = 14883/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.855 | DEBUG    | __main__:trials:29 - Trial = 14883/30000 | Total reward = 44.70
2022-01-26 14:17:37.860 | DEBUG    | __main__:trials:24 - Trial = 14884/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.862 | DEBUG    | __main__:trials:29 - Trial = 14884/30000 | Total reward = 47.58
2022-01-26 14:17:37.864 | DEBUG    | __main__:trials:24 - Trial = 14885/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.866 | DEBUG    | __main__:trials:29 - Trial = 14885/30000 | Total reward = 37.27
2022-01-26 14:17:37.870 | DEBUG    | __main__:trials:24 - Trial = 14886/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.871 | DEBUG    | __main__:trials:29 - Trial = 14886/30000 | Total reward = 64.77
2022-01-26 14:17:37.875 | DEBUG    | __main__:trials:24 - Trial = 14887/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.875 | DEBUG    | __main__:trials:29 - Trial = 14887/30000 | Total reward = 50.08
2022-01-26 14:17:37.880 | DEBUG    | __main__:trials:24 - Trial = 14888/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.881 | DEBUG    | __main__:trials:29 - Trial = 14888/30000 | Total reward = 47.29
2022-01-26 14:17:37.885 | DEBUG    | __main__:trials:24 - Trial = 14889/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.887 | DEBUG    | __main__:trials:29 - Trial = 14889/30000 | Total reward = 38.75
2022-01-26 14:17:37.890 | DEBUG    | __main__:trials:24 - Trial = 14890/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.891 | DEBUG    | __main__:trials:29 - Trial = 14890/30000 | Total reward = 41.62
2022-01-26 14:17:37.895 | DEBUG    | __main__:trials:24 - Trial = 14891/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.896 | DEBUG    | __main__:trials:29 - Trial = 14891/30000 | Total reward = 41.43
2022-01-26 14:17:37.900 | DEBUG    | __main__:trials:24 - Trial = 14892/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.902 | DEBUG    | __main__:trials:29 - Trial = 14892/30000 | Total reward = 47.05
2022-01-26 14:17:37.905 | DEBUG    | __main__:trials:24 - Trial = 14893/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.907 | DEBUG    | __main__:trials:29 - Trial = 14893/30000 | Total reward = 38.02
2022-01-26 14:17:37.911 | DEBUG    | __main__:trials:24 - Trial = 14894/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.912 | DEBUG    | __main__:trials:29 - Trial = 14894/30000 | Total reward = 63.93
2022-01-26 14:17:37.916 | DEBUG    | __main__:trials:24 - Trial = 14895/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.917 | DEBUG    | __main__:trials:29 - Trial = 14895/30000 | Total reward = 41.40
2022-01-26 14:17:37.921 | DEBUG    | __main__:trials:24 - Trial = 14896/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.922 | DEBUG    | __main__:trials:29 - Trial = 14896/30000 | Total reward = 40.50
2022-01-26 14:17:37.925 | DEBUG    | __main__:trials:24 - Trial = 14897/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.926 | DEBUG    | __main__:trials:29 - Trial = 14897/30000 | Total reward = 44.39
2022-01-26 14:17:37.930 | DEBUG    | __main__:trials:24 - Trial = 14898/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.930 | DEBUG    | __main__:trials:29 - Trial = 14898/30000 | Total reward = 34.81
2022-01-26 14:17:37.934 | DEBUG    | __main__:trials:24 - Trial = 14899/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.936 | DEBUG    | __main__:trials:29 - Trial = 14899/30000 | Total reward = 39.67
2022-01-26 14:17:37.939 | DEBUG    | __main__:trials:24 - Trial = 14900/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.939 | DEBUG    | __main__:trials:29 - Trial = 14900/30000 | Total reward = 65.92
2022-01-26 14:17:37.943 | DEBUG    | __main__:trials:24 - Trial = 14901/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.945 | DEBUG    | __main__:trials:29 - Trial = 14901/30000 | Total reward = 44.59
2022-01-26 14:17:37.948 | DEBUG    | __main__:trials:24 - Trial = 14902/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.949 | DEBUG    | __main__:trials:29 - Trial = 14902/30000 | Total reward = 46.61
2022-01-26 14:17:37.953 | DEBUG    | __main__:trials:24 - Trial = 14903/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.954 | DEBUG    | __main__:trials:29 - Trial = 14903/30000 | Total reward = 47.49
2022-01-26 14:17:37.958 | DEBUG    | __main__:trials:24 - Trial = 14904/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.959 | DEBUG    | __main__:trials:29 - Trial = 14904/30000 | Total reward = 48.11
2022-01-26 14:17:37.963 | DEBUG    | __main__:trials:24 - Trial = 14905/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.964 | DEBUG    | __main__:trials:29 - Trial = 14905/30000 | Total reward = 43.24
2022-01-26 14:17:37.968 | DEBUG    | __main__:trials:24 - Trial = 14906/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.969 | DEBUG    | __main__:trials:29 - Trial = 14906/30000 | Total reward = 47.46
2022-01-26 14:17:37.972 | DEBUG    | __main__:trials:24 - Trial = 14907/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.974 | DEBUG    | __main__:trials:29 - Trial = 14907/30000 | Total reward = 40.99
2022-01-26 14:17:37.977 | DEBUG    | __main__:trials:26 - Trial = 14908/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:37.978 | DEBUG    | __main__:trials:29 - Trial = 14908/30000 | Total reward = 33.52
2022-01-26 14:17:37.981 | DEBUG    | __main__:trials:24 - Trial = 14909/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.983 | DEBUG    | __main__:trials:29 - Trial = 14909/30000 | Total reward = 47.05
2022-01-26 14:17:37.987 | DEBUG    | __main__:trials:24 - Trial = 14910/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.989 | DEBUG    | __main__:trials:29 - Trial = 14910/30000 | Total reward = 36.86
2022-01-26 14:17:37.991 | DEBUG    | __main__:trials:24 - Trial = 14911/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.993 | DEBUG    | __main__:trials:29 - Trial = 14911/30000 | Total reward = 38.93
2022-01-26 14:17:37.997 | DEBUG    | __main__:trials:24 - Trial = 14912/30000 | Max number of steps (20) reached
2022-01-26 14:17:37.997 | DEBUG    | __main__:trials:29 - Trial = 14912/30000 | Total reward = 42.19
2022-01-26 14:17:38.001 | DEBUG    | __main__:trials:24 - Trial = 14913/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.002 | DEBUG    | __main__:trials:29 - Trial = 14913/30000 | Total reward = 46.47
2022-01-26 14:17:38.005 | DEBUG    | __main__:trials:24 - Trial = 14914/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.006 | DEBUG    | __main__:trials:29 - Trial = 14914/30000 | Total reward = 40.76
2022-01-26 14:17:38.010 | DEBUG    | __main__:trials:24 - Trial = 14915/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.011 | DEBUG    | __main__:trials:29 - Trial = 14915/30000 | Total reward = 47.85
2022-01-26 14:17:38.015 | DEBUG    | __main__:trials:24 - Trial = 14916/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.017 | DEBUG    | __main__:trials:29 - Trial = 14916/30000 | Total reward = 38.54
2022-01-26 14:17:38.020 | DEBUG    | __main__:trials:24 - Trial = 14917/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.021 | DEBUG    | __main__:trials:29 - Trial = 14917/30000 | Total reward = 45.24
2022-01-26 14:17:38.025 | DEBUG    | __main__:trials:24 - Trial = 14918/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.026 | DEBUG    | __main__:trials:29 - Trial = 14918/30000 | Total reward = 44.07
2022-01-26 14:17:38.029 | DEBUG    | __main__:trials:24 - Trial = 14919/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.030 | DEBUG    | __main__:trials:29 - Trial = 14919/30000 | Total reward = 43.08
2022-01-26 14:17:38.034 | DEBUG    | __main__:trials:24 - Trial = 14920/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.036 | DEBUG    | __main__:trials:29 - Trial = 14920/30000 | Total reward = 52.06
2022-01-26 14:17:38.039 | DEBUG    | __main__:trials:24 - Trial = 14921/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.040 | DEBUG    | __main__:trials:29 - Trial = 14921/30000 | Total reward = 41.18
2022-01-26 14:17:38.043 | DEBUG    | __main__:trials:24 - Trial = 14922/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.045 | DEBUG    | __main__:trials:29 - Trial = 14922/30000 | Total reward = 45.61
2022-01-26 14:17:38.048 | DEBUG    | __main__:trials:24 - Trial = 14923/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.050 | DEBUG    | __main__:trials:29 - Trial = 14923/30000 | Total reward = 44.64
2022-01-26 14:17:38.054 | DEBUG    | __main__:trials:26 - Trial = 14924/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:38.055 | DEBUG    | __main__:trials:29 - Trial = 14924/30000 | Total reward = 39.56
2022-01-26 14:17:38.059 | DEBUG    | __main__:trials:24 - Trial = 14925/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.060 | DEBUG    | __main__:trials:29 - Trial = 14925/30000 | Total reward = 45.08
2022-01-26 14:17:38.064 | DEBUG    | __main__:trials:24 - Trial = 14926/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.065 | DEBUG    | __main__:trials:29 - Trial = 14926/30000 | Total reward = 36.54
2022-01-26 14:17:38.069 | DEBUG    | __main__:trials:24 - Trial = 14927/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.071 | DEBUG    | __main__:trials:29 - Trial = 14927/30000 | Total reward = 47.05
2022-01-26 14:17:38.074 | DEBUG    | __main__:trials:24 - Trial = 14928/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.075 | DEBUG    | __main__:trials:29 - Trial = 14928/30000 | Total reward = 49.83
2022-01-26 14:17:38.079 | DEBUG    | __main__:trials:24 - Trial = 14929/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.080 | DEBUG    | __main__:trials:29 - Trial = 14929/30000 | Total reward = 45.61
2022-01-26 14:17:38.084 | DEBUG    | __main__:trials:24 - Trial = 14930/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.085 | DEBUG    | __main__:trials:29 - Trial = 14930/30000 | Total reward = 50.34
2022-01-26 14:17:38.089 | DEBUG    | __main__:trials:24 - Trial = 14931/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.091 | DEBUG    | __main__:trials:29 - Trial = 14931/30000 | Total reward = 45.24
2022-01-26 14:17:38.094 | DEBUG    | __main__:trials:24 - Trial = 14932/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.096 | DEBUG    | __main__:trials:29 - Trial = 14932/30000 | Total reward = 53.23
2022-01-26 14:17:38.099 | DEBUG    | __main__:trials:24 - Trial = 14933/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.100 | DEBUG    | __main__:trials:29 - Trial = 14933/30000 | Total reward = 45.90
2022-01-26 14:17:38.104 | DEBUG    | __main__:trials:24 - Trial = 14934/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.106 | DEBUG    | __main__:trials:29 - Trial = 14934/30000 | Total reward = 47.20
2022-01-26 14:17:38.109 | DEBUG    | __main__:trials:24 - Trial = 14935/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.111 | DEBUG    | __main__:trials:29 - Trial = 14935/30000 | Total reward = 35.38
2022-01-26 14:17:38.114 | DEBUG    | __main__:trials:24 - Trial = 14936/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.116 | DEBUG    | __main__:trials:29 - Trial = 14936/30000 | Total reward = 43.57
2022-01-26 14:17:38.120 | DEBUG    | __main__:trials:24 - Trial = 14937/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.120 | DEBUG    | __main__:trials:29 - Trial = 14937/30000 | Total reward = 37.20
2022-01-26 14:17:38.124 | DEBUG    | __main__:trials:24 - Trial = 14938/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.126 | DEBUG    | __main__:trials:29 - Trial = 14938/30000 | Total reward = 41.97
2022-01-26 14:17:38.129 | DEBUG    | __main__:trials:24 - Trial = 14939/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.130 | DEBUG    | __main__:trials:29 - Trial = 14939/30000 | Total reward = 40.31
2022-01-26 14:17:38.135 | DEBUG    | __main__:trials:24 - Trial = 14940/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.136 | DEBUG    | __main__:trials:29 - Trial = 14940/30000 | Total reward = 44.07
2022-01-26 14:17:38.140 | DEBUG    | __main__:trials:24 - Trial = 14941/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.141 | DEBUG    | __main__:trials:29 - Trial = 14941/30000 | Total reward = 44.03
2022-01-26 14:17:38.145 | DEBUG    | __main__:trials:24 - Trial = 14942/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.146 | DEBUG    | __main__:trials:29 - Trial = 14942/30000 | Total reward = 45.91
2022-01-26 14:17:38.150 | DEBUG    | __main__:trials:24 - Trial = 14943/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.151 | DEBUG    | __main__:trials:29 - Trial = 14943/30000 | Total reward = 46.24
2022-01-26 14:17:38.154 | DEBUG    | __main__:trials:24 - Trial = 14944/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.155 | DEBUG    | __main__:trials:29 - Trial = 14944/30000 | Total reward = 43.83
2022-01-26 14:17:38.158 | DEBUG    | __main__:trials:24 - Trial = 14945/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.160 | DEBUG    | __main__:trials:29 - Trial = 14945/30000 | Total reward = 44.64
2022-01-26 14:17:38.163 | DEBUG    | __main__:trials:24 - Trial = 14946/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.164 | DEBUG    | __main__:trials:29 - Trial = 14946/30000 | Total reward = 42.33
2022-01-26 14:17:38.167 | DEBUG    | __main__:trials:24 - Trial = 14947/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.169 | DEBUG    | __main__:trials:29 - Trial = 14947/30000 | Total reward = 47.23
2022-01-26 14:17:38.172 | DEBUG    | __main__:trials:24 - Trial = 14948/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.174 | DEBUG    | __main__:trials:29 - Trial = 14948/30000 | Total reward = 43.80
2022-01-26 14:17:38.178 | DEBUG    | __main__:trials:24 - Trial = 14949/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.179 | DEBUG    | __main__:trials:29 - Trial = 14949/30000 | Total reward = 47.05
2022-01-26 14:17:38.183 | DEBUG    | __main__:trials:24 - Trial = 14950/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.184 | DEBUG    | __main__:trials:29 - Trial = 14950/30000 | Total reward = 39.70
2022-01-26 14:17:38.188 | DEBUG    | __main__:trials:24 - Trial = 14951/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.189 | DEBUG    | __main__:trials:29 - Trial = 14951/30000 | Total reward = 47.20
2022-01-26 14:17:38.193 | DEBUG    | __main__:trials:24 - Trial = 14952/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.194 | DEBUG    | __main__:trials:29 - Trial = 14952/30000 | Total reward = 46.84
2022-01-26 14:17:38.199 | DEBUG    | __main__:trials:24 - Trial = 14953/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.200 | DEBUG    | __main__:trials:29 - Trial = 14953/30000 | Total reward = 45.15
2022-01-26 14:17:38.204 | DEBUG    | __main__:trials:24 - Trial = 14954/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.205 | DEBUG    | __main__:trials:29 - Trial = 14954/30000 | Total reward = 39.79
2022-01-26 14:17:38.209 | DEBUG    | __main__:trials:24 - Trial = 14955/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.210 | DEBUG    | __main__:trials:29 - Trial = 14955/30000 | Total reward = 59.99
2022-01-26 14:17:38.214 | DEBUG    | __main__:trials:24 - Trial = 14956/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.216 | DEBUG    | __main__:trials:29 - Trial = 14956/30000 | Total reward = 45.77
2022-01-26 14:17:38.219 | DEBUG    | __main__:trials:24 - Trial = 14957/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.221 | DEBUG    | __main__:trials:29 - Trial = 14957/30000 | Total reward = 45.62
2022-01-26 14:17:38.224 | DEBUG    | __main__:trials:24 - Trial = 14958/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.225 | DEBUG    | __main__:trials:29 - Trial = 14958/30000 | Total reward = 52.45
2022-01-26 14:17:38.228 | DEBUG    | __main__:trials:24 - Trial = 14959/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.229 | DEBUG    | __main__:trials:29 - Trial = 14959/30000 | Total reward = 52.41
2022-01-26 14:17:38.233 | DEBUG    | __main__:trials:24 - Trial = 14960/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.234 | DEBUG    | __main__:trials:29 - Trial = 14960/30000 | Total reward = 46.13
2022-01-26 14:17:38.238 | DEBUG    | __main__:trials:24 - Trial = 14961/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.239 | DEBUG    | __main__:trials:29 - Trial = 14961/30000 | Total reward = 52.64
2022-01-26 14:17:38.243 | DEBUG    | __main__:trials:24 - Trial = 14962/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.245 | DEBUG    | __main__:trials:29 - Trial = 14962/30000 | Total reward = 35.58
2022-01-26 14:17:38.248 | DEBUG    | __main__:trials:24 - Trial = 14963/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.250 | DEBUG    | __main__:trials:29 - Trial = 14963/30000 | Total reward = 48.19
2022-01-26 14:17:38.253 | DEBUG    | __main__:trials:24 - Trial = 14964/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.254 | DEBUG    | __main__:trials:29 - Trial = 14964/30000 | Total reward = 36.03
2022-01-26 14:17:38.258 | DEBUG    | __main__:trials:24 - Trial = 14965/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.260 | DEBUG    | __main__:trials:29 - Trial = 14965/30000 | Total reward = 47.05
2022-01-26 14:17:38.264 | DEBUG    | __main__:trials:24 - Trial = 14966/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.265 | DEBUG    | __main__:trials:29 - Trial = 14966/30000 | Total reward = 38.80
2022-01-26 14:17:38.269 | DEBUG    | __main__:trials:24 - Trial = 14967/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.271 | DEBUG    | __main__:trials:29 - Trial = 14967/30000 | Total reward = 46.24
2022-01-26 14:17:38.274 | DEBUG    | __main__:trials:24 - Trial = 14968/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.275 | DEBUG    | __main__:trials:29 - Trial = 14968/30000 | Total reward = 46.06
2022-01-26 14:17:38.279 | DEBUG    | __main__:trials:24 - Trial = 14969/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.281 | DEBUG    | __main__:trials:29 - Trial = 14969/30000 | Total reward = 45.11
2022-01-26 14:17:38.284 | DEBUG    | __main__:trials:24 - Trial = 14970/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.286 | DEBUG    | __main__:trials:29 - Trial = 14970/30000 | Total reward = 35.85
2022-01-26 14:17:38.289 | DEBUG    | __main__:trials:24 - Trial = 14971/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.290 | DEBUG    | __main__:trials:29 - Trial = 14971/30000 | Total reward = 51.99
2022-01-26 14:17:38.294 | DEBUG    | __main__:trials:24 - Trial = 14972/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.294 | DEBUG    | __main__:trials:29 - Trial = 14972/30000 | Total reward = 58.78
2022-01-26 14:17:38.299 | DEBUG    | __main__:trials:24 - Trial = 14973/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.300 | DEBUG    | __main__:trials:29 - Trial = 14973/30000 | Total reward = 43.49
2022-01-26 14:17:38.304 | DEBUG    | __main__:trials:24 - Trial = 14974/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.305 | DEBUG    | __main__:trials:29 - Trial = 14974/30000 | Total reward = 49.14
2022-01-26 14:17:38.308 | DEBUG    | __main__:trials:24 - Trial = 14975/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.310 | DEBUG    | __main__:trials:29 - Trial = 14975/30000 | Total reward = 43.47
2022-01-26 14:17:38.314 | DEBUG    | __main__:trials:24 - Trial = 14976/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.315 | DEBUG    | __main__:trials:29 - Trial = 14976/30000 | Total reward = 49.79
2022-01-26 14:17:38.319 | DEBUG    | __main__:trials:24 - Trial = 14977/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.321 | DEBUG    | __main__:trials:29 - Trial = 14977/30000 | Total reward = 47.78
2022-01-26 14:17:38.324 | DEBUG    | __main__:trials:24 - Trial = 14978/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.326 | DEBUG    | __main__:trials:29 - Trial = 14978/30000 | Total reward = 46.06
2022-01-26 14:17:38.330 | DEBUG    | __main__:trials:24 - Trial = 14979/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.331 | DEBUG    | __main__:trials:29 - Trial = 14979/30000 | Total reward = 46.65
2022-01-26 14:17:38.335 | DEBUG    | __main__:trials:26 - Trial = 14980/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:38.336 | DEBUG    | __main__:trials:29 - Trial = 14980/30000 | Total reward = 30.01
2022-01-26 14:17:38.340 | DEBUG    | __main__:trials:24 - Trial = 14981/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.341 | DEBUG    | __main__:trials:29 - Trial = 14981/30000 | Total reward = 56.42
2022-01-26 14:17:38.344 | DEBUG    | __main__:trials:24 - Trial = 14982/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.346 | DEBUG    | __main__:trials:29 - Trial = 14982/30000 | Total reward = 48.04
2022-01-26 14:17:38.350 | DEBUG    | __main__:trials:24 - Trial = 14983/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.351 | DEBUG    | __main__:trials:29 - Trial = 14983/30000 | Total reward = 52.42
2022-01-26 14:17:38.354 | DEBUG    | __main__:trials:24 - Trial = 14984/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.355 | DEBUG    | __main__:trials:29 - Trial = 14984/30000 | Total reward = 47.05
2022-01-26 14:17:38.359 | DEBUG    | __main__:trials:24 - Trial = 14985/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.360 | DEBUG    | __main__:trials:29 - Trial = 14985/30000 | Total reward = 52.55
2022-01-26 14:17:38.364 | DEBUG    | __main__:trials:24 - Trial = 14986/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.365 | DEBUG    | __main__:trials:29 - Trial = 14986/30000 | Total reward = 49.63
2022-01-26 14:17:38.369 | DEBUG    | __main__:trials:24 - Trial = 14987/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.371 | DEBUG    | __main__:trials:29 - Trial = 14987/30000 | Total reward = 38.89
2022-01-26 14:17:38.375 | DEBUG    | __main__:trials:24 - Trial = 14988/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.376 | DEBUG    | __main__:trials:29 - Trial = 14988/30000 | Total reward = 47.89
2022-01-26 14:17:38.380 | DEBUG    | __main__:trials:24 - Trial = 14989/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.381 | DEBUG    | __main__:trials:29 - Trial = 14989/30000 | Total reward = 60.31
2022-01-26 14:17:38.385 | DEBUG    | __main__:trials:24 - Trial = 14990/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.387 | DEBUG    | __main__:trials:29 - Trial = 14990/30000 | Total reward = 45.04
2022-01-26 14:17:38.390 | DEBUG    | __main__:trials:24 - Trial = 14991/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.391 | DEBUG    | __main__:trials:29 - Trial = 14991/30000 | Total reward = 59.82
2022-01-26 14:17:38.395 | DEBUG    | __main__:trials:24 - Trial = 14992/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.396 | DEBUG    | __main__:trials:29 - Trial = 14992/30000 | Total reward = 47.20
2022-01-26 14:17:38.400 | DEBUG    | __main__:trials:24 - Trial = 14993/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.402 | DEBUG    | __main__:trials:29 - Trial = 14993/30000 | Total reward = 43.00
2022-01-26 14:17:38.405 | DEBUG    | __main__:trials:24 - Trial = 14994/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.406 | DEBUG    | __main__:trials:29 - Trial = 14994/30000 | Total reward = 43.70
2022-01-26 14:17:38.411 | DEBUG    | __main__:trials:24 - Trial = 14995/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.412 | DEBUG    | __main__:trials:29 - Trial = 14995/30000 | Total reward = 53.60
2022-01-26 14:17:38.415 | DEBUG    | __main__:trials:24 - Trial = 14996/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.417 | DEBUG    | __main__:trials:29 - Trial = 14996/30000 | Total reward = 47.05
2022-01-26 14:17:38.420 | DEBUG    | __main__:trials:24 - Trial = 14997/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.421 | DEBUG    | __main__:trials:29 - Trial = 14997/30000 | Total reward = 47.33
2022-01-26 14:17:38.424 | DEBUG    | __main__:trials:24 - Trial = 14998/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.425 | DEBUG    | __main__:trials:29 - Trial = 14998/30000 | Total reward = 43.29
2022-01-26 14:17:38.429 | DEBUG    | __main__:trials:24 - Trial = 14999/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.430 | DEBUG    | __main__:trials:29 - Trial = 14999/30000 | Total reward = 46.18
2022-01-26 14:17:38.434 | DEBUG    | __main__:trials:24 - Trial = 15000/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.435 | DEBUG    | __main__:trials:29 - Trial = 15000/30000 | Total reward = 45.00
2022-01-26 14:17:38.439 | DEBUG    | __main__:trials:24 - Trial = 15001/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.440 | DEBUG    | __main__:trials:29 - Trial = 15001/30000 | Total reward = 47.74
2022-01-26 14:17:38.444 | DEBUG    | __main__:trials:24 - Trial = 15002/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.446 | DEBUG    | __main__:trials:29 - Trial = 15002/30000 | Total reward = 44.25
2022-01-26 14:17:38.449 | DEBUG    | __main__:trials:24 - Trial = 15003/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.451 | DEBUG    | __main__:trials:29 - Trial = 15003/30000 | Total reward = 43.56
2022-01-26 14:17:38.454 | DEBUG    | __main__:trials:24 - Trial = 15004/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.456 | DEBUG    | __main__:trials:29 - Trial = 15004/30000 | Total reward = 37.88
2022-01-26 14:17:38.459 | DEBUG    | __main__:trials:24 - Trial = 15005/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.461 | DEBUG    | __main__:trials:29 - Trial = 15005/30000 | Total reward = 37.55
2022-01-26 14:17:38.464 | DEBUG    | __main__:trials:24 - Trial = 15006/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.465 | DEBUG    | __main__:trials:29 - Trial = 15006/30000 | Total reward = 44.69
2022-01-26 14:17:38.469 | DEBUG    | __main__:trials:24 - Trial = 15007/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.470 | DEBUG    | __main__:trials:29 - Trial = 15007/30000 | Total reward = 44.72
2022-01-26 14:17:38.474 | DEBUG    | __main__:trials:24 - Trial = 15008/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.476 | DEBUG    | __main__:trials:29 - Trial = 15008/30000 | Total reward = 54.73
2022-01-26 14:17:38.479 | DEBUG    | __main__:trials:24 - Trial = 15009/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.481 | DEBUG    | __main__:trials:29 - Trial = 15009/30000 | Total reward = 47.05
2022-01-26 14:17:38.484 | DEBUG    | __main__:trials:24 - Trial = 15010/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.485 | DEBUG    | __main__:trials:29 - Trial = 15010/30000 | Total reward = 46.66
2022-01-26 14:17:38.488 | DEBUG    | __main__:trials:24 - Trial = 15011/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.489 | DEBUG    | __main__:trials:29 - Trial = 15011/30000 | Total reward = 54.67
2022-01-26 14:17:38.493 | DEBUG    | __main__:trials:24 - Trial = 15012/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.494 | DEBUG    | __main__:trials:29 - Trial = 15012/30000 | Total reward = 59.85
2022-01-26 14:17:38.498 | DEBUG    | __main__:trials:24 - Trial = 15013/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.498 | DEBUG    | __main__:trials:29 - Trial = 15013/30000 | Total reward = 48.08
2022-01-26 14:17:38.503 | DEBUG    | __main__:trials:24 - Trial = 15014/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.504 | DEBUG    | __main__:trials:29 - Trial = 15014/30000 | Total reward = 42.77
2022-01-26 14:17:38.507 | DEBUG    | __main__:trials:24 - Trial = 15015/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.509 | DEBUG    | __main__:trials:29 - Trial = 15015/30000 | Total reward = 39.01
2022-01-26 14:17:38.512 | DEBUG    | __main__:trials:24 - Trial = 15016/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.514 | DEBUG    | __main__:trials:29 - Trial = 15016/30000 | Total reward = 47.05
2022-01-26 14:17:38.517 | DEBUG    | __main__:trials:24 - Trial = 15017/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.518 | DEBUG    | __main__:trials:29 - Trial = 15017/30000 | Total reward = 48.04
2022-01-26 14:17:38.522 | DEBUG    | __main__:trials:24 - Trial = 15018/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.523 | DEBUG    | __main__:trials:29 - Trial = 15018/30000 | Total reward = 38.86
2022-01-26 14:17:38.527 | DEBUG    | __main__:trials:24 - Trial = 15019/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.528 | DEBUG    | __main__:trials:29 - Trial = 15019/30000 | Total reward = 42.44
2022-01-26 14:17:38.532 | DEBUG    | __main__:trials:24 - Trial = 15020/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.533 | DEBUG    | __main__:trials:29 - Trial = 15020/30000 | Total reward = 36.60
2022-01-26 14:17:38.537 | DEBUG    | __main__:trials:24 - Trial = 15021/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.539 | DEBUG    | __main__:trials:29 - Trial = 15021/30000 | Total reward = 61.55
2022-01-26 14:17:38.542 | DEBUG    | __main__:trials:24 - Trial = 15022/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.544 | DEBUG    | __main__:trials:29 - Trial = 15022/30000 | Total reward = 50.18
2022-01-26 14:17:38.548 | DEBUG    | __main__:trials:24 - Trial = 15023/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.549 | DEBUG    | __main__:trials:29 - Trial = 15023/30000 | Total reward = 40.69
2022-01-26 14:17:38.552 | DEBUG    | __main__:trials:24 - Trial = 15024/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.554 | DEBUG    | __main__:trials:29 - Trial = 15024/30000 | Total reward = 36.68
2022-01-26 14:17:38.558 | DEBUG    | __main__:trials:24 - Trial = 15025/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.560 | DEBUG    | __main__:trials:29 - Trial = 15025/30000 | Total reward = 38.26
2022-01-26 14:17:38.563 | DEBUG    | __main__:trials:24 - Trial = 15026/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.564 | DEBUG    | __main__:trials:29 - Trial = 15026/30000 | Total reward = 45.98
2022-01-26 14:17:38.568 | DEBUG    | __main__:trials:24 - Trial = 15027/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.570 | DEBUG    | __main__:trials:29 - Trial = 15027/30000 | Total reward = 45.94
2022-01-26 14:17:38.573 | DEBUG    | __main__:trials:24 - Trial = 15028/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.575 | DEBUG    | __main__:trials:29 - Trial = 15028/30000 | Total reward = 53.39
2022-01-26 14:17:38.579 | DEBUG    | __main__:trials:24 - Trial = 15029/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.580 | DEBUG    | __main__:trials:29 - Trial = 15029/30000 | Total reward = 45.01
2022-01-26 14:17:38.585 | DEBUG    | __main__:trials:24 - Trial = 15030/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.586 | DEBUG    | __main__:trials:29 - Trial = 15030/30000 | Total reward = 39.60
2022-01-26 14:17:38.590 | DEBUG    | __main__:trials:24 - Trial = 15031/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.590 | DEBUG    | __main__:trials:29 - Trial = 15031/30000 | Total reward = 25.44
2022-01-26 14:17:38.594 | DEBUG    | __main__:trials:24 - Trial = 15032/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.595 | DEBUG    | __main__:trials:29 - Trial = 15032/30000 | Total reward = 42.35
2022-01-26 14:17:38.598 | DEBUG    | __main__:trials:24 - Trial = 15033/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.599 | DEBUG    | __main__:trials:29 - Trial = 15033/30000 | Total reward = 44.30
2022-01-26 14:17:38.603 | DEBUG    | __main__:trials:24 - Trial = 15034/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.605 | DEBUG    | __main__:trials:29 - Trial = 15034/30000 | Total reward = 48.44
2022-01-26 14:17:38.607 | DEBUG    | __main__:trials:24 - Trial = 15035/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.609 | DEBUG    | __main__:trials:29 - Trial = 15035/30000 | Total reward = 46.61
2022-01-26 14:17:38.613 | DEBUG    | __main__:trials:24 - Trial = 15036/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.614 | DEBUG    | __main__:trials:29 - Trial = 15036/30000 | Total reward = 45.79
2022-01-26 14:17:38.617 | DEBUG    | __main__:trials:24 - Trial = 15037/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.619 | DEBUG    | __main__:trials:29 - Trial = 15037/30000 | Total reward = 47.24
2022-01-26 14:17:38.622 | DEBUG    | __main__:trials:24 - Trial = 15038/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.624 | DEBUG    | __main__:trials:29 - Trial = 15038/30000 | Total reward = 35.93
2022-01-26 14:17:38.627 | DEBUG    | __main__:trials:24 - Trial = 15039/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.628 | DEBUG    | __main__:trials:29 - Trial = 15039/30000 | Total reward = 48.29
2022-01-26 14:17:38.633 | DEBUG    | __main__:trials:24 - Trial = 15040/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.633 | DEBUG    | __main__:trials:29 - Trial = 15040/30000 | Total reward = 47.12
2022-01-26 14:17:38.637 | DEBUG    | __main__:trials:24 - Trial = 15041/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.638 | DEBUG    | __main__:trials:29 - Trial = 15041/30000 | Total reward = 41.51
2022-01-26 14:17:38.641 | DEBUG    | __main__:trials:24 - Trial = 15042/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.642 | DEBUG    | __main__:trials:29 - Trial = 15042/30000 | Total reward = 45.98
2022-01-26 14:17:38.645 | DEBUG    | __main__:trials:24 - Trial = 15043/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.647 | DEBUG    | __main__:trials:29 - Trial = 15043/30000 | Total reward = 47.74
2022-01-26 14:17:38.650 | DEBUG    | __main__:trials:24 - Trial = 15044/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.652 | DEBUG    | __main__:trials:29 - Trial = 15044/30000 | Total reward = 54.80
2022-01-26 14:17:38.655 | DEBUG    | __main__:trials:24 - Trial = 15045/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.657 | DEBUG    | __main__:trials:29 - Trial = 15045/30000 | Total reward = 40.04
2022-01-26 14:17:38.660 | DEBUG    | __main__:trials:24 - Trial = 15046/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.662 | DEBUG    | __main__:trials:29 - Trial = 15046/30000 | Total reward = 51.04
2022-01-26 14:17:38.665 | DEBUG    | __main__:trials:24 - Trial = 15047/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.667 | DEBUG    | __main__:trials:29 - Trial = 15047/30000 | Total reward = 42.24
2022-01-26 14:17:38.671 | DEBUG    | __main__:trials:24 - Trial = 15048/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.672 | DEBUG    | __main__:trials:29 - Trial = 15048/30000 | Total reward = 45.47
2022-01-26 14:17:38.676 | DEBUG    | __main__:trials:24 - Trial = 15049/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.677 | DEBUG    | __main__:trials:29 - Trial = 15049/30000 | Total reward = 41.07
2022-01-26 14:17:38.680 | DEBUG    | __main__:trials:24 - Trial = 15050/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.682 | DEBUG    | __main__:trials:29 - Trial = 15050/30000 | Total reward = 53.47
2022-01-26 14:17:38.686 | DEBUG    | __main__:trials:24 - Trial = 15051/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.686 | DEBUG    | __main__:trials:29 - Trial = 15051/30000 | Total reward = 47.43
2022-01-26 14:17:38.690 | DEBUG    | __main__:trials:24 - Trial = 15052/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.692 | DEBUG    | __main__:trials:29 - Trial = 15052/30000 | Total reward = 53.60
2022-01-26 14:17:38.695 | DEBUG    | __main__:trials:24 - Trial = 15053/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.696 | DEBUG    | __main__:trials:29 - Trial = 15053/30000 | Total reward = 49.39
2022-01-26 14:17:38.700 | DEBUG    | __main__:trials:24 - Trial = 15054/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.701 | DEBUG    | __main__:trials:29 - Trial = 15054/30000 | Total reward = 43.75
2022-01-26 14:17:38.704 | DEBUG    | __main__:trials:24 - Trial = 15055/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.706 | DEBUG    | __main__:trials:29 - Trial = 15055/30000 | Total reward = 39.28
2022-01-26 14:17:38.710 | DEBUG    | __main__:trials:24 - Trial = 15056/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.711 | DEBUG    | __main__:trials:29 - Trial = 15056/30000 | Total reward = 56.80
2022-01-26 14:17:38.714 | DEBUG    | __main__:trials:24 - Trial = 15057/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.715 | DEBUG    | __main__:trials:29 - Trial = 15057/30000 | Total reward = 39.09
2022-01-26 14:17:38.719 | DEBUG    | __main__:trials:24 - Trial = 15058/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.721 | DEBUG    | __main__:trials:29 - Trial = 15058/30000 | Total reward = 56.20
2022-01-26 14:17:38.724 | DEBUG    | __main__:trials:24 - Trial = 15059/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.726 | DEBUG    | __main__:trials:29 - Trial = 15059/30000 | Total reward = 47.63
2022-01-26 14:17:38.730 | DEBUG    | __main__:trials:24 - Trial = 15060/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.731 | DEBUG    | __main__:trials:29 - Trial = 15060/30000 | Total reward = 43.45
2022-01-26 14:17:38.735 | DEBUG    | __main__:trials:24 - Trial = 15061/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.737 | DEBUG    | __main__:trials:29 - Trial = 15061/30000 | Total reward = 48.42
2022-01-26 14:17:38.740 | DEBUG    | __main__:trials:24 - Trial = 15062/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.742 | DEBUG    | __main__:trials:29 - Trial = 15062/30000 | Total reward = 45.28
2022-01-26 14:17:38.746 | DEBUG    | __main__:trials:24 - Trial = 15063/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.747 | DEBUG    | __main__:trials:29 - Trial = 15063/30000 | Total reward = 47.05
2022-01-26 14:17:38.751 | DEBUG    | __main__:trials:24 - Trial = 15064/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.753 | DEBUG    | __main__:trials:29 - Trial = 15064/30000 | Total reward = 47.05
2022-01-26 14:17:38.756 | DEBUG    | __main__:trials:24 - Trial = 15065/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.757 | DEBUG    | __main__:trials:29 - Trial = 15065/30000 | Total reward = 57.84
2022-01-26 14:17:38.761 | DEBUG    | __main__:trials:24 - Trial = 15066/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.762 | DEBUG    | __main__:trials:29 - Trial = 15066/30000 | Total reward = 47.05
2022-01-26 14:17:38.767 | DEBUG    | __main__:trials:24 - Trial = 15067/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.768 | DEBUG    | __main__:trials:29 - Trial = 15067/30000 | Total reward = 43.03
2022-01-26 14:17:38.772 | DEBUG    | __main__:trials:24 - Trial = 15068/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.774 | DEBUG    | __main__:trials:29 - Trial = 15068/30000 | Total reward = 44.62
2022-01-26 14:17:38.777 | DEBUG    | __main__:trials:24 - Trial = 15069/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.779 | DEBUG    | __main__:trials:29 - Trial = 15069/30000 | Total reward = 46.37
2022-01-26 14:17:38.782 | DEBUG    | __main__:trials:24 - Trial = 15070/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.783 | DEBUG    | __main__:trials:29 - Trial = 15070/30000 | Total reward = 42.09
2022-01-26 14:17:38.787 | DEBUG    | __main__:trials:24 - Trial = 15071/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.789 | DEBUG    | __main__:trials:29 - Trial = 15071/30000 | Total reward = 18.71
2022-01-26 14:17:38.792 | DEBUG    | __main__:trials:24 - Trial = 15072/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.794 | DEBUG    | __main__:trials:29 - Trial = 15072/30000 | Total reward = 39.95
2022-01-26 14:17:38.797 | DEBUG    | __main__:trials:24 - Trial = 15073/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.798 | DEBUG    | __main__:trials:29 - Trial = 15073/30000 | Total reward = 41.84
2022-01-26 14:17:38.802 | DEBUG    | __main__:trials:24 - Trial = 15074/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.803 | DEBUG    | __main__:trials:29 - Trial = 15074/30000 | Total reward = 39.29
2022-01-26 14:17:38.806 | DEBUG    | __main__:trials:24 - Trial = 15075/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.808 | DEBUG    | __main__:trials:29 - Trial = 15075/30000 | Total reward = 46.05
2022-01-26 14:17:38.811 | DEBUG    | __main__:trials:24 - Trial = 15076/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.812 | DEBUG    | __main__:trials:29 - Trial = 15076/30000 | Total reward = 38.81
2022-01-26 14:17:38.815 | DEBUG    | __main__:trials:24 - Trial = 15077/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.817 | DEBUG    | __main__:trials:29 - Trial = 15077/30000 | Total reward = 38.39
2022-01-26 14:17:38.820 | DEBUG    | __main__:trials:24 - Trial = 15078/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.821 | DEBUG    | __main__:trials:29 - Trial = 15078/30000 | Total reward = 39.64
2022-01-26 14:17:38.826 | DEBUG    | __main__:trials:24 - Trial = 15079/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.827 | DEBUG    | __main__:trials:29 - Trial = 15079/30000 | Total reward = 47.19
2022-01-26 14:17:38.831 | DEBUG    | __main__:trials:24 - Trial = 15080/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.833 | DEBUG    | __main__:trials:29 - Trial = 15080/30000 | Total reward = 29.62
2022-01-26 14:17:38.835 | DEBUG    | __main__:trials:24 - Trial = 15081/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.837 | DEBUG    | __main__:trials:29 - Trial = 15081/30000 | Total reward = 39.52
2022-01-26 14:17:38.841 | DEBUG    | __main__:trials:24 - Trial = 15082/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.842 | DEBUG    | __main__:trials:29 - Trial = 15082/30000 | Total reward = 43.44
2022-01-26 14:17:38.846 | DEBUG    | __main__:trials:24 - Trial = 15083/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.847 | DEBUG    | __main__:trials:29 - Trial = 15083/30000 | Total reward = 42.89
2022-01-26 14:17:38.851 | DEBUG    | __main__:trials:24 - Trial = 15084/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.851 | DEBUG    | __main__:trials:29 - Trial = 15084/30000 | Total reward = 37.59
2022-01-26 14:17:38.855 | DEBUG    | __main__:trials:24 - Trial = 15085/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.856 | DEBUG    | __main__:trials:29 - Trial = 15085/30000 | Total reward = 41.11
2022-01-26 14:17:38.860 | DEBUG    | __main__:trials:24 - Trial = 15086/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.862 | DEBUG    | __main__:trials:29 - Trial = 15086/30000 | Total reward = 36.75
2022-01-26 14:17:38.865 | DEBUG    | __main__:trials:24 - Trial = 15087/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.866 | DEBUG    | __main__:trials:29 - Trial = 15087/30000 | Total reward = 37.75
2022-01-26 14:17:38.869 | DEBUG    | __main__:trials:24 - Trial = 15088/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.870 | DEBUG    | __main__:trials:29 - Trial = 15088/30000 | Total reward = 27.33
2022-01-26 14:17:38.874 | DEBUG    | __main__:trials:24 - Trial = 15089/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.876 | DEBUG    | __main__:trials:29 - Trial = 15089/30000 | Total reward = 46.44
2022-01-26 14:17:38.879 | DEBUG    | __main__:trials:24 - Trial = 15090/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.881 | DEBUG    | __main__:trials:29 - Trial = 15090/30000 | Total reward = 37.39
2022-01-26 14:17:38.884 | DEBUG    | __main__:trials:24 - Trial = 15091/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.886 | DEBUG    | __main__:trials:29 - Trial = 15091/30000 | Total reward = 46.12
2022-01-26 14:17:38.889 | DEBUG    | __main__:trials:24 - Trial = 15092/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.890 | DEBUG    | __main__:trials:29 - Trial = 15092/30000 | Total reward = 40.30
2022-01-26 14:17:38.894 | DEBUG    | __main__:trials:24 - Trial = 15093/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.895 | DEBUG    | __main__:trials:29 - Trial = 15093/30000 | Total reward = 37.65
2022-01-26 14:17:38.899 | DEBUG    | __main__:trials:24 - Trial = 15094/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.901 | DEBUG    | __main__:trials:29 - Trial = 15094/30000 | Total reward = 56.14
2022-01-26 14:17:38.904 | DEBUG    | __main__:trials:24 - Trial = 15095/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.906 | DEBUG    | __main__:trials:29 - Trial = 15095/30000 | Total reward = 44.97
2022-01-26 14:17:38.910 | DEBUG    | __main__:trials:24 - Trial = 15096/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.910 | DEBUG    | __main__:trials:29 - Trial = 15096/30000 | Total reward = 38.88
2022-01-26 14:17:38.914 | DEBUG    | __main__:trials:24 - Trial = 15097/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.916 | DEBUG    | __main__:trials:29 - Trial = 15097/30000 | Total reward = 37.31
2022-01-26 14:17:38.920 | DEBUG    | __main__:trials:24 - Trial = 15098/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.921 | DEBUG    | __main__:trials:29 - Trial = 15098/30000 | Total reward = 44.33
2022-01-26 14:17:38.924 | DEBUG    | __main__:trials:24 - Trial = 15099/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.926 | DEBUG    | __main__:trials:29 - Trial = 15099/30000 | Total reward = 41.93
2022-01-26 14:17:38.929 | DEBUG    | __main__:trials:24 - Trial = 15100/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.931 | DEBUG    | __main__:trials:29 - Trial = 15100/30000 | Total reward = 45.11
2022-01-26 14:17:38.935 | DEBUG    | __main__:trials:24 - Trial = 15101/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.935 | DEBUG    | __main__:trials:29 - Trial = 15101/30000 | Total reward = 58.75
2022-01-26 14:17:38.939 | DEBUG    | __main__:trials:24 - Trial = 15102/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.941 | DEBUG    | __main__:trials:29 - Trial = 15102/30000 | Total reward = 46.89
2022-01-26 14:17:38.943 | DEBUG    | __main__:trials:24 - Trial = 15103/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.945 | DEBUG    | __main__:trials:29 - Trial = 15103/30000 | Total reward = 40.59
2022-01-26 14:17:38.948 | DEBUG    | __main__:trials:24 - Trial = 15104/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.950 | DEBUG    | __main__:trials:29 - Trial = 15104/30000 | Total reward = 52.13
2022-01-26 14:17:38.953 | DEBUG    | __main__:trials:24 - Trial = 15105/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.954 | DEBUG    | __main__:trials:29 - Trial = 15105/30000 | Total reward = 46.59
2022-01-26 14:17:38.958 | DEBUG    | __main__:trials:24 - Trial = 15106/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.959 | DEBUG    | __main__:trials:29 - Trial = 15106/30000 | Total reward = 39.63
2022-01-26 14:17:38.963 | DEBUG    | __main__:trials:24 - Trial = 15107/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.964 | DEBUG    | __main__:trials:29 - Trial = 15107/30000 | Total reward = 40.80
2022-01-26 14:17:38.967 | DEBUG    | __main__:trials:24 - Trial = 15108/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.969 | DEBUG    | __main__:trials:29 - Trial = 15108/30000 | Total reward = 30.08
2022-01-26 14:17:38.973 | DEBUG    | __main__:trials:24 - Trial = 15109/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.975 | DEBUG    | __main__:trials:29 - Trial = 15109/30000 | Total reward = 45.34
2022-01-26 14:17:38.978 | DEBUG    | __main__:trials:24 - Trial = 15110/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.979 | DEBUG    | __main__:trials:29 - Trial = 15110/30000 | Total reward = 33.90
2022-01-26 14:17:38.983 | DEBUG    | __main__:trials:24 - Trial = 15111/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.985 | DEBUG    | __main__:trials:29 - Trial = 15111/30000 | Total reward = 38.07
2022-01-26 14:17:38.988 | DEBUG    | __main__:trials:24 - Trial = 15112/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.989 | DEBUG    | __main__:trials:29 - Trial = 15112/30000 | Total reward = 33.13
2022-01-26 14:17:38.993 | DEBUG    | __main__:trials:24 - Trial = 15113/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.994 | DEBUG    | __main__:trials:29 - Trial = 15113/30000 | Total reward = 41.52
2022-01-26 14:17:38.998 | DEBUG    | __main__:trials:24 - Trial = 15114/30000 | Max number of steps (20) reached
2022-01-26 14:17:38.999 | DEBUG    | __main__:trials:29 - Trial = 15114/30000 | Total reward = 38.51
2022-01-26 14:17:39.003 | DEBUG    | __main__:trials:24 - Trial = 15115/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.003 | DEBUG    | __main__:trials:29 - Trial = 15115/30000 | Total reward = 37.53
2022-01-26 14:17:39.008 | DEBUG    | __main__:trials:24 - Trial = 15116/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.009 | DEBUG    | __main__:trials:29 - Trial = 15116/30000 | Total reward = 45.52
2022-01-26 14:17:39.013 | DEBUG    | __main__:trials:24 - Trial = 15117/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.014 | DEBUG    | __main__:trials:29 - Trial = 15117/30000 | Total reward = 42.73
2022-01-26 14:17:39.017 | DEBUG    | __main__:trials:24 - Trial = 15118/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.019 | DEBUG    | __main__:trials:29 - Trial = 15118/30000 | Total reward = 40.99
2022-01-26 14:17:39.023 | DEBUG    | __main__:trials:24 - Trial = 15119/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.025 | DEBUG    | __main__:trials:29 - Trial = 15119/30000 | Total reward = 62.77
2022-01-26 14:17:39.028 | DEBUG    | __main__:trials:24 - Trial = 15120/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.030 | DEBUG    | __main__:trials:29 - Trial = 15120/30000 | Total reward = 33.41
2022-01-26 14:17:39.033 | DEBUG    | __main__:trials:24 - Trial = 15121/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.034 | DEBUG    | __main__:trials:29 - Trial = 15121/30000 | Total reward = 47.46
2022-01-26 14:17:39.038 | DEBUG    | __main__:trials:24 - Trial = 15122/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.039 | DEBUG    | __main__:trials:29 - Trial = 15122/30000 | Total reward = 53.98
2022-01-26 14:17:39.042 | DEBUG    | __main__:trials:24 - Trial = 15123/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.044 | DEBUG    | __main__:trials:29 - Trial = 15123/30000 | Total reward = 30.52
2022-01-26 14:17:39.048 | DEBUG    | __main__:trials:24 - Trial = 15124/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.048 | DEBUG    | __main__:trials:29 - Trial = 15124/30000 | Total reward = 51.09
2022-01-26 14:17:39.052 | DEBUG    | __main__:trials:24 - Trial = 15125/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.053 | DEBUG    | __main__:trials:29 - Trial = 15125/30000 | Total reward = 40.69
2022-01-26 14:17:39.057 | DEBUG    | __main__:trials:24 - Trial = 15126/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.058 | DEBUG    | __main__:trials:29 - Trial = 15126/30000 | Total reward = 37.60
2022-01-26 14:17:39.062 | DEBUG    | __main__:trials:24 - Trial = 15127/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.063 | DEBUG    | __main__:trials:29 - Trial = 15127/30000 | Total reward = 38.52
2022-01-26 14:17:39.066 | DEBUG    | __main__:trials:24 - Trial = 15128/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.068 | DEBUG    | __main__:trials:29 - Trial = 15128/30000 | Total reward = 38.87
2022-01-26 14:17:39.071 | DEBUG    | __main__:trials:24 - Trial = 15129/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.073 | DEBUG    | __main__:trials:29 - Trial = 15129/30000 | Total reward = 36.32
2022-01-26 14:17:39.076 | DEBUG    | __main__:trials:24 - Trial = 15130/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.077 | DEBUG    | __main__:trials:29 - Trial = 15130/30000 | Total reward = 35.13
2022-01-26 14:17:39.081 | DEBUG    | __main__:trials:24 - Trial = 15131/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.083 | DEBUG    | __main__:trials:29 - Trial = 15131/30000 | Total reward = 39.26
2022-01-26 14:17:39.086 | DEBUG    | __main__:trials:24 - Trial = 15132/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.088 | DEBUG    | __main__:trials:29 - Trial = 15132/30000 | Total reward = 45.55
2022-01-26 14:17:39.092 | DEBUG    | __main__:trials:24 - Trial = 15133/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.093 | DEBUG    | __main__:trials:29 - Trial = 15133/30000 | Total reward = 39.82
2022-01-26 14:17:39.096 | DEBUG    | __main__:trials:26 - Trial = 15134/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:39.098 | DEBUG    | __main__:trials:29 - Trial = 15134/30000 | Total reward = 30.72
2022-01-26 14:17:39.102 | DEBUG    | __main__:trials:24 - Trial = 15135/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.103 | DEBUG    | __main__:trials:29 - Trial = 15135/30000 | Total reward = 37.31
2022-01-26 14:17:39.106 | DEBUG    | __main__:trials:24 - Trial = 15136/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.108 | DEBUG    | __main__:trials:29 - Trial = 15136/30000 | Total reward = 39.33
2022-01-26 14:17:39.112 | DEBUG    | __main__:trials:24 - Trial = 15137/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.113 | DEBUG    | __main__:trials:29 - Trial = 15137/30000 | Total reward = 36.84
2022-01-26 14:17:39.116 | DEBUG    | __main__:trials:24 - Trial = 15138/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.118 | DEBUG    | __main__:trials:29 - Trial = 15138/30000 | Total reward = 36.93
2022-01-26 14:17:39.121 | DEBUG    | __main__:trials:24 - Trial = 15139/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.122 | DEBUG    | __main__:trials:29 - Trial = 15139/30000 | Total reward = 32.19
2022-01-26 14:17:39.126 | DEBUG    | __main__:trials:24 - Trial = 15140/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.127 | DEBUG    | __main__:trials:29 - Trial = 15140/30000 | Total reward = 36.25
2022-01-26 14:17:39.130 | DEBUG    | __main__:trials:24 - Trial = 15141/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.132 | DEBUG    | __main__:trials:29 - Trial = 15141/30000 | Total reward = 35.19
2022-01-26 14:17:39.136 | DEBUG    | __main__:trials:24 - Trial = 15142/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.137 | DEBUG    | __main__:trials:29 - Trial = 15142/30000 | Total reward = 45.97
2022-01-26 14:17:39.141 | DEBUG    | __main__:trials:24 - Trial = 15143/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.142 | DEBUG    | __main__:trials:29 - Trial = 15143/30000 | Total reward = 43.96
2022-01-26 14:17:39.146 | DEBUG    | __main__:trials:24 - Trial = 15144/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.147 | DEBUG    | __main__:trials:29 - Trial = 15144/30000 | Total reward = 49.24
2022-01-26 14:17:39.151 | DEBUG    | __main__:trials:24 - Trial = 15145/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.153 | DEBUG    | __main__:trials:29 - Trial = 15145/30000 | Total reward = 47.05
2022-01-26 14:17:39.156 | DEBUG    | __main__:trials:24 - Trial = 15146/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.157 | DEBUG    | __main__:trials:29 - Trial = 15146/30000 | Total reward = 45.10
2022-01-26 14:17:39.160 | DEBUG    | __main__:trials:24 - Trial = 15147/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.162 | DEBUG    | __main__:trials:29 - Trial = 15147/30000 | Total reward = 41.74
2022-01-26 14:17:39.166 | DEBUG    | __main__:trials:24 - Trial = 15148/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.167 | DEBUG    | __main__:trials:29 - Trial = 15148/30000 | Total reward = 48.74
2022-01-26 14:17:39.171 | DEBUG    | __main__:trials:24 - Trial = 15149/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.171 | DEBUG    | __main__:trials:29 - Trial = 15149/30000 | Total reward = 45.24
2022-01-26 14:17:39.176 | DEBUG    | __main__:trials:24 - Trial = 15150/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.177 | DEBUG    | __main__:trials:29 - Trial = 15150/30000 | Total reward = 45.86
2022-01-26 14:17:39.180 | DEBUG    | __main__:trials:24 - Trial = 15151/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.181 | DEBUG    | __main__:trials:29 - Trial = 15151/30000 | Total reward = 41.98
2022-01-26 14:17:39.185 | DEBUG    | __main__:trials:24 - Trial = 15152/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.185 | DEBUG    | __main__:trials:29 - Trial = 15152/30000 | Total reward = 46.94
2022-01-26 14:17:39.189 | DEBUG    | __main__:trials:24 - Trial = 15153/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.189 | DEBUG    | __main__:trials:29 - Trial = 15153/30000 | Total reward = 47.05
2022-01-26 14:17:39.193 | DEBUG    | __main__:trials:24 - Trial = 15154/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.194 | DEBUG    | __main__:trials:29 - Trial = 15154/30000 | Total reward = 46.93
2022-01-26 14:17:39.197 | DEBUG    | __main__:trials:24 - Trial = 15155/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.198 | DEBUG    | __main__:trials:29 - Trial = 15155/30000 | Total reward = 47.05
2022-01-26 14:17:39.201 | DEBUG    | __main__:trials:24 - Trial = 15156/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.202 | DEBUG    | __main__:trials:29 - Trial = 15156/30000 | Total reward = 49.00
2022-01-26 14:17:39.205 | DEBUG    | __main__:trials:24 - Trial = 15157/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.207 | DEBUG    | __main__:trials:29 - Trial = 15157/30000 | Total reward = 47.56
2022-01-26 14:17:39.210 | DEBUG    | __main__:trials:24 - Trial = 15158/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.211 | DEBUG    | __main__:trials:29 - Trial = 15158/30000 | Total reward = 46.01
2022-01-26 14:17:39.215 | DEBUG    | __main__:trials:24 - Trial = 15159/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.215 | DEBUG    | __main__:trials:29 - Trial = 15159/30000 | Total reward = 45.72
2022-01-26 14:17:39.219 | DEBUG    | __main__:trials:24 - Trial = 15160/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.219 | DEBUG    | __main__:trials:29 - Trial = 15160/30000 | Total reward = 44.47
2022-01-26 14:17:39.223 | DEBUG    | __main__:trials:24 - Trial = 15161/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.225 | DEBUG    | __main__:trials:29 - Trial = 15161/30000 | Total reward = 52.90
2022-01-26 14:17:39.228 | DEBUG    | __main__:trials:24 - Trial = 15162/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.230 | DEBUG    | __main__:trials:29 - Trial = 15162/30000 | Total reward = 52.93
2022-01-26 14:17:39.233 | DEBUG    | __main__:trials:24 - Trial = 15163/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.233 | DEBUG    | __main__:trials:29 - Trial = 15163/30000 | Total reward = 50.04
2022-01-26 14:17:39.236 | DEBUG    | __main__:trials:24 - Trial = 15164/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.238 | DEBUG    | __main__:trials:29 - Trial = 15164/30000 | Total reward = 38.27
2022-01-26 14:17:39.242 | DEBUG    | __main__:trials:24 - Trial = 15165/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.244 | DEBUG    | __main__:trials:29 - Trial = 15165/30000 | Total reward = 49.25
2022-01-26 14:17:39.247 | DEBUG    | __main__:trials:24 - Trial = 15166/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.249 | DEBUG    | __main__:trials:29 - Trial = 15166/30000 | Total reward = 48.21
2022-01-26 14:17:39.252 | DEBUG    | __main__:trials:24 - Trial = 15167/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.253 | DEBUG    | __main__:trials:29 - Trial = 15167/30000 | Total reward = 37.61
2022-01-26 14:17:39.257 | DEBUG    | __main__:trials:24 - Trial = 15168/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.259 | DEBUG    | __main__:trials:29 - Trial = 15168/30000 | Total reward = 39.84
2022-01-26 14:17:39.262 | DEBUG    | __main__:trials:24 - Trial = 15169/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.264 | DEBUG    | __main__:trials:29 - Trial = 15169/30000 | Total reward = 39.28
2022-01-26 14:17:39.267 | DEBUG    | __main__:trials:24 - Trial = 15170/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.268 | DEBUG    | __main__:trials:29 - Trial = 15170/30000 | Total reward = 40.82
2022-01-26 14:17:39.272 | DEBUG    | __main__:trials:24 - Trial = 15171/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.273 | DEBUG    | __main__:trials:29 - Trial = 15171/30000 | Total reward = 47.11
2022-01-26 14:17:39.276 | DEBUG    | __main__:trials:24 - Trial = 15172/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.277 | DEBUG    | __main__:trials:29 - Trial = 15172/30000 | Total reward = 41.36
2022-01-26 14:17:39.281 | DEBUG    | __main__:trials:24 - Trial = 15173/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.281 | DEBUG    | __main__:trials:29 - Trial = 15173/30000 | Total reward = 48.48
2022-01-26 14:17:39.285 | DEBUG    | __main__:trials:24 - Trial = 15174/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.286 | DEBUG    | __main__:trials:29 - Trial = 15174/30000 | Total reward = 47.22
2022-01-26 14:17:39.290 | DEBUG    | __main__:trials:24 - Trial = 15175/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.291 | DEBUG    | __main__:trials:29 - Trial = 15175/30000 | Total reward = 49.42
2022-01-26 14:17:39.294 | DEBUG    | __main__:trials:24 - Trial = 15176/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.295 | DEBUG    | __main__:trials:29 - Trial = 15176/30000 | Total reward = 52.73
2022-01-26 14:17:39.298 | DEBUG    | __main__:trials:24 - Trial = 15177/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.300 | DEBUG    | __main__:trials:29 - Trial = 15177/30000 | Total reward = 47.05
2022-01-26 14:17:39.303 | DEBUG    | __main__:trials:24 - Trial = 15178/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.305 | DEBUG    | __main__:trials:29 - Trial = 15178/30000 | Total reward = 44.68
2022-01-26 14:17:39.308 | DEBUG    | __main__:trials:24 - Trial = 15179/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.309 | DEBUG    | __main__:trials:29 - Trial = 15179/30000 | Total reward = 43.31
2022-01-26 14:17:39.313 | DEBUG    | __main__:trials:24 - Trial = 15180/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.314 | DEBUG    | __main__:trials:29 - Trial = 15180/30000 | Total reward = 53.93
2022-01-26 14:17:39.318 | DEBUG    | __main__:trials:24 - Trial = 15181/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.319 | DEBUG    | __main__:trials:29 - Trial = 15181/30000 | Total reward = 49.65
2022-01-26 14:17:39.323 | DEBUG    | __main__:trials:24 - Trial = 15182/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.324 | DEBUG    | __main__:trials:29 - Trial = 15182/30000 | Total reward = 45.93
2022-01-26 14:17:39.328 | DEBUG    | __main__:trials:24 - Trial = 15183/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.329 | DEBUG    | __main__:trials:29 - Trial = 15183/30000 | Total reward = 38.45
2022-01-26 14:17:39.332 | DEBUG    | __main__:trials:24 - Trial = 15184/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.334 | DEBUG    | __main__:trials:29 - Trial = 15184/30000 | Total reward = 32.78
2022-01-26 14:17:39.337 | DEBUG    | __main__:trials:24 - Trial = 15185/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.339 | DEBUG    | __main__:trials:29 - Trial = 15185/30000 | Total reward = 47.05
2022-01-26 14:17:39.343 | DEBUG    | __main__:trials:24 - Trial = 15186/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.343 | DEBUG    | __main__:trials:29 - Trial = 15186/30000 | Total reward = 50.70
2022-01-26 14:17:39.347 | DEBUG    | __main__:trials:24 - Trial = 15187/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.349 | DEBUG    | __main__:trials:29 - Trial = 15187/30000 | Total reward = 51.90
2022-01-26 14:17:39.352 | DEBUG    | __main__:trials:24 - Trial = 15188/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.353 | DEBUG    | __main__:trials:29 - Trial = 15188/30000 | Total reward = 39.26
2022-01-26 14:17:39.357 | DEBUG    | __main__:trials:24 - Trial = 15189/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.359 | DEBUG    | __main__:trials:29 - Trial = 15189/30000 | Total reward = 38.22
2022-01-26 14:17:39.362 | DEBUG    | __main__:trials:24 - Trial = 15190/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.364 | DEBUG    | __main__:trials:29 - Trial = 15190/30000 | Total reward = 48.14
2022-01-26 14:17:39.367 | DEBUG    | __main__:trials:24 - Trial = 15191/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.369 | DEBUG    | __main__:trials:29 - Trial = 15191/30000 | Total reward = 44.96
2022-01-26 14:17:39.372 | DEBUG    | __main__:trials:24 - Trial = 15192/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.374 | DEBUG    | __main__:trials:29 - Trial = 15192/30000 | Total reward = 38.30
2022-01-26 14:17:39.377 | DEBUG    | __main__:trials:24 - Trial = 15193/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.378 | DEBUG    | __main__:trials:29 - Trial = 15193/30000 | Total reward = 42.98
2022-01-26 14:17:39.382 | DEBUG    | __main__:trials:24 - Trial = 15194/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.384 | DEBUG    | __main__:trials:29 - Trial = 15194/30000 | Total reward = 33.20
2022-01-26 14:17:39.386 | DEBUG    | __main__:trials:24 - Trial = 15195/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.388 | DEBUG    | __main__:trials:29 - Trial = 15195/30000 | Total reward = 37.31
2022-01-26 14:17:39.392 | DEBUG    | __main__:trials:24 - Trial = 15196/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.392 | DEBUG    | __main__:trials:29 - Trial = 15196/30000 | Total reward = 53.23
2022-01-26 14:17:39.397 | DEBUG    | __main__:trials:24 - Trial = 15197/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.397 | DEBUG    | __main__:trials:29 - Trial = 15197/30000 | Total reward = 51.57
2022-01-26 14:17:39.401 | DEBUG    | __main__:trials:24 - Trial = 15198/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.402 | DEBUG    | __main__:trials:29 - Trial = 15198/30000 | Total reward = 54.16
2022-01-26 14:17:39.406 | DEBUG    | __main__:trials:24 - Trial = 15199/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.407 | DEBUG    | __main__:trials:29 - Trial = 15199/30000 | Total reward = 58.03
2022-01-26 14:17:39.411 | DEBUG    | __main__:trials:24 - Trial = 15200/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.412 | DEBUG    | __main__:trials:29 - Trial = 15200/30000 | Total reward = 42.04
2022-01-26 14:17:39.416 | DEBUG    | __main__:trials:24 - Trial = 15201/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.417 | DEBUG    | __main__:trials:29 - Trial = 15201/30000 | Total reward = 52.97
2022-01-26 14:17:39.421 | DEBUG    | __main__:trials:24 - Trial = 15202/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.422 | DEBUG    | __main__:trials:29 - Trial = 15202/30000 | Total reward = 47.09
2022-01-26 14:17:39.426 | DEBUG    | __main__:trials:24 - Trial = 15203/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.428 | DEBUG    | __main__:trials:29 - Trial = 15203/30000 | Total reward = 41.91
2022-01-26 14:17:39.432 | DEBUG    | __main__:trials:24 - Trial = 15204/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.433 | DEBUG    | __main__:trials:29 - Trial = 15204/30000 | Total reward = 47.93
2022-01-26 14:17:39.436 | DEBUG    | __main__:trials:24 - Trial = 15205/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.437 | DEBUG    | __main__:trials:29 - Trial = 15205/30000 | Total reward = 44.61
2022-01-26 14:17:39.440 | DEBUG    | __main__:trials:24 - Trial = 15206/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.442 | DEBUG    | __main__:trials:29 - Trial = 15206/30000 | Total reward = 40.05
2022-01-26 14:17:39.445 | DEBUG    | __main__:trials:24 - Trial = 15207/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.446 | DEBUG    | __main__:trials:29 - Trial = 15207/30000 | Total reward = 48.16
2022-01-26 14:17:39.450 | DEBUG    | __main__:trials:24 - Trial = 15208/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.452 | DEBUG    | __main__:trials:29 - Trial = 15208/30000 | Total reward = 41.62
2022-01-26 14:17:39.455 | DEBUG    | __main__:trials:24 - Trial = 15209/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.457 | DEBUG    | __main__:trials:29 - Trial = 15209/30000 | Total reward = 46.00
2022-01-26 14:17:39.459 | DEBUG    | __main__:trials:24 - Trial = 15210/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.461 | DEBUG    | __main__:trials:29 - Trial = 15210/30000 | Total reward = 42.28
2022-01-26 14:17:39.465 | DEBUG    | __main__:trials:24 - Trial = 15211/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.466 | DEBUG    | __main__:trials:29 - Trial = 15211/30000 | Total reward = 42.90
2022-01-26 14:17:39.470 | DEBUG    | __main__:trials:24 - Trial = 15212/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.471 | DEBUG    | __main__:trials:29 - Trial = 15212/30000 | Total reward = 38.48
2022-01-26 14:17:39.475 | DEBUG    | __main__:trials:24 - Trial = 15213/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.476 | DEBUG    | __main__:trials:29 - Trial = 15213/30000 | Total reward = 47.67
2022-01-26 14:17:39.480 | DEBUG    | __main__:trials:24 - Trial = 15214/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.480 | DEBUG    | __main__:trials:29 - Trial = 15214/30000 | Total reward = 44.83
2022-01-26 14:17:39.485 | DEBUG    | __main__:trials:24 - Trial = 15215/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.486 | DEBUG    | __main__:trials:29 - Trial = 15215/30000 | Total reward = 49.50
2022-01-26 14:17:39.489 | DEBUG    | __main__:trials:24 - Trial = 15216/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.490 | DEBUG    | __main__:trials:29 - Trial = 15216/30000 | Total reward = 50.02
2022-01-26 14:17:39.493 | DEBUG    | __main__:trials:24 - Trial = 15217/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.494 | DEBUG    | __main__:trials:29 - Trial = 15217/30000 | Total reward = 44.41
2022-01-26 14:17:39.498 | DEBUG    | __main__:trials:24 - Trial = 15218/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.499 | DEBUG    | __main__:trials:29 - Trial = 15218/30000 | Total reward = 43.16
2022-01-26 14:17:39.503 | DEBUG    | __main__:trials:24 - Trial = 15219/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.504 | DEBUG    | __main__:trials:29 - Trial = 15219/30000 | Total reward = 35.44
2022-01-26 14:17:39.508 | DEBUG    | __main__:trials:24 - Trial = 15220/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.510 | DEBUG    | __main__:trials:29 - Trial = 15220/30000 | Total reward = 45.43
2022-01-26 14:17:39.513 | DEBUG    | __main__:trials:24 - Trial = 15221/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.514 | DEBUG    | __main__:trials:29 - Trial = 15221/30000 | Total reward = 45.53
2022-01-26 14:17:39.518 | DEBUG    | __main__:trials:24 - Trial = 15222/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.519 | DEBUG    | __main__:trials:29 - Trial = 15222/30000 | Total reward = 43.95
2022-01-26 14:17:39.523 | DEBUG    | __main__:trials:24 - Trial = 15223/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.524 | DEBUG    | __main__:trials:29 - Trial = 15223/30000 | Total reward = 48.18
2022-01-26 14:17:39.528 | DEBUG    | __main__:trials:24 - Trial = 15224/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.530 | DEBUG    | __main__:trials:29 - Trial = 15224/30000 | Total reward = 47.26
2022-01-26 14:17:39.533 | DEBUG    | __main__:trials:24 - Trial = 15225/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.535 | DEBUG    | __main__:trials:29 - Trial = 15225/30000 | Total reward = 49.26
2022-01-26 14:17:39.539 | DEBUG    | __main__:trials:24 - Trial = 15226/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.539 | DEBUG    | __main__:trials:29 - Trial = 15226/30000 | Total reward = 44.77
2022-01-26 14:17:39.543 | DEBUG    | __main__:trials:24 - Trial = 15227/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.544 | DEBUG    | __main__:trials:29 - Trial = 15227/30000 | Total reward = 50.45
2022-01-26 14:17:39.547 | DEBUG    | __main__:trials:24 - Trial = 15228/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.549 | DEBUG    | __main__:trials:29 - Trial = 15228/30000 | Total reward = 46.61
2022-01-26 14:17:39.552 | DEBUG    | __main__:trials:24 - Trial = 15229/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.554 | DEBUG    | __main__:trials:29 - Trial = 15229/30000 | Total reward = 44.47
2022-01-26 14:17:39.557 | DEBUG    | __main__:trials:24 - Trial = 15230/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.558 | DEBUG    | __main__:trials:29 - Trial = 15230/30000 | Total reward = 50.39
2022-01-26 14:17:39.562 | DEBUG    | __main__:trials:24 - Trial = 15231/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.563 | DEBUG    | __main__:trials:29 - Trial = 15231/30000 | Total reward = 40.32
2022-01-26 14:17:39.567 | DEBUG    | __main__:trials:24 - Trial = 15232/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.568 | DEBUG    | __main__:trials:29 - Trial = 15232/30000 | Total reward = 50.92
2022-01-26 14:17:39.572 | DEBUG    | __main__:trials:24 - Trial = 15233/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.573 | DEBUG    | __main__:trials:29 - Trial = 15233/30000 | Total reward = 42.99
2022-01-26 14:17:39.577 | DEBUG    | __main__:trials:24 - Trial = 15234/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.578 | DEBUG    | __main__:trials:29 - Trial = 15234/30000 | Total reward = 45.03
2022-01-26 14:17:39.582 | DEBUG    | __main__:trials:24 - Trial = 15235/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.584 | DEBUG    | __main__:trials:29 - Trial = 15235/30000 | Total reward = 43.98
2022-01-26 14:17:39.587 | DEBUG    | __main__:trials:24 - Trial = 15236/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.589 | DEBUG    | __main__:trials:29 - Trial = 15236/30000 | Total reward = 48.06
2022-01-26 14:17:39.592 | DEBUG    | __main__:trials:24 - Trial = 15237/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.593 | DEBUG    | __main__:trials:29 - Trial = 15237/30000 | Total reward = 48.26
2022-01-26 14:17:39.596 | DEBUG    | __main__:trials:24 - Trial = 15238/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.598 | DEBUG    | __main__:trials:29 - Trial = 15238/30000 | Total reward = 36.59
2022-01-26 14:17:39.602 | DEBUG    | __main__:trials:24 - Trial = 15239/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.602 | DEBUG    | __main__:trials:29 - Trial = 15239/30000 | Total reward = 44.18
2022-01-26 14:17:39.606 | DEBUG    | __main__:trials:24 - Trial = 15240/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.606 | DEBUG    | __main__:trials:29 - Trial = 15240/30000 | Total reward = 45.92
2022-01-26 14:17:39.610 | DEBUG    | __main__:trials:24 - Trial = 15241/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.612 | DEBUG    | __main__:trials:29 - Trial = 15241/30000 | Total reward = 44.41
2022-01-26 14:17:39.615 | DEBUG    | __main__:trials:24 - Trial = 15242/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.616 | DEBUG    | __main__:trials:29 - Trial = 15242/30000 | Total reward = 59.26
2022-01-26 14:17:39.620 | DEBUG    | __main__:trials:24 - Trial = 15243/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.621 | DEBUG    | __main__:trials:29 - Trial = 15243/30000 | Total reward = 35.24
2022-01-26 14:17:39.625 | DEBUG    | __main__:trials:24 - Trial = 15244/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.626 | DEBUG    | __main__:trials:29 - Trial = 15244/30000 | Total reward = 37.85
2022-01-26 14:17:39.631 | DEBUG    | __main__:trials:24 - Trial = 15245/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.632 | DEBUG    | __main__:trials:29 - Trial = 15245/30000 | Total reward = 52.93
2022-01-26 14:17:39.636 | DEBUG    | __main__:trials:24 - Trial = 15246/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.638 | DEBUG    | __main__:trials:29 - Trial = 15246/30000 | Total reward = 39.77
2022-01-26 14:17:39.641 | DEBUG    | __main__:trials:24 - Trial = 15247/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.643 | DEBUG    | __main__:trials:29 - Trial = 15247/30000 | Total reward = 49.89
2022-01-26 14:17:39.647 | DEBUG    | __main__:trials:24 - Trial = 15248/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.648 | DEBUG    | __main__:trials:29 - Trial = 15248/30000 | Total reward = 47.50
2022-01-26 14:17:39.652 | DEBUG    | __main__:trials:24 - Trial = 15249/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.653 | DEBUG    | __main__:trials:29 - Trial = 15249/30000 | Total reward = 49.80
2022-01-26 14:17:39.657 | DEBUG    | __main__:trials:24 - Trial = 15250/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.658 | DEBUG    | __main__:trials:29 - Trial = 15250/30000 | Total reward = 45.07
2022-01-26 14:17:39.662 | DEBUG    | __main__:trials:24 - Trial = 15251/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.664 | DEBUG    | __main__:trials:29 - Trial = 15251/30000 | Total reward = 43.35
2022-01-26 14:17:39.668 | DEBUG    | __main__:trials:24 - Trial = 15252/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.668 | DEBUG    | __main__:trials:29 - Trial = 15252/30000 | Total reward = 49.00
2022-01-26 14:17:39.673 | DEBUG    | __main__:trials:24 - Trial = 15253/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.674 | DEBUG    | __main__:trials:29 - Trial = 15253/30000 | Total reward = 50.07
2022-01-26 14:17:39.678 | DEBUG    | __main__:trials:24 - Trial = 15254/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.679 | DEBUG    | __main__:trials:29 - Trial = 15254/30000 | Total reward = 39.12
2022-01-26 14:17:39.683 | DEBUG    | __main__:trials:24 - Trial = 15255/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.684 | DEBUG    | __main__:trials:29 - Trial = 15255/30000 | Total reward = 48.19
2022-01-26 14:17:39.688 | DEBUG    | __main__:trials:24 - Trial = 15256/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.690 | DEBUG    | __main__:trials:29 - Trial = 15256/30000 | Total reward = 49.18
2022-01-26 14:17:39.693 | DEBUG    | __main__:trials:24 - Trial = 15257/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.694 | DEBUG    | __main__:trials:29 - Trial = 15257/30000 | Total reward = 53.01
2022-01-26 14:17:39.699 | DEBUG    | __main__:trials:24 - Trial = 15258/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.699 | DEBUG    | __main__:trials:29 - Trial = 15258/30000 | Total reward = 53.60
2022-01-26 14:17:39.703 | DEBUG    | __main__:trials:24 - Trial = 15259/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.704 | DEBUG    | __main__:trials:29 - Trial = 15259/30000 | Total reward = 37.69
2022-01-26 14:17:39.708 | DEBUG    | __main__:trials:24 - Trial = 15260/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.709 | DEBUG    | __main__:trials:29 - Trial = 15260/30000 | Total reward = 40.51
2022-01-26 14:17:39.712 | DEBUG    | __main__:trials:24 - Trial = 15261/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.713 | DEBUG    | __main__:trials:29 - Trial = 15261/30000 | Total reward = 48.52
2022-01-26 14:17:39.716 | DEBUG    | __main__:trials:24 - Trial = 15262/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.717 | DEBUG    | __main__:trials:29 - Trial = 15262/30000 | Total reward = 45.45
2022-01-26 14:17:39.720 | DEBUG    | __main__:trials:24 - Trial = 15263/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.722 | DEBUG    | __main__:trials:29 - Trial = 15263/30000 | Total reward = 50.98
2022-01-26 14:17:39.726 | DEBUG    | __main__:trials:24 - Trial = 15264/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.726 | DEBUG    | __main__:trials:29 - Trial = 15264/30000 | Total reward = 49.17
2022-01-26 14:17:39.730 | DEBUG    | __main__:trials:24 - Trial = 15265/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.731 | DEBUG    | __main__:trials:29 - Trial = 15265/30000 | Total reward = 42.45
2022-01-26 14:17:39.735 | DEBUG    | __main__:trials:24 - Trial = 15266/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.736 | DEBUG    | __main__:trials:29 - Trial = 15266/30000 | Total reward = 45.01
2022-01-26 14:17:39.740 | DEBUG    | __main__:trials:24 - Trial = 15267/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.741 | DEBUG    | __main__:trials:29 - Trial = 15267/30000 | Total reward = 46.09
2022-01-26 14:17:39.745 | DEBUG    | __main__:trials:24 - Trial = 15268/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.746 | DEBUG    | __main__:trials:29 - Trial = 15268/30000 | Total reward = 45.52
2022-01-26 14:17:39.750 | DEBUG    | __main__:trials:24 - Trial = 15269/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.752 | DEBUG    | __main__:trials:29 - Trial = 15269/30000 | Total reward = 67.48
2022-01-26 14:17:39.755 | DEBUG    | __main__:trials:24 - Trial = 15270/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.757 | DEBUG    | __main__:trials:29 - Trial = 15270/30000 | Total reward = 47.99
2022-01-26 14:17:39.760 | DEBUG    | __main__:trials:24 - Trial = 15271/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.762 | DEBUG    | __main__:trials:29 - Trial = 15271/30000 | Total reward = 59.97
2022-01-26 14:17:39.765 | DEBUG    | __main__:trials:24 - Trial = 15272/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.766 | DEBUG    | __main__:trials:29 - Trial = 15272/30000 | Total reward = 48.07
2022-01-26 14:17:39.770 | DEBUG    | __main__:trials:24 - Trial = 15273/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.771 | DEBUG    | __main__:trials:29 - Trial = 15273/30000 | Total reward = 48.80
2022-01-26 14:17:39.775 | DEBUG    | __main__:trials:24 - Trial = 15274/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.776 | DEBUG    | __main__:trials:29 - Trial = 15274/30000 | Total reward = 57.86
2022-01-26 14:17:39.779 | DEBUG    | __main__:trials:24 - Trial = 15275/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.781 | DEBUG    | __main__:trials:29 - Trial = 15275/30000 | Total reward = 58.15
2022-01-26 14:17:39.784 | DEBUG    | __main__:trials:24 - Trial = 15276/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.785 | DEBUG    | __main__:trials:29 - Trial = 15276/30000 | Total reward = 51.81
2022-01-26 14:17:39.789 | DEBUG    | __main__:trials:24 - Trial = 15277/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.791 | DEBUG    | __main__:trials:29 - Trial = 15277/30000 | Total reward = 50.76
2022-01-26 14:17:39.794 | DEBUG    | __main__:trials:24 - Trial = 15278/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.795 | DEBUG    | __main__:trials:29 - Trial = 15278/30000 | Total reward = 47.16
2022-01-26 14:17:39.798 | DEBUG    | __main__:trials:24 - Trial = 15279/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.800 | DEBUG    | __main__:trials:29 - Trial = 15279/30000 | Total reward = 37.51
2022-01-26 14:17:39.803 | DEBUG    | __main__:trials:24 - Trial = 15280/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.805 | DEBUG    | __main__:trials:29 - Trial = 15280/30000 | Total reward = 51.85
2022-01-26 14:17:39.808 | DEBUG    | __main__:trials:24 - Trial = 15281/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.810 | DEBUG    | __main__:trials:29 - Trial = 15281/30000 | Total reward = 54.32
2022-01-26 14:17:39.814 | DEBUG    | __main__:trials:24 - Trial = 15282/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.814 | DEBUG    | __main__:trials:29 - Trial = 15282/30000 | Total reward = 37.74
2022-01-26 14:17:39.819 | DEBUG    | __main__:trials:24 - Trial = 15283/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.820 | DEBUG    | __main__:trials:29 - Trial = 15283/30000 | Total reward = 54.65
2022-01-26 14:17:39.824 | DEBUG    | __main__:trials:24 - Trial = 15284/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.824 | DEBUG    | __main__:trials:29 - Trial = 15284/30000 | Total reward = 57.08
2022-01-26 14:17:39.829 | DEBUG    | __main__:trials:24 - Trial = 15285/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.831 | DEBUG    | __main__:trials:29 - Trial = 15285/30000 | Total reward = 32.18
2022-01-26 14:17:39.834 | DEBUG    | __main__:trials:24 - Trial = 15286/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.836 | DEBUG    | __main__:trials:29 - Trial = 15286/30000 | Total reward = 47.05
2022-01-26 14:17:39.839 | DEBUG    | __main__:trials:24 - Trial = 15287/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.841 | DEBUG    | __main__:trials:29 - Trial = 15287/30000 | Total reward = 58.54
2022-01-26 14:17:39.845 | DEBUG    | __main__:trials:24 - Trial = 15288/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.846 | DEBUG    | __main__:trials:29 - Trial = 15288/30000 | Total reward = 58.13
2022-01-26 14:17:39.850 | DEBUG    | __main__:trials:24 - Trial = 15289/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.851 | DEBUG    | __main__:trials:29 - Trial = 15289/30000 | Total reward = 45.83
2022-01-26 14:17:39.855 | DEBUG    | __main__:trials:24 - Trial = 15290/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.856 | DEBUG    | __main__:trials:29 - Trial = 15290/30000 | Total reward = 39.81
2022-01-26 14:17:39.859 | DEBUG    | __main__:trials:24 - Trial = 15291/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.861 | DEBUG    | __main__:trials:29 - Trial = 15291/30000 | Total reward = 63.45
2022-01-26 14:17:39.864 | DEBUG    | __main__:trials:24 - Trial = 15292/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.865 | DEBUG    | __main__:trials:29 - Trial = 15292/30000 | Total reward = 48.83
2022-01-26 14:17:39.870 | DEBUG    | __main__:trials:24 - Trial = 15293/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.871 | DEBUG    | __main__:trials:29 - Trial = 15293/30000 | Total reward = 39.34
2022-01-26 14:17:39.875 | DEBUG    | __main__:trials:24 - Trial = 15294/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.876 | DEBUG    | __main__:trials:29 - Trial = 15294/30000 | Total reward = 43.13
2022-01-26 14:17:39.881 | DEBUG    | __main__:trials:24 - Trial = 15295/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.881 | DEBUG    | __main__:trials:29 - Trial = 15295/30000 | Total reward = 57.10
2022-01-26 14:17:39.885 | DEBUG    | __main__:trials:24 - Trial = 15296/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.886 | DEBUG    | __main__:trials:29 - Trial = 15296/30000 | Total reward = 43.11
2022-01-26 14:17:39.889 | DEBUG    | __main__:trials:24 - Trial = 15297/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.890 | DEBUG    | __main__:trials:29 - Trial = 15297/30000 | Total reward = 58.16
2022-01-26 14:17:39.893 | DEBUG    | __main__:trials:24 - Trial = 15298/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.894 | DEBUG    | __main__:trials:29 - Trial = 15298/30000 | Total reward = 42.17
2022-01-26 14:17:39.897 | DEBUG    | __main__:trials:24 - Trial = 15299/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.898 | DEBUG    | __main__:trials:29 - Trial = 15299/30000 | Total reward = 45.95
2022-01-26 14:17:39.902 | DEBUG    | __main__:trials:24 - Trial = 15300/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.902 | DEBUG    | __main__:trials:29 - Trial = 15300/30000 | Total reward = 45.74
2022-01-26 14:17:39.906 | DEBUG    | __main__:trials:24 - Trial = 15301/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.907 | DEBUG    | __main__:trials:29 - Trial = 15301/30000 | Total reward = 44.92
2022-01-26 14:17:39.910 | DEBUG    | __main__:trials:24 - Trial = 15302/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.912 | DEBUG    | __main__:trials:29 - Trial = 15302/30000 | Total reward = 49.49
2022-01-26 14:17:39.915 | DEBUG    | __main__:trials:24 - Trial = 15303/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.917 | DEBUG    | __main__:trials:29 - Trial = 15303/30000 | Total reward = 60.60
2022-01-26 14:17:39.920 | DEBUG    | __main__:trials:24 - Trial = 15304/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.921 | DEBUG    | __main__:trials:29 - Trial = 15304/30000 | Total reward = 47.22
2022-01-26 14:17:39.925 | DEBUG    | __main__:trials:24 - Trial = 15305/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.926 | DEBUG    | __main__:trials:29 - Trial = 15305/30000 | Total reward = 52.83
2022-01-26 14:17:39.929 | DEBUG    | __main__:trials:24 - Trial = 15306/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.930 | DEBUG    | __main__:trials:29 - Trial = 15306/30000 | Total reward = 53.36
2022-01-26 14:17:39.934 | DEBUG    | __main__:trials:24 - Trial = 15307/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.935 | DEBUG    | __main__:trials:29 - Trial = 15307/30000 | Total reward = 48.68
2022-01-26 14:17:39.938 | DEBUG    | __main__:trials:24 - Trial = 15308/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.939 | DEBUG    | __main__:trials:29 - Trial = 15308/30000 | Total reward = 46.97
2022-01-26 14:17:39.942 | DEBUG    | __main__:trials:24 - Trial = 15309/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.943 | DEBUG    | __main__:trials:29 - Trial = 15309/30000 | Total reward = 53.63
2022-01-26 14:17:39.947 | DEBUG    | __main__:trials:24 - Trial = 15310/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.947 | DEBUG    | __main__:trials:29 - Trial = 15310/30000 | Total reward = 57.70
2022-01-26 14:17:39.951 | DEBUG    | __main__:trials:24 - Trial = 15311/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.951 | DEBUG    | __main__:trials:29 - Trial = 15311/30000 | Total reward = 56.55
2022-01-26 14:17:39.956 | DEBUG    | __main__:trials:24 - Trial = 15312/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.956 | DEBUG    | __main__:trials:29 - Trial = 15312/30000 | Total reward = 44.18
2022-01-26 14:17:39.959 | DEBUG    | __main__:trials:24 - Trial = 15313/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.960 | DEBUG    | __main__:trials:29 - Trial = 15313/30000 | Total reward = 46.78
2022-01-26 14:17:39.963 | DEBUG    | __main__:trials:24 - Trial = 15314/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.964 | DEBUG    | __main__:trials:29 - Trial = 15314/30000 | Total reward = 55.91
2022-01-26 14:17:39.967 | DEBUG    | __main__:trials:24 - Trial = 15315/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.968 | DEBUG    | __main__:trials:29 - Trial = 15315/30000 | Total reward = 42.31
2022-01-26 14:17:39.971 | DEBUG    | __main__:trials:24 - Trial = 15316/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.973 | DEBUG    | __main__:trials:29 - Trial = 15316/30000 | Total reward = 43.88
2022-01-26 14:17:39.976 | DEBUG    | __main__:trials:24 - Trial = 15317/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.976 | DEBUG    | __main__:trials:29 - Trial = 15317/30000 | Total reward = 57.12
2022-01-26 14:17:39.979 | DEBUG    | __main__:trials:24 - Trial = 15318/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.980 | DEBUG    | __main__:trials:29 - Trial = 15318/30000 | Total reward = 35.25
2022-01-26 14:17:39.983 | DEBUG    | __main__:trials:24 - Trial = 15319/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.984 | DEBUG    | __main__:trials:29 - Trial = 15319/30000 | Total reward = 42.58
2022-01-26 14:17:39.987 | DEBUG    | __main__:trials:24 - Trial = 15320/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.988 | DEBUG    | __main__:trials:29 - Trial = 15320/30000 | Total reward = 51.03
2022-01-26 14:17:39.991 | DEBUG    | __main__:trials:24 - Trial = 15321/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.992 | DEBUG    | __main__:trials:29 - Trial = 15321/30000 | Total reward = 40.81
2022-01-26 14:17:39.995 | DEBUG    | __main__:trials:24 - Trial = 15322/30000 | Max number of steps (20) reached
2022-01-26 14:17:39.996 | DEBUG    | __main__:trials:29 - Trial = 15322/30000 | Total reward = 39.75
2022-01-26 14:17:39.999 | DEBUG    | __main__:trials:24 - Trial = 15323/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.001 | DEBUG    | __main__:trials:29 - Trial = 15323/30000 | Total reward = 49.46
2022-01-26 14:17:40.004 | DEBUG    | __main__:trials:26 - Trial = 15324/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.004 | DEBUG    | __main__:trials:29 - Trial = 15324/30000 | Total reward = 31.19
2022-01-26 14:17:40.008 | DEBUG    | __main__:trials:24 - Trial = 15325/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.008 | DEBUG    | __main__:trials:29 - Trial = 15325/30000 | Total reward = 45.86
2022-01-26 14:17:40.013 | DEBUG    | __main__:trials:24 - Trial = 15326/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.013 | DEBUG    | __main__:trials:29 - Trial = 15326/30000 | Total reward = 46.61
2022-01-26 14:17:40.017 | DEBUG    | __main__:trials:24 - Trial = 15327/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.018 | DEBUG    | __main__:trials:29 - Trial = 15327/30000 | Total reward = 42.87
2022-01-26 14:17:40.021 | DEBUG    | __main__:trials:24 - Trial = 15328/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.022 | DEBUG    | __main__:trials:29 - Trial = 15328/30000 | Total reward = 44.56
2022-01-26 14:17:40.025 | DEBUG    | __main__:trials:24 - Trial = 15329/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.026 | DEBUG    | __main__:trials:29 - Trial = 15329/30000 | Total reward = 46.20
2022-01-26 14:17:40.030 | DEBUG    | __main__:trials:24 - Trial = 15330/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.032 | DEBUG    | __main__:trials:29 - Trial = 15330/30000 | Total reward = 48.29
2022-01-26 14:17:40.035 | DEBUG    | __main__:trials:26 - Trial = 15331/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.036 | DEBUG    | __main__:trials:29 - Trial = 15331/30000 | Total reward = 32.03
2022-01-26 14:17:40.040 | DEBUG    | __main__:trials:24 - Trial = 15332/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.041 | DEBUG    | __main__:trials:29 - Trial = 15332/30000 | Total reward = 43.07
2022-01-26 14:17:40.044 | DEBUG    | __main__:trials:24 - Trial = 15333/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.046 | DEBUG    | __main__:trials:29 - Trial = 15333/30000 | Total reward = 47.79
2022-01-26 14:17:40.049 | DEBUG    | __main__:trials:24 - Trial = 15334/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.050 | DEBUG    | __main__:trials:29 - Trial = 15334/30000 | Total reward = 43.72
2022-01-26 14:17:40.055 | DEBUG    | __main__:trials:24 - Trial = 15335/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.055 | DEBUG    | __main__:trials:29 - Trial = 15335/30000 | Total reward = 37.30
2022-01-26 14:17:40.059 | DEBUG    | __main__:trials:24 - Trial = 15336/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.061 | DEBUG    | __main__:trials:29 - Trial = 15336/30000 | Total reward = 48.99
2022-01-26 14:17:40.064 | DEBUG    | __main__:trials:24 - Trial = 15337/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.065 | DEBUG    | __main__:trials:29 - Trial = 15337/30000 | Total reward = 36.18
2022-01-26 14:17:40.068 | DEBUG    | __main__:trials:26 - Trial = 15338/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.069 | DEBUG    | __main__:trials:29 - Trial = 15338/30000 | Total reward = 31.54
2022-01-26 14:17:40.073 | DEBUG    | __main__:trials:24 - Trial = 15339/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.075 | DEBUG    | __main__:trials:29 - Trial = 15339/30000 | Total reward = 57.31
2022-01-26 14:17:40.078 | DEBUG    | __main__:trials:24 - Trial = 15340/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.080 | DEBUG    | __main__:trials:29 - Trial = 15340/30000 | Total reward = 42.37
2022-01-26 14:17:40.083 | DEBUG    | __main__:trials:24 - Trial = 15341/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.085 | DEBUG    | __main__:trials:29 - Trial = 15341/30000 | Total reward = 46.35
2022-01-26 14:17:40.088 | DEBUG    | __main__:trials:24 - Trial = 15342/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.089 | DEBUG    | __main__:trials:29 - Trial = 15342/30000 | Total reward = 49.92
2022-01-26 14:17:40.093 | DEBUG    | __main__:trials:24 - Trial = 15343/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.095 | DEBUG    | __main__:trials:29 - Trial = 15343/30000 | Total reward = 45.89
2022-01-26 14:17:40.098 | DEBUG    | __main__:trials:24 - Trial = 15344/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.100 | DEBUG    | __main__:trials:29 - Trial = 15344/30000 | Total reward = 50.38
2022-01-26 14:17:40.103 | DEBUG    | __main__:trials:24 - Trial = 15345/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.104 | DEBUG    | __main__:trials:29 - Trial = 15345/30000 | Total reward = 52.86
2022-01-26 14:17:40.109 | DEBUG    | __main__:trials:24 - Trial = 15346/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.110 | DEBUG    | __main__:trials:29 - Trial = 15346/30000 | Total reward = 45.83
2022-01-26 14:17:40.114 | DEBUG    | __main__:trials:24 - Trial = 15347/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.114 | DEBUG    | __main__:trials:29 - Trial = 15347/30000 | Total reward = 36.86
2022-01-26 14:17:40.119 | DEBUG    | __main__:trials:24 - Trial = 15348/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.120 | DEBUG    | __main__:trials:29 - Trial = 15348/30000 | Total reward = 38.86
2022-01-26 14:17:40.124 | DEBUG    | __main__:trials:24 - Trial = 15349/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.124 | DEBUG    | __main__:trials:29 - Trial = 15349/30000 | Total reward = 45.21
2022-01-26 14:17:40.128 | DEBUG    | __main__:trials:24 - Trial = 15350/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.130 | DEBUG    | __main__:trials:29 - Trial = 15350/30000 | Total reward = 46.13
2022-01-26 14:17:40.134 | DEBUG    | __main__:trials:24 - Trial = 15351/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.134 | DEBUG    | __main__:trials:29 - Trial = 15351/30000 | Total reward = 51.82
2022-01-26 14:17:40.138 | DEBUG    | __main__:trials:24 - Trial = 15352/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.139 | DEBUG    | __main__:trials:29 - Trial = 15352/30000 | Total reward = 39.54
2022-01-26 14:17:40.144 | DEBUG    | __main__:trials:24 - Trial = 15353/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.144 | DEBUG    | __main__:trials:29 - Trial = 15353/30000 | Total reward = 48.12
2022-01-26 14:17:40.149 | DEBUG    | __main__:trials:24 - Trial = 15354/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.149 | DEBUG    | __main__:trials:29 - Trial = 15354/30000 | Total reward = 38.09
2022-01-26 14:17:40.153 | DEBUG    | __main__:trials:24 - Trial = 15355/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.154 | DEBUG    | __main__:trials:29 - Trial = 15355/30000 | Total reward = 45.24
2022-01-26 14:17:40.157 | DEBUG    | __main__:trials:24 - Trial = 15356/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.160 | DEBUG    | __main__:trials:29 - Trial = 15356/30000 | Total reward = 45.55
2022-01-26 14:17:40.163 | DEBUG    | __main__:trials:24 - Trial = 15357/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.164 | DEBUG    | __main__:trials:29 - Trial = 15357/30000 | Total reward = 43.75
2022-01-26 14:17:40.168 | DEBUG    | __main__:trials:24 - Trial = 15358/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.169 | DEBUG    | __main__:trials:29 - Trial = 15358/30000 | Total reward = 46.29
2022-01-26 14:17:40.172 | DEBUG    | __main__:trials:24 - Trial = 15359/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.174 | DEBUG    | __main__:trials:29 - Trial = 15359/30000 | Total reward = 52.19
2022-01-26 14:17:40.177 | DEBUG    | __main__:trials:24 - Trial = 15360/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.178 | DEBUG    | __main__:trials:29 - Trial = 15360/30000 | Total reward = 38.95
2022-01-26 14:17:40.181 | DEBUG    | __main__:trials:24 - Trial = 15361/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.182 | DEBUG    | __main__:trials:29 - Trial = 15361/30000 | Total reward = 47.74
2022-01-26 14:17:40.185 | DEBUG    | __main__:trials:24 - Trial = 15362/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.187 | DEBUG    | __main__:trials:29 - Trial = 15362/30000 | Total reward = 55.37
2022-01-26 14:17:40.191 | DEBUG    | __main__:trials:24 - Trial = 15363/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.192 | DEBUG    | __main__:trials:29 - Trial = 15363/30000 | Total reward = 41.87
2022-01-26 14:17:40.196 | DEBUG    | __main__:trials:24 - Trial = 15364/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.197 | DEBUG    | __main__:trials:29 - Trial = 15364/30000 | Total reward = 61.52
2022-01-26 14:17:40.201 | DEBUG    | __main__:trials:24 - Trial = 15365/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.202 | DEBUG    | __main__:trials:29 - Trial = 15365/30000 | Total reward = 36.56
2022-01-26 14:17:40.206 | DEBUG    | __main__:trials:24 - Trial = 15366/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.208 | DEBUG    | __main__:trials:29 - Trial = 15366/30000 | Total reward = 40.79
2022-01-26 14:17:40.210 | DEBUG    | __main__:trials:26 - Trial = 15367/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.212 | DEBUG    | __main__:trials:29 - Trial = 15367/30000 | Total reward = 21.71
2022-01-26 14:17:40.215 | DEBUG    | __main__:trials:24 - Trial = 15368/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.217 | DEBUG    | __main__:trials:29 - Trial = 15368/30000 | Total reward = 52.23
2022-01-26 14:17:40.220 | DEBUG    | __main__:trials:24 - Trial = 15369/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.221 | DEBUG    | __main__:trials:29 - Trial = 15369/30000 | Total reward = 37.61
2022-01-26 14:17:40.226 | DEBUG    | __main__:trials:24 - Trial = 15370/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.227 | DEBUG    | __main__:trials:29 - Trial = 15370/30000 | Total reward = 43.04
2022-01-26 14:17:40.230 | DEBUG    | __main__:trials:24 - Trial = 15371/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.232 | DEBUG    | __main__:trials:29 - Trial = 15371/30000 | Total reward = 56.67
2022-01-26 14:17:40.234 | DEBUG    | __main__:trials:24 - Trial = 15372/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.236 | DEBUG    | __main__:trials:29 - Trial = 15372/30000 | Total reward = 42.96
2022-01-26 14:17:40.240 | DEBUG    | __main__:trials:24 - Trial = 15373/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.241 | DEBUG    | __main__:trials:29 - Trial = 15373/30000 | Total reward = 49.42
2022-01-26 14:17:40.244 | DEBUG    | __main__:trials:24 - Trial = 15374/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.245 | DEBUG    | __main__:trials:29 - Trial = 15374/30000 | Total reward = 41.56
2022-01-26 14:17:40.249 | DEBUG    | __main__:trials:24 - Trial = 15375/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.249 | DEBUG    | __main__:trials:29 - Trial = 15375/30000 | Total reward = 49.11
2022-01-26 14:17:40.253 | DEBUG    | __main__:trials:24 - Trial = 15376/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.253 | DEBUG    | __main__:trials:29 - Trial = 15376/30000 | Total reward = 58.79
2022-01-26 14:17:40.257 | DEBUG    | __main__:trials:24 - Trial = 15377/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.258 | DEBUG    | __main__:trials:29 - Trial = 15377/30000 | Total reward = 54.47
2022-01-26 14:17:40.262 | DEBUG    | __main__:trials:24 - Trial = 15378/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.263 | DEBUG    | __main__:trials:29 - Trial = 15378/30000 | Total reward = 33.81
2022-01-26 14:17:40.267 | DEBUG    | __main__:trials:24 - Trial = 15379/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.268 | DEBUG    | __main__:trials:29 - Trial = 15379/30000 | Total reward = 60.09
2022-01-26 14:17:40.272 | DEBUG    | __main__:trials:24 - Trial = 15380/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.273 | DEBUG    | __main__:trials:29 - Trial = 15380/30000 | Total reward = 47.42
2022-01-26 14:17:40.277 | DEBUG    | __main__:trials:24 - Trial = 15381/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.278 | DEBUG    | __main__:trials:29 - Trial = 15381/30000 | Total reward = 51.36
2022-01-26 14:17:40.282 | DEBUG    | __main__:trials:24 - Trial = 15382/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.282 | DEBUG    | __main__:trials:29 - Trial = 15382/30000 | Total reward = 32.83
2022-01-26 14:17:40.286 | DEBUG    | __main__:trials:24 - Trial = 15383/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.288 | DEBUG    | __main__:trials:29 - Trial = 15383/30000 | Total reward = 38.56
2022-01-26 14:17:40.292 | DEBUG    | __main__:trials:24 - Trial = 15384/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.293 | DEBUG    | __main__:trials:29 - Trial = 15384/30000 | Total reward = 34.34
2022-01-26 14:17:40.297 | DEBUG    | __main__:trials:24 - Trial = 15385/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.298 | DEBUG    | __main__:trials:29 - Trial = 15385/30000 | Total reward = 34.80
2022-01-26 14:17:40.302 | DEBUG    | __main__:trials:24 - Trial = 15386/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.303 | DEBUG    | __main__:trials:29 - Trial = 15386/30000 | Total reward = 44.84
2022-01-26 14:17:40.307 | DEBUG    | __main__:trials:24 - Trial = 15387/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.308 | DEBUG    | __main__:trials:29 - Trial = 15387/30000 | Total reward = 42.08
2022-01-26 14:17:40.312 | DEBUG    | __main__:trials:24 - Trial = 15388/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.314 | DEBUG    | __main__:trials:29 - Trial = 15388/30000 | Total reward = 41.35
2022-01-26 14:17:40.318 | DEBUG    | __main__:trials:24 - Trial = 15389/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.320 | DEBUG    | __main__:trials:29 - Trial = 15389/30000 | Total reward = 59.00
2022-01-26 14:17:40.323 | DEBUG    | __main__:trials:24 - Trial = 15390/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.324 | DEBUG    | __main__:trials:29 - Trial = 15390/30000 | Total reward = 44.84
2022-01-26 14:17:40.328 | DEBUG    | __main__:trials:24 - Trial = 15391/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.330 | DEBUG    | __main__:trials:29 - Trial = 15391/30000 | Total reward = 44.27
2022-01-26 14:17:40.333 | DEBUG    | __main__:trials:24 - Trial = 15392/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.335 | DEBUG    | __main__:trials:29 - Trial = 15392/30000 | Total reward = 44.03
2022-01-26 14:17:40.340 | DEBUG    | __main__:trials:24 - Trial = 15393/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.341 | DEBUG    | __main__:trials:29 - Trial = 15393/30000 | Total reward = 38.58
2022-01-26 14:17:40.345 | DEBUG    | __main__:trials:24 - Trial = 15394/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.346 | DEBUG    | __main__:trials:29 - Trial = 15394/30000 | Total reward = 42.00
2022-01-26 14:17:40.350 | DEBUG    | __main__:trials:24 - Trial = 15395/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.352 | DEBUG    | __main__:trials:29 - Trial = 15395/30000 | Total reward = 47.45
2022-01-26 14:17:40.355 | DEBUG    | __main__:trials:24 - Trial = 15396/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.357 | DEBUG    | __main__:trials:29 - Trial = 15396/30000 | Total reward = 36.81
2022-01-26 14:17:40.360 | DEBUG    | __main__:trials:24 - Trial = 15397/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.362 | DEBUG    | __main__:trials:29 - Trial = 15397/30000 | Total reward = 40.77
2022-01-26 14:17:40.365 | DEBUG    | __main__:trials:24 - Trial = 15398/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.368 | DEBUG    | __main__:trials:29 - Trial = 15398/30000 | Total reward = 40.14
2022-01-26 14:17:40.371 | DEBUG    | __main__:trials:24 - Trial = 15399/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.372 | DEBUG    | __main__:trials:29 - Trial = 15399/30000 | Total reward = 37.85
2022-01-26 14:17:40.375 | DEBUG    | __main__:trials:24 - Trial = 15400/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.377 | DEBUG    | __main__:trials:29 - Trial = 15400/30000 | Total reward = 61.19
2022-01-26 14:17:40.381 | DEBUG    | __main__:trials:24 - Trial = 15401/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.382 | DEBUG    | __main__:trials:29 - Trial = 15401/30000 | Total reward = 35.29
2022-01-26 14:17:40.386 | DEBUG    | __main__:trials:24 - Trial = 15402/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.387 | DEBUG    | __main__:trials:29 - Trial = 15402/30000 | Total reward = 41.57
2022-01-26 14:17:40.391 | DEBUG    | __main__:trials:24 - Trial = 15403/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.392 | DEBUG    | __main__:trials:29 - Trial = 15403/30000 | Total reward = 39.28
2022-01-26 14:17:40.396 | DEBUG    | __main__:trials:24 - Trial = 15404/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.397 | DEBUG    | __main__:trials:29 - Trial = 15404/30000 | Total reward = 45.73
2022-01-26 14:17:40.401 | DEBUG    | __main__:trials:24 - Trial = 15405/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.402 | DEBUG    | __main__:trials:29 - Trial = 15405/30000 | Total reward = 36.58
2022-01-26 14:17:40.406 | DEBUG    | __main__:trials:24 - Trial = 15406/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.406 | DEBUG    | __main__:trials:29 - Trial = 15406/30000 | Total reward = 41.18
2022-01-26 14:17:40.410 | DEBUG    | __main__:trials:24 - Trial = 15407/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.412 | DEBUG    | __main__:trials:29 - Trial = 15407/30000 | Total reward = 37.78
2022-01-26 14:17:40.416 | DEBUG    | __main__:trials:24 - Trial = 15408/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.417 | DEBUG    | __main__:trials:29 - Trial = 15408/30000 | Total reward = 35.59
2022-01-26 14:17:40.421 | DEBUG    | __main__:trials:24 - Trial = 15409/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.423 | DEBUG    | __main__:trials:29 - Trial = 15409/30000 | Total reward = 37.09
2022-01-26 14:17:40.426 | DEBUG    | __main__:trials:24 - Trial = 15410/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.427 | DEBUG    | __main__:trials:29 - Trial = 15410/30000 | Total reward = 64.60
2022-01-26 14:17:40.430 | DEBUG    | __main__:trials:24 - Trial = 15411/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.432 | DEBUG    | __main__:trials:29 - Trial = 15411/30000 | Total reward = 23.06
2022-01-26 14:17:40.435 | DEBUG    | __main__:trials:24 - Trial = 15412/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.437 | DEBUG    | __main__:trials:29 - Trial = 15412/30000 | Total reward = 52.98
2022-01-26 14:17:40.441 | DEBUG    | __main__:trials:24 - Trial = 15413/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.442 | DEBUG    | __main__:trials:29 - Trial = 15413/30000 | Total reward = 43.59
2022-01-26 14:17:40.446 | DEBUG    | __main__:trials:24 - Trial = 15414/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.448 | DEBUG    | __main__:trials:29 - Trial = 15414/30000 | Total reward = 47.63
2022-01-26 14:17:40.452 | DEBUG    | __main__:trials:24 - Trial = 15415/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.452 | DEBUG    | __main__:trials:29 - Trial = 15415/30000 | Total reward = 50.26
2022-01-26 14:17:40.456 | DEBUG    | __main__:trials:24 - Trial = 15416/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.458 | DEBUG    | __main__:trials:29 - Trial = 15416/30000 | Total reward = 48.38
2022-01-26 14:17:40.461 | DEBUG    | __main__:trials:24 - Trial = 15417/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.462 | DEBUG    | __main__:trials:29 - Trial = 15417/30000 | Total reward = 46.45
2022-01-26 14:17:40.466 | DEBUG    | __main__:trials:24 - Trial = 15418/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.467 | DEBUG    | __main__:trials:29 - Trial = 15418/30000 | Total reward = 34.20
2022-01-26 14:17:40.471 | DEBUG    | __main__:trials:24 - Trial = 15419/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.472 | DEBUG    | __main__:trials:29 - Trial = 15419/30000 | Total reward = 50.15
2022-01-26 14:17:40.476 | DEBUG    | __main__:trials:24 - Trial = 15420/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.478 | DEBUG    | __main__:trials:29 - Trial = 15420/30000 | Total reward = 40.77
2022-01-26 14:17:40.481 | DEBUG    | __main__:trials:24 - Trial = 15421/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.483 | DEBUG    | __main__:trials:29 - Trial = 15421/30000 | Total reward = 57.31
2022-01-26 14:17:40.486 | DEBUG    | __main__:trials:24 - Trial = 15422/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.488 | DEBUG    | __main__:trials:29 - Trial = 15422/30000 | Total reward = 27.54
2022-01-26 14:17:40.491 | DEBUG    | __main__:trials:24 - Trial = 15423/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.493 | DEBUG    | __main__:trials:29 - Trial = 15423/30000 | Total reward = 45.62
2022-01-26 14:17:40.497 | DEBUG    | __main__:trials:24 - Trial = 15424/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.497 | DEBUG    | __main__:trials:29 - Trial = 15424/30000 | Total reward = 41.71
2022-01-26 14:17:40.500 | DEBUG    | __main__:trials:24 - Trial = 15425/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.502 | DEBUG    | __main__:trials:29 - Trial = 15425/30000 | Total reward = 42.13
2022-01-26 14:17:40.506 | DEBUG    | __main__:trials:24 - Trial = 15426/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.507 | DEBUG    | __main__:trials:29 - Trial = 15426/30000 | Total reward = 41.44
2022-01-26 14:17:40.511 | DEBUG    | __main__:trials:24 - Trial = 15427/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.512 | DEBUG    | __main__:trials:29 - Trial = 15427/30000 | Total reward = 35.18
2022-01-26 14:17:40.516 | DEBUG    | __main__:trials:24 - Trial = 15428/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.517 | DEBUG    | __main__:trials:29 - Trial = 15428/30000 | Total reward = 45.82
2022-01-26 14:17:40.521 | DEBUG    | __main__:trials:24 - Trial = 15429/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.523 | DEBUG    | __main__:trials:29 - Trial = 15429/30000 | Total reward = 40.56
2022-01-26 14:17:40.526 | DEBUG    | __main__:trials:24 - Trial = 15430/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.528 | DEBUG    | __main__:trials:29 - Trial = 15430/30000 | Total reward = 37.99
2022-01-26 14:17:40.531 | DEBUG    | __main__:trials:24 - Trial = 15431/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.533 | DEBUG    | __main__:trials:29 - Trial = 15431/30000 | Total reward = 51.80
2022-01-26 14:17:40.536 | DEBUG    | __main__:trials:24 - Trial = 15432/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.538 | DEBUG    | __main__:trials:29 - Trial = 15432/30000 | Total reward = 44.79
2022-01-26 14:17:40.541 | DEBUG    | __main__:trials:24 - Trial = 15433/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.543 | DEBUG    | __main__:trials:29 - Trial = 15433/30000 | Total reward = 41.78
2022-01-26 14:17:40.547 | DEBUG    | __main__:trials:24 - Trial = 15434/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.549 | DEBUG    | __main__:trials:29 - Trial = 15434/30000 | Total reward = 38.70
2022-01-26 14:17:40.552 | DEBUG    | __main__:trials:26 - Trial = 15435/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.554 | DEBUG    | __main__:trials:29 - Trial = 15435/30000 | Total reward = 29.30
2022-01-26 14:17:40.558 | DEBUG    | __main__:trials:24 - Trial = 15436/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.559 | DEBUG    | __main__:trials:29 - Trial = 15436/30000 | Total reward = 42.75
2022-01-26 14:17:40.563 | DEBUG    | __main__:trials:24 - Trial = 15437/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.565 | DEBUG    | __main__:trials:29 - Trial = 15437/30000 | Total reward = 42.37
2022-01-26 14:17:40.569 | DEBUG    | __main__:trials:24 - Trial = 15438/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.570 | DEBUG    | __main__:trials:29 - Trial = 15438/30000 | Total reward = 37.47
2022-01-26 14:17:40.574 | DEBUG    | __main__:trials:24 - Trial = 15439/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.576 | DEBUG    | __main__:trials:29 - Trial = 15439/30000 | Total reward = 49.07
2022-01-26 14:17:40.580 | DEBUG    | __main__:trials:24 - Trial = 15440/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.581 | DEBUG    | __main__:trials:29 - Trial = 15440/30000 | Total reward = 38.62
2022-01-26 14:17:40.584 | DEBUG    | __main__:trials:24 - Trial = 15441/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.585 | DEBUG    | __main__:trials:29 - Trial = 15441/30000 | Total reward = 47.87
2022-01-26 14:17:40.589 | DEBUG    | __main__:trials:24 - Trial = 15442/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.590 | DEBUG    | __main__:trials:29 - Trial = 15442/30000 | Total reward = 41.59
2022-01-26 14:17:40.593 | DEBUG    | __main__:trials:24 - Trial = 15443/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.594 | DEBUG    | __main__:trials:29 - Trial = 15443/30000 | Total reward = 44.23
2022-01-26 14:17:40.597 | DEBUG    | __main__:trials:24 - Trial = 15444/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.598 | DEBUG    | __main__:trials:29 - Trial = 15444/30000 | Total reward = 42.40
2022-01-26 14:17:40.601 | DEBUG    | __main__:trials:24 - Trial = 15445/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.603 | DEBUG    | __main__:trials:29 - Trial = 15445/30000 | Total reward = 40.92
2022-01-26 14:17:40.606 | DEBUG    | __main__:trials:24 - Trial = 15446/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.608 | DEBUG    | __main__:trials:29 - Trial = 15446/30000 | Total reward = 51.63
2022-01-26 14:17:40.611 | DEBUG    | __main__:trials:24 - Trial = 15447/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.613 | DEBUG    | __main__:trials:29 - Trial = 15447/30000 | Total reward = 44.26
2022-01-26 14:17:40.616 | DEBUG    | __main__:trials:24 - Trial = 15448/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.618 | DEBUG    | __main__:trials:29 - Trial = 15448/30000 | Total reward = 47.61
2022-01-26 14:17:40.621 | DEBUG    | __main__:trials:24 - Trial = 15449/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.622 | DEBUG    | __main__:trials:29 - Trial = 15449/30000 | Total reward = 47.02
2022-01-26 14:17:40.626 | DEBUG    | __main__:trials:24 - Trial = 15450/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.627 | DEBUG    | __main__:trials:29 - Trial = 15450/30000 | Total reward = 47.05
2022-01-26 14:17:40.631 | DEBUG    | __main__:trials:24 - Trial = 15451/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.632 | DEBUG    | __main__:trials:29 - Trial = 15451/30000 | Total reward = 41.78
2022-01-26 14:17:40.636 | DEBUG    | __main__:trials:24 - Trial = 15452/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.638 | DEBUG    | __main__:trials:29 - Trial = 15452/30000 | Total reward = 44.43
2022-01-26 14:17:40.641 | DEBUG    | __main__:trials:24 - Trial = 15453/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.643 | DEBUG    | __main__:trials:29 - Trial = 15453/30000 | Total reward = 51.04
2022-01-26 14:17:40.646 | DEBUG    | __main__:trials:24 - Trial = 15454/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.648 | DEBUG    | __main__:trials:29 - Trial = 15454/30000 | Total reward = 40.82
2022-01-26 14:17:40.652 | DEBUG    | __main__:trials:24 - Trial = 15455/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.653 | DEBUG    | __main__:trials:29 - Trial = 15455/30000 | Total reward = 46.67
2022-01-26 14:17:40.657 | DEBUG    | __main__:trials:24 - Trial = 15456/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.657 | DEBUG    | __main__:trials:29 - Trial = 15456/30000 | Total reward = 39.54
2022-01-26 14:17:40.661 | DEBUG    | __main__:trials:24 - Trial = 15457/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.662 | DEBUG    | __main__:trials:29 - Trial = 15457/30000 | Total reward = 47.20
2022-01-26 14:17:40.665 | DEBUG    | __main__:trials:24 - Trial = 15458/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.667 | DEBUG    | __main__:trials:29 - Trial = 15458/30000 | Total reward = 43.06
2022-01-26 14:17:40.670 | DEBUG    | __main__:trials:24 - Trial = 15459/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.671 | DEBUG    | __main__:trials:29 - Trial = 15459/30000 | Total reward = 35.05
2022-01-26 14:17:40.675 | DEBUG    | __main__:trials:24 - Trial = 15460/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.677 | DEBUG    | __main__:trials:29 - Trial = 15460/30000 | Total reward = 51.71
2022-01-26 14:17:40.680 | DEBUG    | __main__:trials:24 - Trial = 15461/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.682 | DEBUG    | __main__:trials:29 - Trial = 15461/30000 | Total reward = 34.61
2022-01-26 14:17:40.685 | DEBUG    | __main__:trials:24 - Trial = 15462/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.687 | DEBUG    | __main__:trials:29 - Trial = 15462/30000 | Total reward = 46.92
2022-01-26 14:17:40.690 | DEBUG    | __main__:trials:24 - Trial = 15463/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.691 | DEBUG    | __main__:trials:29 - Trial = 15463/30000 | Total reward = 47.20
2022-01-26 14:17:40.695 | DEBUG    | __main__:trials:24 - Trial = 15464/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.697 | DEBUG    | __main__:trials:29 - Trial = 15464/30000 | Total reward = 40.18
2022-01-26 14:17:40.700 | DEBUG    | __main__:trials:24 - Trial = 15465/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.702 | DEBUG    | __main__:trials:29 - Trial = 15465/30000 | Total reward = 39.65
2022-01-26 14:17:40.706 | DEBUG    | __main__:trials:24 - Trial = 15466/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.707 | DEBUG    | __main__:trials:29 - Trial = 15466/30000 | Total reward = 39.92
2022-01-26 14:17:40.711 | DEBUG    | __main__:trials:24 - Trial = 15467/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.712 | DEBUG    | __main__:trials:29 - Trial = 15467/30000 | Total reward = 64.12
2022-01-26 14:17:40.715 | DEBUG    | __main__:trials:26 - Trial = 15468/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.717 | DEBUG    | __main__:trials:29 - Trial = 15468/30000 | Total reward = 24.52
2022-01-26 14:17:40.721 | DEBUG    | __main__:trials:24 - Trial = 15469/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.721 | DEBUG    | __main__:trials:29 - Trial = 15469/30000 | Total reward = 35.93
2022-01-26 14:17:40.724 | DEBUG    | __main__:trials:24 - Trial = 15470/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.726 | DEBUG    | __main__:trials:29 - Trial = 15470/30000 | Total reward = 47.26
2022-01-26 14:17:40.730 | DEBUG    | __main__:trials:24 - Trial = 15471/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.731 | DEBUG    | __main__:trials:29 - Trial = 15471/30000 | Total reward = 44.79
2022-01-26 14:17:40.735 | DEBUG    | __main__:trials:24 - Trial = 15472/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.737 | DEBUG    | __main__:trials:29 - Trial = 15472/30000 | Total reward = 44.33
2022-01-26 14:17:40.740 | DEBUG    | __main__:trials:24 - Trial = 15473/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.741 | DEBUG    | __main__:trials:29 - Trial = 15473/30000 | Total reward = 45.09
2022-01-26 14:17:40.745 | DEBUG    | __main__:trials:24 - Trial = 15474/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.747 | DEBUG    | __main__:trials:29 - Trial = 15474/30000 | Total reward = 60.89
2022-01-26 14:17:40.751 | DEBUG    | __main__:trials:24 - Trial = 15475/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.752 | DEBUG    | __main__:trials:29 - Trial = 15475/30000 | Total reward = 36.63
2022-01-26 14:17:40.756 | DEBUG    | __main__:trials:24 - Trial = 15476/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.756 | DEBUG    | __main__:trials:29 - Trial = 15476/30000 | Total reward = 47.05
2022-01-26 14:17:40.760 | DEBUG    | __main__:trials:24 - Trial = 15477/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.761 | DEBUG    | __main__:trials:29 - Trial = 15477/30000 | Total reward = 43.88
2022-01-26 14:17:40.766 | DEBUG    | __main__:trials:24 - Trial = 15478/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.766 | DEBUG    | __main__:trials:29 - Trial = 15478/30000 | Total reward = 30.69
2022-01-26 14:17:40.771 | DEBUG    | __main__:trials:24 - Trial = 15479/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.772 | DEBUG    | __main__:trials:29 - Trial = 15479/30000 | Total reward = 49.36
2022-01-26 14:17:40.775 | DEBUG    | __main__:trials:26 - Trial = 15480/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.777 | DEBUG    | __main__:trials:29 - Trial = 15480/30000 | Total reward = 27.63
2022-01-26 14:17:40.780 | DEBUG    | __main__:trials:24 - Trial = 15481/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.781 | DEBUG    | __main__:trials:29 - Trial = 15481/30000 | Total reward = 44.20
2022-01-26 14:17:40.786 | DEBUG    | __main__:trials:24 - Trial = 15482/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.787 | DEBUG    | __main__:trials:29 - Trial = 15482/30000 | Total reward = 39.64
2022-01-26 14:17:40.791 | DEBUG    | __main__:trials:24 - Trial = 15483/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.791 | DEBUG    | __main__:trials:29 - Trial = 15483/30000 | Total reward = 36.49
2022-01-26 14:17:40.795 | DEBUG    | __main__:trials:24 - Trial = 15484/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.797 | DEBUG    | __main__:trials:29 - Trial = 15484/30000 | Total reward = 39.28
2022-01-26 14:17:40.800 | DEBUG    | __main__:trials:26 - Trial = 15485/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.800 | DEBUG    | __main__:trials:29 - Trial = 15485/30000 | Total reward = 20.00
2022-01-26 14:17:40.804 | DEBUG    | __main__:trials:26 - Trial = 15486/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.805 | DEBUG    | __main__:trials:29 - Trial = 15486/30000 | Total reward = 30.93
2022-01-26 14:17:40.809 | DEBUG    | __main__:trials:24 - Trial = 15487/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.810 | DEBUG    | __main__:trials:29 - Trial = 15487/30000 | Total reward = 40.03
2022-01-26 14:17:40.814 | DEBUG    | __main__:trials:24 - Trial = 15488/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.815 | DEBUG    | __main__:trials:29 - Trial = 15488/30000 | Total reward = 43.96
2022-01-26 14:17:40.819 | DEBUG    | __main__:trials:24 - Trial = 15489/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.821 | DEBUG    | __main__:trials:29 - Trial = 15489/30000 | Total reward = 53.36
2022-01-26 14:17:40.824 | DEBUG    | __main__:trials:24 - Trial = 15490/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.826 | DEBUG    | __main__:trials:29 - Trial = 15490/30000 | Total reward = 33.44
2022-01-26 14:17:40.830 | DEBUG    | __main__:trials:24 - Trial = 15491/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.831 | DEBUG    | __main__:trials:29 - Trial = 15491/30000 | Total reward = 39.64
2022-01-26 14:17:40.835 | DEBUG    | __main__:trials:24 - Trial = 15492/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.836 | DEBUG    | __main__:trials:29 - Trial = 15492/30000 | Total reward = 41.12
2022-01-26 14:17:40.839 | DEBUG    | __main__:trials:24 - Trial = 15493/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.841 | DEBUG    | __main__:trials:29 - Trial = 15493/30000 | Total reward = 39.04
2022-01-26 14:17:40.845 | DEBUG    | __main__:trials:24 - Trial = 15494/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.845 | DEBUG    | __main__:trials:29 - Trial = 15494/30000 | Total reward = 42.09
2022-01-26 14:17:40.850 | DEBUG    | __main__:trials:24 - Trial = 15495/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.852 | DEBUG    | __main__:trials:29 - Trial = 15495/30000 | Total reward = 32.80
2022-01-26 14:17:40.855 | DEBUG    | __main__:trials:24 - Trial = 15496/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.857 | DEBUG    | __main__:trials:29 - Trial = 15496/30000 | Total reward = 24.32
2022-01-26 14:17:40.861 | DEBUG    | __main__:trials:24 - Trial = 15497/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.861 | DEBUG    | __main__:trials:29 - Trial = 15497/30000 | Total reward = 43.55
2022-01-26 14:17:40.865 | DEBUG    | __main__:trials:26 - Trial = 15498/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.867 | DEBUG    | __main__:trials:29 - Trial = 15498/30000 | Total reward = 19.87
2022-01-26 14:17:40.870 | DEBUG    | __main__:trials:24 - Trial = 15499/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.871 | DEBUG    | __main__:trials:29 - Trial = 15499/30000 | Total reward = 42.53
2022-01-26 14:17:40.875 | DEBUG    | __main__:trials:24 - Trial = 15500/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.876 | DEBUG    | __main__:trials:29 - Trial = 15500/30000 | Total reward = 55.42
2022-01-26 14:17:40.879 | DEBUG    | __main__:trials:24 - Trial = 15501/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.881 | DEBUG    | __main__:trials:29 - Trial = 15501/30000 | Total reward = 43.30
2022-01-26 14:17:40.884 | DEBUG    | __main__:trials:24 - Trial = 15502/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.886 | DEBUG    | __main__:trials:29 - Trial = 15502/30000 | Total reward = 64.21
2022-01-26 14:17:40.889 | DEBUG    | __main__:trials:24 - Trial = 15503/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.890 | DEBUG    | __main__:trials:29 - Trial = 15503/30000 | Total reward = 60.47
2022-01-26 14:17:40.893 | DEBUG    | __main__:trials:24 - Trial = 15504/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.893 | DEBUG    | __main__:trials:29 - Trial = 15504/30000 | Total reward = 38.73
2022-01-26 14:17:40.898 | DEBUG    | __main__:trials:24 - Trial = 15505/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.899 | DEBUG    | __main__:trials:29 - Trial = 15505/30000 | Total reward = 53.90
2022-01-26 14:17:40.902 | DEBUG    | __main__:trials:24 - Trial = 15506/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.904 | DEBUG    | __main__:trials:29 - Trial = 15506/30000 | Total reward = 45.35
2022-01-26 14:17:40.908 | DEBUG    | __main__:trials:24 - Trial = 15507/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.909 | DEBUG    | __main__:trials:29 - Trial = 15507/30000 | Total reward = 50.82
2022-01-26 14:17:40.912 | DEBUG    | __main__:trials:24 - Trial = 15508/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.913 | DEBUG    | __main__:trials:29 - Trial = 15508/30000 | Total reward = 45.09
2022-01-26 14:17:40.916 | DEBUG    | __main__:trials:26 - Trial = 15509/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.918 | DEBUG    | __main__:trials:29 - Trial = 15509/30000 | Total reward = 31.60
2022-01-26 14:17:40.922 | DEBUG    | __main__:trials:24 - Trial = 15510/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.923 | DEBUG    | __main__:trials:29 - Trial = 15510/30000 | Total reward = 34.11
2022-01-26 14:17:40.926 | DEBUG    | __main__:trials:24 - Trial = 15511/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.928 | DEBUG    | __main__:trials:29 - Trial = 15511/30000 | Total reward = 49.50
2022-01-26 14:17:40.931 | DEBUG    | __main__:trials:26 - Trial = 15512/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.933 | DEBUG    | __main__:trials:29 - Trial = 15512/30000 | Total reward = 33.25
2022-01-26 14:17:40.936 | DEBUG    | __main__:trials:24 - Trial = 15513/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.938 | DEBUG    | __main__:trials:29 - Trial = 15513/30000 | Total reward = 41.39
2022-01-26 14:17:40.941 | DEBUG    | __main__:trials:24 - Trial = 15514/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.943 | DEBUG    | __main__:trials:29 - Trial = 15514/30000 | Total reward = 37.02
2022-01-26 14:17:40.946 | DEBUG    | __main__:trials:26 - Trial = 15515/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:40.948 | DEBUG    | __main__:trials:29 - Trial = 15515/30000 | Total reward = 41.34
2022-01-26 14:17:40.951 | DEBUG    | __main__:trials:24 - Trial = 15516/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.953 | DEBUG    | __main__:trials:29 - Trial = 15516/30000 | Total reward = 39.05
2022-01-26 14:17:40.956 | DEBUG    | __main__:trials:24 - Trial = 15517/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.957 | DEBUG    | __main__:trials:29 - Trial = 15517/30000 | Total reward = 41.68
2022-01-26 14:17:40.961 | DEBUG    | __main__:trials:24 - Trial = 15518/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.963 | DEBUG    | __main__:trials:29 - Trial = 15518/30000 | Total reward = 41.39
2022-01-26 14:17:40.965 | DEBUG    | __main__:trials:24 - Trial = 15519/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.967 | DEBUG    | __main__:trials:29 - Trial = 15519/30000 | Total reward = 46.02
2022-01-26 14:17:40.971 | DEBUG    | __main__:trials:24 - Trial = 15520/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.972 | DEBUG    | __main__:trials:29 - Trial = 15520/30000 | Total reward = 45.00
2022-01-26 14:17:40.976 | DEBUG    | __main__:trials:24 - Trial = 15521/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.977 | DEBUG    | __main__:trials:29 - Trial = 15521/30000 | Total reward = 48.94
2022-01-26 14:17:40.981 | DEBUG    | __main__:trials:24 - Trial = 15522/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.982 | DEBUG    | __main__:trials:29 - Trial = 15522/30000 | Total reward = 59.96
2022-01-26 14:17:40.985 | DEBUG    | __main__:trials:24 - Trial = 15523/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.986 | DEBUG    | __main__:trials:29 - Trial = 15523/30000 | Total reward = 41.04
2022-01-26 14:17:40.989 | DEBUG    | __main__:trials:24 - Trial = 15524/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.991 | DEBUG    | __main__:trials:29 - Trial = 15524/30000 | Total reward = 35.81
2022-01-26 14:17:40.994 | DEBUG    | __main__:trials:24 - Trial = 15525/30000 | Max number of steps (20) reached
2022-01-26 14:17:40.995 | DEBUG    | __main__:trials:29 - Trial = 15525/30000 | Total reward = 44.63
2022-01-26 14:17:40.998 | DEBUG    | __main__:trials:24 - Trial = 15526/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.000 | DEBUG    | __main__:trials:29 - Trial = 15526/30000 | Total reward = 42.49
2022-01-26 14:17:41.003 | DEBUG    | __main__:trials:24 - Trial = 15527/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.005 | DEBUG    | __main__:trials:29 - Trial = 15527/30000 | Total reward = 35.53
2022-01-26 14:17:41.008 | DEBUG    | __main__:trials:24 - Trial = 15528/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.010 | DEBUG    | __main__:trials:29 - Trial = 15528/30000 | Total reward = 53.15
2022-01-26 14:17:41.014 | DEBUG    | __main__:trials:24 - Trial = 15529/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.014 | DEBUG    | __main__:trials:29 - Trial = 15529/30000 | Total reward = 34.68
2022-01-26 14:17:41.018 | DEBUG    | __main__:trials:26 - Trial = 15530/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:41.018 | DEBUG    | __main__:trials:29 - Trial = 15530/30000 | Total reward = 11.24
2022-01-26 14:17:41.022 | DEBUG    | __main__:trials:24 - Trial = 15531/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.024 | DEBUG    | __main__:trials:29 - Trial = 15531/30000 | Total reward = 36.83
2022-01-26 14:17:41.028 | DEBUG    | __main__:trials:24 - Trial = 15532/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.028 | DEBUG    | __main__:trials:29 - Trial = 15532/30000 | Total reward = 65.34
2022-01-26 14:17:41.033 | DEBUG    | __main__:trials:24 - Trial = 15533/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.033 | DEBUG    | __main__:trials:29 - Trial = 15533/30000 | Total reward = 48.41
2022-01-26 14:17:41.037 | DEBUG    | __main__:trials:24 - Trial = 15534/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.038 | DEBUG    | __main__:trials:29 - Trial = 15534/30000 | Total reward = 46.44
2022-01-26 14:17:41.041 | DEBUG    | __main__:trials:24 - Trial = 15535/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.042 | DEBUG    | __main__:trials:29 - Trial = 15535/30000 | Total reward = 43.74
2022-01-26 14:17:41.045 | DEBUG    | __main__:trials:24 - Trial = 15536/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.047 | DEBUG    | __main__:trials:29 - Trial = 15536/30000 | Total reward = 30.52
2022-01-26 14:17:41.050 | DEBUG    | __main__:trials:24 - Trial = 15537/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.050 | DEBUG    | __main__:trials:29 - Trial = 15537/30000 | Total reward = 53.48
2022-01-26 14:17:41.054 | DEBUG    | __main__:trials:24 - Trial = 15538/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.056 | DEBUG    | __main__:trials:29 - Trial = 15538/30000 | Total reward = 39.12
2022-01-26 14:17:41.059 | DEBUG    | __main__:trials:24 - Trial = 15539/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.061 | DEBUG    | __main__:trials:29 - Trial = 15539/30000 | Total reward = 38.90
2022-01-26 14:17:41.064 | DEBUG    | __main__:trials:24 - Trial = 15540/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.066 | DEBUG    | __main__:trials:29 - Trial = 15540/30000 | Total reward = 56.65
2022-01-26 14:17:41.070 | DEBUG    | __main__:trials:24 - Trial = 15541/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.070 | DEBUG    | __main__:trials:29 - Trial = 15541/30000 | Total reward = 45.99
2022-01-26 14:17:41.074 | DEBUG    | __main__:trials:24 - Trial = 15542/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.075 | DEBUG    | __main__:trials:29 - Trial = 15542/30000 | Total reward = 50.44
2022-01-26 14:17:41.080 | DEBUG    | __main__:trials:24 - Trial = 15543/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.080 | DEBUG    | __main__:trials:29 - Trial = 15543/30000 | Total reward = 39.99
2022-01-26 14:17:41.085 | DEBUG    | __main__:trials:24 - Trial = 15544/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.086 | DEBUG    | __main__:trials:29 - Trial = 15544/30000 | Total reward = 41.29
2022-01-26 14:17:41.090 | DEBUG    | __main__:trials:24 - Trial = 15545/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.091 | DEBUG    | __main__:trials:29 - Trial = 15545/30000 | Total reward = 53.74
2022-01-26 14:17:41.095 | DEBUG    | __main__:trials:24 - Trial = 15546/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.095 | DEBUG    | __main__:trials:29 - Trial = 15546/30000 | Total reward = 47.78
2022-01-26 14:17:41.100 | DEBUG    | __main__:trials:24 - Trial = 15547/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.101 | DEBUG    | __main__:trials:29 - Trial = 15547/30000 | Total reward = 53.81
2022-01-26 14:17:41.104 | DEBUG    | __main__:trials:24 - Trial = 15548/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.105 | DEBUG    | __main__:trials:29 - Trial = 15548/30000 | Total reward = 31.24
2022-01-26 14:17:41.109 | DEBUG    | __main__:trials:24 - Trial = 15549/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.110 | DEBUG    | __main__:trials:29 - Trial = 15549/30000 | Total reward = 56.62
2022-01-26 14:17:41.113 | DEBUG    | __main__:trials:24 - Trial = 15550/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.114 | DEBUG    | __main__:trials:29 - Trial = 15550/30000 | Total reward = 38.08
2022-01-26 14:17:41.119 | DEBUG    | __main__:trials:24 - Trial = 15551/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.120 | DEBUG    | __main__:trials:29 - Trial = 15551/30000 | Total reward = 62.50
2022-01-26 14:17:41.123 | DEBUG    | __main__:trials:24 - Trial = 15552/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.125 | DEBUG    | __main__:trials:29 - Trial = 15552/30000 | Total reward = 44.50
2022-01-26 14:17:41.128 | DEBUG    | __main__:trials:24 - Trial = 15553/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.130 | DEBUG    | __main__:trials:29 - Trial = 15553/30000 | Total reward = 42.00
2022-01-26 14:17:41.133 | DEBUG    | __main__:trials:24 - Trial = 15554/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.134 | DEBUG    | __main__:trials:29 - Trial = 15554/30000 | Total reward = 58.35
2022-01-26 14:17:41.138 | DEBUG    | __main__:trials:24 - Trial = 15555/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.139 | DEBUG    | __main__:trials:29 - Trial = 15555/30000 | Total reward = 50.47
2022-01-26 14:17:41.143 | DEBUG    | __main__:trials:24 - Trial = 15556/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.144 | DEBUG    | __main__:trials:29 - Trial = 15556/30000 | Total reward = 40.84
2022-01-26 14:17:41.147 | DEBUG    | __main__:trials:24 - Trial = 15557/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.149 | DEBUG    | __main__:trials:29 - Trial = 15557/30000 | Total reward = 62.91
2022-01-26 14:17:41.152 | DEBUG    | __main__:trials:24 - Trial = 15558/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.153 | DEBUG    | __main__:trials:29 - Trial = 15558/30000 | Total reward = 50.56
2022-01-26 14:17:41.156 | DEBUG    | __main__:trials:24 - Trial = 15559/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.157 | DEBUG    | __main__:trials:29 - Trial = 15559/30000 | Total reward = 41.79
2022-01-26 14:17:41.161 | DEBUG    | __main__:trials:24 - Trial = 15560/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.162 | DEBUG    | __main__:trials:29 - Trial = 15560/30000 | Total reward = 40.83
2022-01-26 14:17:41.165 | DEBUG    | __main__:trials:24 - Trial = 15561/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.166 | DEBUG    | __main__:trials:29 - Trial = 15561/30000 | Total reward = 38.20
2022-01-26 14:17:41.169 | DEBUG    | __main__:trials:24 - Trial = 15562/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.170 | DEBUG    | __main__:trials:29 - Trial = 15562/30000 | Total reward = 57.75
2022-01-26 14:17:41.173 | DEBUG    | __main__:trials:24 - Trial = 15563/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.174 | DEBUG    | __main__:trials:29 - Trial = 15563/30000 | Total reward = 44.78
2022-01-26 14:17:41.177 | DEBUG    | __main__:trials:24 - Trial = 15564/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.178 | DEBUG    | __main__:trials:29 - Trial = 15564/30000 | Total reward = 36.35
2022-01-26 14:17:41.182 | DEBUG    | __main__:trials:24 - Trial = 15565/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.183 | DEBUG    | __main__:trials:29 - Trial = 15565/30000 | Total reward = 51.38
2022-01-26 14:17:41.187 | DEBUG    | __main__:trials:24 - Trial = 15566/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.187 | DEBUG    | __main__:trials:29 - Trial = 15566/30000 | Total reward = 40.49
2022-01-26 14:17:41.191 | DEBUG    | __main__:trials:24 - Trial = 15567/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.192 | DEBUG    | __main__:trials:29 - Trial = 15567/30000 | Total reward = 36.95
2022-01-26 14:17:41.195 | DEBUG    | __main__:trials:24 - Trial = 15568/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.196 | DEBUG    | __main__:trials:29 - Trial = 15568/30000 | Total reward = 56.30
2022-01-26 14:17:41.199 | DEBUG    | __main__:trials:24 - Trial = 15569/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.201 | DEBUG    | __main__:trials:29 - Trial = 15569/30000 | Total reward = 61.23
2022-01-26 14:17:41.204 | DEBUG    | __main__:trials:24 - Trial = 15570/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.205 | DEBUG    | __main__:trials:29 - Trial = 15570/30000 | Total reward = 30.13
2022-01-26 14:17:41.209 | DEBUG    | __main__:trials:24 - Trial = 15571/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.210 | DEBUG    | __main__:trials:29 - Trial = 15571/30000 | Total reward = 46.54
2022-01-26 14:17:41.213 | DEBUG    | __main__:trials:24 - Trial = 15572/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.214 | DEBUG    | __main__:trials:29 - Trial = 15572/30000 | Total reward = 51.77
2022-01-26 14:17:41.217 | DEBUG    | __main__:trials:24 - Trial = 15573/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.219 | DEBUG    | __main__:trials:29 - Trial = 15573/30000 | Total reward = 61.41
2022-01-26 14:17:41.222 | DEBUG    | __main__:trials:24 - Trial = 15574/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.223 | DEBUG    | __main__:trials:29 - Trial = 15574/30000 | Total reward = 43.09
2022-01-26 14:17:41.226 | DEBUG    | __main__:trials:24 - Trial = 15575/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.228 | DEBUG    | __main__:trials:29 - Trial = 15575/30000 | Total reward = 52.83
2022-01-26 14:17:41.232 | DEBUG    | __main__:trials:24 - Trial = 15576/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.233 | DEBUG    | __main__:trials:29 - Trial = 15576/30000 | Total reward = 53.95
2022-01-26 14:17:41.237 | DEBUG    | __main__:trials:24 - Trial = 15577/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.238 | DEBUG    | __main__:trials:29 - Trial = 15577/30000 | Total reward = 52.56
2022-01-26 14:17:41.241 | DEBUG    | __main__:trials:24 - Trial = 15578/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.243 | DEBUG    | __main__:trials:29 - Trial = 15578/30000 | Total reward = 61.52
2022-01-26 14:17:41.247 | DEBUG    | __main__:trials:24 - Trial = 15579/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.248 | DEBUG    | __main__:trials:29 - Trial = 15579/30000 | Total reward = 28.97
2022-01-26 14:17:41.251 | DEBUG    | __main__:trials:24 - Trial = 15580/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.253 | DEBUG    | __main__:trials:29 - Trial = 15580/30000 | Total reward = 53.60
2022-01-26 14:17:41.256 | DEBUG    | __main__:trials:24 - Trial = 15581/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.258 | DEBUG    | __main__:trials:29 - Trial = 15581/30000 | Total reward = 53.83
2022-01-26 14:17:41.261 | DEBUG    | __main__:trials:24 - Trial = 15582/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.263 | DEBUG    | __main__:trials:29 - Trial = 15582/30000 | Total reward = 37.66
2022-01-26 14:17:41.266 | DEBUG    | __main__:trials:24 - Trial = 15583/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.268 | DEBUG    | __main__:trials:29 - Trial = 15583/30000 | Total reward = 57.80
2022-01-26 14:17:41.271 | DEBUG    | __main__:trials:24 - Trial = 15584/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.272 | DEBUG    | __main__:trials:29 - Trial = 15584/30000 | Total reward = 56.17
2022-01-26 14:17:41.277 | DEBUG    | __main__:trials:24 - Trial = 15585/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.278 | DEBUG    | __main__:trials:29 - Trial = 15585/30000 | Total reward = 39.23
2022-01-26 14:17:41.282 | DEBUG    | __main__:trials:24 - Trial = 15586/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.284 | DEBUG    | __main__:trials:29 - Trial = 15586/30000 | Total reward = 50.06
2022-01-26 14:17:41.288 | DEBUG    | __main__:trials:24 - Trial = 15587/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.289 | DEBUG    | __main__:trials:29 - Trial = 15587/30000 | Total reward = 57.08
2022-01-26 14:17:41.293 | DEBUG    | __main__:trials:24 - Trial = 15588/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.294 | DEBUG    | __main__:trials:29 - Trial = 15588/30000 | Total reward = 38.38
2022-01-26 14:17:41.298 | DEBUG    | __main__:trials:24 - Trial = 15589/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.298 | DEBUG    | __main__:trials:29 - Trial = 15589/30000 | Total reward = 50.11
2022-01-26 14:17:41.303 | DEBUG    | __main__:trials:24 - Trial = 15590/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.304 | DEBUG    | __main__:trials:29 - Trial = 15590/30000 | Total reward = 47.13
2022-01-26 14:17:41.308 | DEBUG    | __main__:trials:24 - Trial = 15591/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.308 | DEBUG    | __main__:trials:29 - Trial = 15591/30000 | Total reward = 43.49
2022-01-26 14:17:41.313 | DEBUG    | __main__:trials:24 - Trial = 15592/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.314 | DEBUG    | __main__:trials:29 - Trial = 15592/30000 | Total reward = 55.73
2022-01-26 14:17:41.318 | DEBUG    | __main__:trials:24 - Trial = 15593/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.318 | DEBUG    | __main__:trials:29 - Trial = 15593/30000 | Total reward = 41.25
2022-01-26 14:17:41.322 | DEBUG    | __main__:trials:24 - Trial = 15594/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.323 | DEBUG    | __main__:trials:29 - Trial = 15594/30000 | Total reward = 45.51
2022-01-26 14:17:41.327 | DEBUG    | __main__:trials:24 - Trial = 15595/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.329 | DEBUG    | __main__:trials:29 - Trial = 15595/30000 | Total reward = 44.93
2022-01-26 14:17:41.332 | DEBUG    | __main__:trials:24 - Trial = 15596/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.334 | DEBUG    | __main__:trials:29 - Trial = 15596/30000 | Total reward = 55.70
2022-01-26 14:17:41.337 | DEBUG    | __main__:trials:24 - Trial = 15597/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.338 | DEBUG    | __main__:trials:29 - Trial = 15597/30000 | Total reward = 56.35
2022-01-26 14:17:41.343 | DEBUG    | __main__:trials:24 - Trial = 15598/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.343 | DEBUG    | __main__:trials:29 - Trial = 15598/30000 | Total reward = 47.70
2022-01-26 14:17:41.348 | DEBUG    | __main__:trials:24 - Trial = 15599/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.348 | DEBUG    | __main__:trials:29 - Trial = 15599/30000 | Total reward = 52.31
2022-01-26 14:17:41.352 | DEBUG    | __main__:trials:24 - Trial = 15600/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.354 | DEBUG    | __main__:trials:29 - Trial = 15600/30000 | Total reward = 54.96
2022-01-26 14:17:41.357 | DEBUG    | __main__:trials:24 - Trial = 15601/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.358 | DEBUG    | __main__:trials:29 - Trial = 15601/30000 | Total reward = 50.94
2022-01-26 14:17:41.362 | DEBUG    | __main__:trials:24 - Trial = 15602/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.362 | DEBUG    | __main__:trials:29 - Trial = 15602/30000 | Total reward = 57.32
2022-01-26 14:17:41.367 | DEBUG    | __main__:trials:24 - Trial = 15603/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.369 | DEBUG    | __main__:trials:29 - Trial = 15603/30000 | Total reward = 62.30
2022-01-26 14:17:41.373 | DEBUG    | __main__:trials:24 - Trial = 15604/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.374 | DEBUG    | __main__:trials:29 - Trial = 15604/30000 | Total reward = 62.31
2022-01-26 14:17:41.377 | DEBUG    | __main__:trials:24 - Trial = 15605/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.378 | DEBUG    | __main__:trials:29 - Trial = 15605/30000 | Total reward = 49.36
2022-01-26 14:17:41.381 | DEBUG    | __main__:trials:24 - Trial = 15606/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.382 | DEBUG    | __main__:trials:29 - Trial = 15606/30000 | Total reward = 57.61
2022-01-26 14:17:41.386 | DEBUG    | __main__:trials:24 - Trial = 15607/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.388 | DEBUG    | __main__:trials:29 - Trial = 15607/30000 | Total reward = 56.44
2022-01-26 14:17:41.391 | DEBUG    | __main__:trials:24 - Trial = 15608/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.392 | DEBUG    | __main__:trials:29 - Trial = 15608/30000 | Total reward = 57.06
2022-01-26 14:17:41.396 | DEBUG    | __main__:trials:24 - Trial = 15609/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.397 | DEBUG    | __main__:trials:29 - Trial = 15609/30000 | Total reward = 64.04
2022-01-26 14:17:41.400 | DEBUG    | __main__:trials:24 - Trial = 15610/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.402 | DEBUG    | __main__:trials:29 - Trial = 15610/30000 | Total reward = 44.46
2022-01-26 14:17:41.405 | DEBUG    | __main__:trials:24 - Trial = 15611/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.406 | DEBUG    | __main__:trials:29 - Trial = 15611/30000 | Total reward = 63.96
2022-01-26 14:17:41.409 | DEBUG    | __main__:trials:24 - Trial = 15612/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.411 | DEBUG    | __main__:trials:29 - Trial = 15612/30000 | Total reward = 57.21
2022-01-26 14:17:41.413 | DEBUG    | __main__:trials:24 - Trial = 15613/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.415 | DEBUG    | __main__:trials:29 - Trial = 15613/30000 | Total reward = 55.02
2022-01-26 14:17:41.418 | DEBUG    | __main__:trials:24 - Trial = 15614/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.420 | DEBUG    | __main__:trials:29 - Trial = 15614/30000 | Total reward = 37.06
2022-01-26 14:17:41.424 | DEBUG    | __main__:trials:24 - Trial = 15615/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.425 | DEBUG    | __main__:trials:29 - Trial = 15615/30000 | Total reward = 40.19
2022-01-26 14:17:41.429 | DEBUG    | __main__:trials:24 - Trial = 15616/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.430 | DEBUG    | __main__:trials:29 - Trial = 15616/30000 | Total reward = 55.97
2022-01-26 14:17:41.434 | DEBUG    | __main__:trials:24 - Trial = 15617/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.435 | DEBUG    | __main__:trials:29 - Trial = 15617/30000 | Total reward = 57.22
2022-01-26 14:17:41.439 | DEBUG    | __main__:trials:24 - Trial = 15618/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.440 | DEBUG    | __main__:trials:29 - Trial = 15618/30000 | Total reward = 53.67
2022-01-26 14:17:41.444 | DEBUG    | __main__:trials:24 - Trial = 15619/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.446 | DEBUG    | __main__:trials:29 - Trial = 15619/30000 | Total reward = 56.04
2022-01-26 14:17:41.449 | DEBUG    | __main__:trials:24 - Trial = 15620/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.451 | DEBUG    | __main__:trials:29 - Trial = 15620/30000 | Total reward = 41.56
2022-01-26 14:17:41.454 | DEBUG    | __main__:trials:24 - Trial = 15621/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.456 | DEBUG    | __main__:trials:29 - Trial = 15621/30000 | Total reward = 41.99
2022-01-26 14:17:41.459 | DEBUG    | __main__:trials:24 - Trial = 15622/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.461 | DEBUG    | __main__:trials:29 - Trial = 15622/30000 | Total reward = 49.20
2022-01-26 14:17:41.463 | DEBUG    | __main__:trials:26 - Trial = 15623/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:41.464 | DEBUG    | __main__:trials:29 - Trial = 15623/30000 | Total reward = 17.05
2022-01-26 14:17:41.467 | DEBUG    | __main__:trials:24 - Trial = 15624/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.469 | DEBUG    | __main__:trials:29 - Trial = 15624/30000 | Total reward = 65.95
2022-01-26 14:17:41.472 | DEBUG    | __main__:trials:24 - Trial = 15625/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.473 | DEBUG    | __main__:trials:29 - Trial = 15625/30000 | Total reward = 57.69
2022-01-26 14:17:41.477 | DEBUG    | __main__:trials:24 - Trial = 15626/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.478 | DEBUG    | __main__:trials:29 - Trial = 15626/30000 | Total reward = 44.24
2022-01-26 14:17:41.481 | DEBUG    | __main__:trials:24 - Trial = 15627/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.482 | DEBUG    | __main__:trials:29 - Trial = 15627/30000 | Total reward = 44.28
2022-01-26 14:17:41.487 | DEBUG    | __main__:trials:24 - Trial = 15628/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.487 | DEBUG    | __main__:trials:29 - Trial = 15628/30000 | Total reward = 43.38
2022-01-26 14:17:41.491 | DEBUG    | __main__:trials:24 - Trial = 15629/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.493 | DEBUG    | __main__:trials:29 - Trial = 15629/30000 | Total reward = 48.98
2022-01-26 14:17:41.497 | DEBUG    | __main__:trials:24 - Trial = 15630/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.497 | DEBUG    | __main__:trials:29 - Trial = 15630/30000 | Total reward = 30.71
2022-01-26 14:17:41.501 | DEBUG    | __main__:trials:24 - Trial = 15631/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.502 | DEBUG    | __main__:trials:29 - Trial = 15631/30000 | Total reward = 44.24
2022-01-26 14:17:41.506 | DEBUG    | __main__:trials:24 - Trial = 15632/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.507 | DEBUG    | __main__:trials:29 - Trial = 15632/30000 | Total reward = 55.13
2022-01-26 14:17:41.510 | DEBUG    | __main__:trials:24 - Trial = 15633/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.512 | DEBUG    | __main__:trials:29 - Trial = 15633/30000 | Total reward = 35.41
2022-01-26 14:17:41.516 | DEBUG    | __main__:trials:24 - Trial = 15634/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.516 | DEBUG    | __main__:trials:29 - Trial = 15634/30000 | Total reward = 32.16
2022-01-26 14:17:41.520 | DEBUG    | __main__:trials:24 - Trial = 15635/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.522 | DEBUG    | __main__:trials:29 - Trial = 15635/30000 | Total reward = 56.74
2022-01-26 14:17:41.525 | DEBUG    | __main__:trials:24 - Trial = 15636/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.526 | DEBUG    | __main__:trials:29 - Trial = 15636/30000 | Total reward = 60.41
2022-01-26 14:17:41.530 | DEBUG    | __main__:trials:24 - Trial = 15637/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.531 | DEBUG    | __main__:trials:29 - Trial = 15637/30000 | Total reward = 36.47
2022-01-26 14:17:41.535 | DEBUG    | __main__:trials:24 - Trial = 15638/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.536 | DEBUG    | __main__:trials:29 - Trial = 15638/30000 | Total reward = 66.33
2022-01-26 14:17:41.539 | DEBUG    | __main__:trials:24 - Trial = 15639/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.541 | DEBUG    | __main__:trials:29 - Trial = 15639/30000 | Total reward = 52.83
2022-01-26 14:17:41.544 | DEBUG    | __main__:trials:24 - Trial = 15640/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.546 | DEBUG    | __main__:trials:29 - Trial = 15640/30000 | Total reward = 43.65
2022-01-26 14:17:41.549 | DEBUG    | __main__:trials:24 - Trial = 15641/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.550 | DEBUG    | __main__:trials:29 - Trial = 15641/30000 | Total reward = 38.28
2022-01-26 14:17:41.554 | DEBUG    | __main__:trials:24 - Trial = 15642/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.555 | DEBUG    | __main__:trials:29 - Trial = 15642/30000 | Total reward = 41.27
2022-01-26 14:17:41.559 | DEBUG    | __main__:trials:24 - Trial = 15643/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.561 | DEBUG    | __main__:trials:29 - Trial = 15643/30000 | Total reward = 57.79
2022-01-26 14:17:41.564 | DEBUG    | __main__:trials:24 - Trial = 15644/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.566 | DEBUG    | __main__:trials:29 - Trial = 15644/30000 | Total reward = 45.66
2022-01-26 14:17:41.569 | DEBUG    | __main__:trials:24 - Trial = 15645/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.570 | DEBUG    | __main__:trials:29 - Trial = 15645/30000 | Total reward = 44.94
2022-01-26 14:17:41.574 | DEBUG    | __main__:trials:24 - Trial = 15646/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.576 | DEBUG    | __main__:trials:29 - Trial = 15646/30000 | Total reward = 41.72
2022-01-26 14:17:41.580 | DEBUG    | __main__:trials:24 - Trial = 15647/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.581 | DEBUG    | __main__:trials:29 - Trial = 15647/30000 | Total reward = 43.21
2022-01-26 14:17:41.584 | DEBUG    | __main__:trials:24 - Trial = 15648/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.586 | DEBUG    | __main__:trials:29 - Trial = 15648/30000 | Total reward = 57.62
2022-01-26 14:17:41.590 | DEBUG    | __main__:trials:24 - Trial = 15649/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.591 | DEBUG    | __main__:trials:29 - Trial = 15649/30000 | Total reward = 43.37
2022-01-26 14:17:41.595 | DEBUG    | __main__:trials:24 - Trial = 15650/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.595 | DEBUG    | __main__:trials:29 - Trial = 15650/30000 | Total reward = 41.70
2022-01-26 14:17:41.600 | DEBUG    | __main__:trials:24 - Trial = 15651/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.600 | DEBUG    | __main__:trials:29 - Trial = 15651/30000 | Total reward = 42.38
2022-01-26 14:17:41.604 | DEBUG    | __main__:trials:24 - Trial = 15652/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.606 | DEBUG    | __main__:trials:29 - Trial = 15652/30000 | Total reward = 58.62
2022-01-26 14:17:41.609 | DEBUG    | __main__:trials:24 - Trial = 15653/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.610 | DEBUG    | __main__:trials:29 - Trial = 15653/30000 | Total reward = 40.21
2022-01-26 14:17:41.613 | DEBUG    | __main__:trials:24 - Trial = 15654/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.615 | DEBUG    | __main__:trials:29 - Trial = 15654/30000 | Total reward = 50.14
2022-01-26 14:17:41.619 | DEBUG    | __main__:trials:24 - Trial = 15655/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.621 | DEBUG    | __main__:trials:29 - Trial = 15655/30000 | Total reward = 43.03
2022-01-26 14:17:41.624 | DEBUG    | __main__:trials:24 - Trial = 15656/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.625 | DEBUG    | __main__:trials:29 - Trial = 15656/30000 | Total reward = 45.86
2022-01-26 14:17:41.628 | DEBUG    | __main__:trials:24 - Trial = 15657/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.630 | DEBUG    | __main__:trials:29 - Trial = 15657/30000 | Total reward = 43.81
2022-01-26 14:17:41.633 | DEBUG    | __main__:trials:24 - Trial = 15658/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.633 | DEBUG    | __main__:trials:29 - Trial = 15658/30000 | Total reward = 39.97
2022-01-26 14:17:41.637 | DEBUG    | __main__:trials:24 - Trial = 15659/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.638 | DEBUG    | __main__:trials:29 - Trial = 15659/30000 | Total reward = 46.03
2022-01-26 14:17:41.641 | DEBUG    | __main__:trials:26 - Trial = 15660/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:41.643 | DEBUG    | __main__:trials:29 - Trial = 15660/30000 | Total reward = 33.80
2022-01-26 14:17:41.646 | DEBUG    | __main__:trials:24 - Trial = 15661/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.648 | DEBUG    | __main__:trials:29 - Trial = 15661/30000 | Total reward = 55.11
2022-01-26 14:17:41.651 | DEBUG    | __main__:trials:24 - Trial = 15662/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.652 | DEBUG    | __main__:trials:29 - Trial = 15662/30000 | Total reward = 48.63
2022-01-26 14:17:41.656 | DEBUG    | __main__:trials:24 - Trial = 15663/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.658 | DEBUG    | __main__:trials:29 - Trial = 15663/30000 | Total reward = 58.28
2022-01-26 14:17:41.661 | DEBUG    | __main__:trials:24 - Trial = 15664/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.662 | DEBUG    | __main__:trials:29 - Trial = 15664/30000 | Total reward = 50.98
2022-01-26 14:17:41.667 | DEBUG    | __main__:trials:24 - Trial = 15665/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.668 | DEBUG    | __main__:trials:29 - Trial = 15665/30000 | Total reward = 47.05
2022-01-26 14:17:41.672 | DEBUG    | __main__:trials:24 - Trial = 15666/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.673 | DEBUG    | __main__:trials:29 - Trial = 15666/30000 | Total reward = 45.35
2022-01-26 14:17:41.676 | DEBUG    | __main__:trials:24 - Trial = 15667/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.677 | DEBUG    | __main__:trials:29 - Trial = 15667/30000 | Total reward = 54.46
2022-01-26 14:17:41.680 | DEBUG    | __main__:trials:24 - Trial = 15668/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.682 | DEBUG    | __main__:trials:29 - Trial = 15668/30000 | Total reward = 38.26
2022-01-26 14:17:41.685 | DEBUG    | __main__:trials:24 - Trial = 15669/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.687 | DEBUG    | __main__:trials:29 - Trial = 15669/30000 | Total reward = 51.22
2022-01-26 14:17:41.690 | DEBUG    | __main__:trials:24 - Trial = 15670/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.691 | DEBUG    | __main__:trials:29 - Trial = 15670/30000 | Total reward = 62.24
2022-01-26 14:17:41.695 | DEBUG    | __main__:trials:24 - Trial = 15671/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.696 | DEBUG    | __main__:trials:29 - Trial = 15671/30000 | Total reward = 43.38
2022-01-26 14:17:41.700 | DEBUG    | __main__:trials:24 - Trial = 15672/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.701 | DEBUG    | __main__:trials:29 - Trial = 15672/30000 | Total reward = 57.08
2022-01-26 14:17:41.705 | DEBUG    | __main__:trials:24 - Trial = 15673/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.707 | DEBUG    | __main__:trials:29 - Trial = 15673/30000 | Total reward = 54.80
2022-01-26 14:17:41.710 | DEBUG    | __main__:trials:24 - Trial = 15674/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.712 | DEBUG    | __main__:trials:29 - Trial = 15674/30000 | Total reward = 47.34
2022-01-26 14:17:41.715 | DEBUG    | __main__:trials:24 - Trial = 15675/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.717 | DEBUG    | __main__:trials:29 - Trial = 15675/30000 | Total reward = 40.43
2022-01-26 14:17:41.720 | DEBUG    | __main__:trials:24 - Trial = 15676/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.722 | DEBUG    | __main__:trials:29 - Trial = 15676/30000 | Total reward = 47.29
2022-01-26 14:17:41.725 | DEBUG    | __main__:trials:24 - Trial = 15677/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.726 | DEBUG    | __main__:trials:29 - Trial = 15677/30000 | Total reward = 46.58
2022-01-26 14:17:41.731 | DEBUG    | __main__:trials:24 - Trial = 15678/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.732 | DEBUG    | __main__:trials:29 - Trial = 15678/30000 | Total reward = 63.35
2022-01-26 14:17:41.735 | DEBUG    | __main__:trials:24 - Trial = 15679/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.737 | DEBUG    | __main__:trials:29 - Trial = 15679/30000 | Total reward = 56.34
2022-01-26 14:17:41.740 | DEBUG    | __main__:trials:24 - Trial = 15680/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.741 | DEBUG    | __main__:trials:29 - Trial = 15680/30000 | Total reward = 41.00
2022-01-26 14:17:41.745 | DEBUG    | __main__:trials:24 - Trial = 15681/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.747 | DEBUG    | __main__:trials:29 - Trial = 15681/30000 | Total reward = 30.57
2022-01-26 14:17:41.751 | DEBUG    | __main__:trials:24 - Trial = 15682/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.751 | DEBUG    | __main__:trials:29 - Trial = 15682/30000 | Total reward = 41.63
2022-01-26 14:17:41.756 | DEBUG    | __main__:trials:24 - Trial = 15683/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.757 | DEBUG    | __main__:trials:29 - Trial = 15683/30000 | Total reward = 28.12
2022-01-26 14:17:41.761 | DEBUG    | __main__:trials:24 - Trial = 15684/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.762 | DEBUG    | __main__:trials:29 - Trial = 15684/30000 | Total reward = 41.84
2022-01-26 14:17:41.766 | DEBUG    | __main__:trials:24 - Trial = 15685/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.769 | DEBUG    | __main__:trials:29 - Trial = 15685/30000 | Total reward = 40.43
2022-01-26 14:17:41.774 | DEBUG    | __main__:trials:24 - Trial = 15686/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.775 | DEBUG    | __main__:trials:29 - Trial = 15686/30000 | Total reward = 39.65
2022-01-26 14:17:41.780 | DEBUG    | __main__:trials:24 - Trial = 15687/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.781 | DEBUG    | __main__:trials:29 - Trial = 15687/30000 | Total reward = 34.20
2022-01-26 14:17:41.785 | DEBUG    | __main__:trials:24 - Trial = 15688/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.786 | DEBUG    | __main__:trials:29 - Trial = 15688/30000 | Total reward = 42.03
2022-01-26 14:17:41.789 | DEBUG    | __main__:trials:24 - Trial = 15689/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.790 | DEBUG    | __main__:trials:29 - Trial = 15689/30000 | Total reward = 56.74
2022-01-26 14:17:41.793 | DEBUG    | __main__:trials:24 - Trial = 15690/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.795 | DEBUG    | __main__:trials:29 - Trial = 15690/30000 | Total reward = 36.78
2022-01-26 14:17:41.799 | DEBUG    | __main__:trials:24 - Trial = 15691/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.800 | DEBUG    | __main__:trials:29 - Trial = 15691/30000 | Total reward = 39.85
2022-01-26 14:17:41.804 | DEBUG    | __main__:trials:24 - Trial = 15692/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.805 | DEBUG    | __main__:trials:29 - Trial = 15692/30000 | Total reward = 51.63
2022-01-26 14:17:41.809 | DEBUG    | __main__:trials:24 - Trial = 15693/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.810 | DEBUG    | __main__:trials:29 - Trial = 15693/30000 | Total reward = 28.94
2022-01-26 14:17:41.814 | DEBUG    | __main__:trials:26 - Trial = 15694/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:41.814 | DEBUG    | __main__:trials:29 - Trial = 15694/30000 | Total reward = 30.83
2022-01-26 14:17:41.819 | DEBUG    | __main__:trials:24 - Trial = 15695/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.819 | DEBUG    | __main__:trials:29 - Trial = 15695/30000 | Total reward = 50.13
2022-01-26 14:17:41.823 | DEBUG    | __main__:trials:24 - Trial = 15696/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.825 | DEBUG    | __main__:trials:29 - Trial = 15696/30000 | Total reward = 56.56
2022-01-26 14:17:41.828 | DEBUG    | __main__:trials:24 - Trial = 15697/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.830 | DEBUG    | __main__:trials:29 - Trial = 15697/30000 | Total reward = 44.25
2022-01-26 14:17:41.833 | DEBUG    | __main__:trials:24 - Trial = 15698/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.835 | DEBUG    | __main__:trials:29 - Trial = 15698/30000 | Total reward = 62.38
2022-01-26 14:17:41.839 | DEBUG    | __main__:trials:24 - Trial = 15699/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.840 | DEBUG    | __main__:trials:29 - Trial = 15699/30000 | Total reward = 46.52
2022-01-26 14:17:41.843 | DEBUG    | __main__:trials:24 - Trial = 15700/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.845 | DEBUG    | __main__:trials:29 - Trial = 15700/30000 | Total reward = 47.90
2022-01-26 14:17:41.848 | DEBUG    | __main__:trials:24 - Trial = 15701/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.849 | DEBUG    | __main__:trials:29 - Trial = 15701/30000 | Total reward = 43.65
2022-01-26 14:17:41.852 | DEBUG    | __main__:trials:24 - Trial = 15702/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.854 | DEBUG    | __main__:trials:29 - Trial = 15702/30000 | Total reward = 40.18
2022-01-26 14:17:41.858 | DEBUG    | __main__:trials:24 - Trial = 15703/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.859 | DEBUG    | __main__:trials:29 - Trial = 15703/30000 | Total reward = 55.42
2022-01-26 14:17:41.862 | DEBUG    | __main__:trials:24 - Trial = 15704/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.864 | DEBUG    | __main__:trials:29 - Trial = 15704/30000 | Total reward = 61.37
2022-01-26 14:17:41.867 | DEBUG    | __main__:trials:24 - Trial = 15705/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.868 | DEBUG    | __main__:trials:29 - Trial = 15705/30000 | Total reward = 60.63
2022-01-26 14:17:41.872 | DEBUG    | __main__:trials:24 - Trial = 15706/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.873 | DEBUG    | __main__:trials:29 - Trial = 15706/30000 | Total reward = 50.30
2022-01-26 14:17:41.876 | DEBUG    | __main__:trials:24 - Trial = 15707/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.878 | DEBUG    | __main__:trials:29 - Trial = 15707/30000 | Total reward = 46.04
2022-01-26 14:17:41.881 | DEBUG    | __main__:trials:24 - Trial = 15708/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.883 | DEBUG    | __main__:trials:29 - Trial = 15708/30000 | Total reward = 44.79
2022-01-26 14:17:41.886 | DEBUG    | __main__:trials:24 - Trial = 15709/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.887 | DEBUG    | __main__:trials:29 - Trial = 15709/30000 | Total reward = 49.52
2022-01-26 14:17:41.891 | DEBUG    | __main__:trials:24 - Trial = 15710/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.893 | DEBUG    | __main__:trials:29 - Trial = 15710/30000 | Total reward = 62.43
2022-01-26 14:17:41.896 | DEBUG    | __main__:trials:24 - Trial = 15711/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.897 | DEBUG    | __main__:trials:29 - Trial = 15711/30000 | Total reward = 53.01
2022-01-26 14:17:41.901 | DEBUG    | __main__:trials:24 - Trial = 15712/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.901 | DEBUG    | __main__:trials:29 - Trial = 15712/30000 | Total reward = 44.53
2022-01-26 14:17:41.905 | DEBUG    | __main__:trials:24 - Trial = 15713/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.906 | DEBUG    | __main__:trials:29 - Trial = 15713/30000 | Total reward = 46.49
2022-01-26 14:17:41.910 | DEBUG    | __main__:trials:24 - Trial = 15714/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.910 | DEBUG    | __main__:trials:29 - Trial = 15714/30000 | Total reward = 45.60
2022-01-26 14:17:41.914 | DEBUG    | __main__:trials:24 - Trial = 15715/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.915 | DEBUG    | __main__:trials:29 - Trial = 15715/30000 | Total reward = 53.42
2022-01-26 14:17:41.918 | DEBUG    | __main__:trials:24 - Trial = 15716/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.919 | DEBUG    | __main__:trials:29 - Trial = 15716/30000 | Total reward = 36.00
2022-01-26 14:17:41.922 | DEBUG    | __main__:trials:24 - Trial = 15717/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.923 | DEBUG    | __main__:trials:29 - Trial = 15717/30000 | Total reward = 65.86
2022-01-26 14:17:41.926 | DEBUG    | __main__:trials:24 - Trial = 15718/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.927 | DEBUG    | __main__:trials:29 - Trial = 15718/30000 | Total reward = 42.60
2022-01-26 14:17:41.931 | DEBUG    | __main__:trials:24 - Trial = 15719/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.932 | DEBUG    | __main__:trials:29 - Trial = 15719/30000 | Total reward = 63.08
2022-01-26 14:17:41.935 | DEBUG    | __main__:trials:24 - Trial = 15720/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.937 | DEBUG    | __main__:trials:29 - Trial = 15720/30000 | Total reward = 55.89
2022-01-26 14:17:41.940 | DEBUG    | __main__:trials:24 - Trial = 15721/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.941 | DEBUG    | __main__:trials:29 - Trial = 15721/30000 | Total reward = 56.27
2022-01-26 14:17:41.944 | DEBUG    | __main__:trials:24 - Trial = 15722/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.944 | DEBUG    | __main__:trials:29 - Trial = 15722/30000 | Total reward = 42.96
2022-01-26 14:17:41.948 | DEBUG    | __main__:trials:24 - Trial = 15723/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.948 | DEBUG    | __main__:trials:29 - Trial = 15723/30000 | Total reward = 51.05
2022-01-26 14:17:41.952 | DEBUG    | __main__:trials:24 - Trial = 15724/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.953 | DEBUG    | __main__:trials:29 - Trial = 15724/30000 | Total reward = 57.08
2022-01-26 14:17:41.957 | DEBUG    | __main__:trials:24 - Trial = 15725/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.958 | DEBUG    | __main__:trials:29 - Trial = 15725/30000 | Total reward = 51.78
2022-01-26 14:17:41.961 | DEBUG    | __main__:trials:24 - Trial = 15726/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.962 | DEBUG    | __main__:trials:29 - Trial = 15726/30000 | Total reward = 43.03
2022-01-26 14:17:41.965 | DEBUG    | __main__:trials:26 - Trial = 15727/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:41.966 | DEBUG    | __main__:trials:29 - Trial = 15727/30000 | Total reward = 12.26
2022-01-26 14:17:41.969 | DEBUG    | __main__:trials:24 - Trial = 15728/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.971 | DEBUG    | __main__:trials:29 - Trial = 15728/30000 | Total reward = 39.07
2022-01-26 14:17:41.974 | DEBUG    | __main__:trials:24 - Trial = 15729/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.975 | DEBUG    | __main__:trials:29 - Trial = 15729/30000 | Total reward = 47.81
2022-01-26 14:17:41.979 | DEBUG    | __main__:trials:24 - Trial = 15730/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.980 | DEBUG    | __main__:trials:29 - Trial = 15730/30000 | Total reward = 40.50
2022-01-26 14:17:41.984 | DEBUG    | __main__:trials:24 - Trial = 15731/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.985 | DEBUG    | __main__:trials:29 - Trial = 15731/30000 | Total reward = 42.48
2022-01-26 14:17:41.989 | DEBUG    | __main__:trials:24 - Trial = 15732/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.990 | DEBUG    | __main__:trials:29 - Trial = 15732/30000 | Total reward = 41.57
2022-01-26 14:17:41.994 | DEBUG    | __main__:trials:24 - Trial = 15733/30000 | Max number of steps (20) reached
2022-01-26 14:17:41.995 | DEBUG    | __main__:trials:29 - Trial = 15733/30000 | Total reward = 43.81
2022-01-26 14:17:41.998 | DEBUG    | __main__:trials:24 - Trial = 15734/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.000 | DEBUG    | __main__:trials:29 - Trial = 15734/30000 | Total reward = 37.62
2022-01-26 14:17:42.004 | DEBUG    | __main__:trials:24 - Trial = 15735/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.004 | DEBUG    | __main__:trials:29 - Trial = 15735/30000 | Total reward = 40.40
2022-01-26 14:17:42.008 | DEBUG    | __main__:trials:24 - Trial = 15736/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.009 | DEBUG    | __main__:trials:29 - Trial = 15736/30000 | Total reward = 56.90
2022-01-26 14:17:42.013 | DEBUG    | __main__:trials:24 - Trial = 15737/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.014 | DEBUG    | __main__:trials:29 - Trial = 15737/30000 | Total reward = 41.41
2022-01-26 14:17:42.018 | DEBUG    | __main__:trials:24 - Trial = 15738/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.018 | DEBUG    | __main__:trials:29 - Trial = 15738/30000 | Total reward = 40.28
2022-01-26 14:17:42.023 | DEBUG    | __main__:trials:24 - Trial = 15739/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.024 | DEBUG    | __main__:trials:29 - Trial = 15739/30000 | Total reward = 47.69
2022-01-26 14:17:42.028 | DEBUG    | __main__:trials:24 - Trial = 15740/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.029 | DEBUG    | __main__:trials:29 - Trial = 15740/30000 | Total reward = 41.56
2022-01-26 14:17:42.033 | DEBUG    | __main__:trials:24 - Trial = 15741/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.034 | DEBUG    | __main__:trials:29 - Trial = 15741/30000 | Total reward = 43.31
2022-01-26 14:17:42.037 | DEBUG    | __main__:trials:24 - Trial = 15742/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.038 | DEBUG    | __main__:trials:29 - Trial = 15742/30000 | Total reward = 43.85
2022-01-26 14:17:42.041 | DEBUG    | __main__:trials:26 - Trial = 15743/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:42.042 | DEBUG    | __main__:trials:29 - Trial = 15743/30000 | Total reward = 28.25
2022-01-26 14:17:42.045 | DEBUG    | __main__:trials:26 - Trial = 15744/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:42.046 | DEBUG    | __main__:trials:29 - Trial = 15744/30000 | Total reward = 25.29
2022-01-26 14:17:42.050 | DEBUG    | __main__:trials:24 - Trial = 15745/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.051 | DEBUG    | __main__:trials:29 - Trial = 15745/30000 | Total reward = 40.95
2022-01-26 14:17:42.054 | DEBUG    | __main__:trials:24 - Trial = 15746/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.056 | DEBUG    | __main__:trials:29 - Trial = 15746/30000 | Total reward = 56.30
2022-01-26 14:17:42.060 | DEBUG    | __main__:trials:24 - Trial = 15747/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.062 | DEBUG    | __main__:trials:29 - Trial = 15747/30000 | Total reward = 59.79
2022-01-26 14:17:42.065 | DEBUG    | __main__:trials:24 - Trial = 15748/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.065 | DEBUG    | __main__:trials:29 - Trial = 15748/30000 | Total reward = 37.44
2022-01-26 14:17:42.069 | DEBUG    | __main__:trials:24 - Trial = 15749/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.070 | DEBUG    | __main__:trials:29 - Trial = 15749/30000 | Total reward = 59.39
2022-01-26 14:17:42.073 | DEBUG    | __main__:trials:24 - Trial = 15750/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.074 | DEBUG    | __main__:trials:29 - Trial = 15750/30000 | Total reward = 44.12
2022-01-26 14:17:42.077 | DEBUG    | __main__:trials:24 - Trial = 15751/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.078 | DEBUG    | __main__:trials:29 - Trial = 15751/30000 | Total reward = 57.08
2022-01-26 14:17:42.081 | DEBUG    | __main__:trials:24 - Trial = 15752/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.082 | DEBUG    | __main__:trials:29 - Trial = 15752/30000 | Total reward = 38.75
2022-01-26 14:17:42.085 | DEBUG    | __main__:trials:24 - Trial = 15753/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.086 | DEBUG    | __main__:trials:29 - Trial = 15753/30000 | Total reward = 49.57
2022-01-26 14:17:42.090 | DEBUG    | __main__:trials:24 - Trial = 15754/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.092 | DEBUG    | __main__:trials:29 - Trial = 15754/30000 | Total reward = 47.01
2022-01-26 14:17:42.096 | DEBUG    | __main__:trials:24 - Trial = 15755/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.097 | DEBUG    | __main__:trials:29 - Trial = 15755/30000 | Total reward = 38.68
2022-01-26 14:17:42.100 | DEBUG    | __main__:trials:24 - Trial = 15756/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.101 | DEBUG    | __main__:trials:29 - Trial = 15756/30000 | Total reward = 56.44
2022-01-26 14:17:42.104 | DEBUG    | __main__:trials:24 - Trial = 15757/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.105 | DEBUG    | __main__:trials:29 - Trial = 15757/30000 | Total reward = 52.98
2022-01-26 14:17:42.109 | DEBUG    | __main__:trials:24 - Trial = 15758/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.109 | DEBUG    | __main__:trials:29 - Trial = 15758/30000 | Total reward = 39.42
2022-01-26 14:17:42.112 | DEBUG    | __main__:trials:24 - Trial = 15759/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.113 | DEBUG    | __main__:trials:29 - Trial = 15759/30000 | Total reward = 51.67
2022-01-26 14:17:42.117 | DEBUG    | __main__:trials:24 - Trial = 15760/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.118 | DEBUG    | __main__:trials:29 - Trial = 15760/30000 | Total reward = 55.56
2022-01-26 14:17:42.122 | DEBUG    | __main__:trials:24 - Trial = 15761/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.123 | DEBUG    | __main__:trials:29 - Trial = 15761/30000 | Total reward = 63.53
2022-01-26 14:17:42.126 | DEBUG    | __main__:trials:26 - Trial = 15762/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:42.127 | DEBUG    | __main__:trials:29 - Trial = 15762/30000 | Total reward = 25.40
2022-01-26 14:17:42.132 | DEBUG    | __main__:trials:24 - Trial = 15763/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.133 | DEBUG    | __main__:trials:29 - Trial = 15763/30000 | Total reward = 51.99
2022-01-26 14:17:42.136 | DEBUG    | __main__:trials:24 - Trial = 15764/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.137 | DEBUG    | __main__:trials:29 - Trial = 15764/30000 | Total reward = 34.83
2022-01-26 14:17:42.140 | DEBUG    | __main__:trials:24 - Trial = 15765/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.142 | DEBUG    | __main__:trials:29 - Trial = 15765/30000 | Total reward = 52.82
2022-01-26 14:17:42.145 | DEBUG    | __main__:trials:24 - Trial = 15766/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.146 | DEBUG    | __main__:trials:29 - Trial = 15766/30000 | Total reward = 52.12
2022-01-26 14:17:42.150 | DEBUG    | __main__:trials:24 - Trial = 15767/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.151 | DEBUG    | __main__:trials:29 - Trial = 15767/30000 | Total reward = 37.27
2022-01-26 14:17:42.155 | DEBUG    | __main__:trials:24 - Trial = 15768/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.156 | DEBUG    | __main__:trials:29 - Trial = 15768/30000 | Total reward = 58.89
2022-01-26 14:17:42.160 | DEBUG    | __main__:trials:24 - Trial = 15769/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.161 | DEBUG    | __main__:trials:29 - Trial = 15769/30000 | Total reward = 62.57
2022-01-26 14:17:42.165 | DEBUG    | __main__:trials:24 - Trial = 15770/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.166 | DEBUG    | __main__:trials:29 - Trial = 15770/30000 | Total reward = 35.02
2022-01-26 14:17:42.170 | DEBUG    | __main__:trials:24 - Trial = 15771/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.171 | DEBUG    | __main__:trials:29 - Trial = 15771/30000 | Total reward = 58.40
2022-01-26 14:17:42.175 | DEBUG    | __main__:trials:24 - Trial = 15772/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.176 | DEBUG    | __main__:trials:29 - Trial = 15772/30000 | Total reward = 55.65
2022-01-26 14:17:42.180 | DEBUG    | __main__:trials:24 - Trial = 15773/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.182 | DEBUG    | __main__:trials:29 - Trial = 15773/30000 | Total reward = 56.77
2022-01-26 14:17:42.185 | DEBUG    | __main__:trials:24 - Trial = 15774/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.186 | DEBUG    | __main__:trials:29 - Trial = 15774/30000 | Total reward = 38.38
2022-01-26 14:17:42.190 | DEBUG    | __main__:trials:24 - Trial = 15775/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.191 | DEBUG    | __main__:trials:29 - Trial = 15775/30000 | Total reward = 57.67
2022-01-26 14:17:42.195 | DEBUG    | __main__:trials:24 - Trial = 15776/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.197 | DEBUG    | __main__:trials:29 - Trial = 15776/30000 | Total reward = 48.59
2022-01-26 14:17:42.200 | DEBUG    | __main__:trials:24 - Trial = 15777/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.201 | DEBUG    | __main__:trials:29 - Trial = 15777/30000 | Total reward = 53.54
2022-01-26 14:17:42.205 | DEBUG    | __main__:trials:24 - Trial = 15778/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.207 | DEBUG    | __main__:trials:29 - Trial = 15778/30000 | Total reward = 37.96
2022-01-26 14:17:42.210 | DEBUG    | __main__:trials:24 - Trial = 15779/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.211 | DEBUG    | __main__:trials:29 - Trial = 15779/30000 | Total reward = 40.83
2022-01-26 14:17:42.215 | DEBUG    | __main__:trials:24 - Trial = 15780/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.216 | DEBUG    | __main__:trials:29 - Trial = 15780/30000 | Total reward = 51.22
2022-01-26 14:17:42.220 | DEBUG    | __main__:trials:24 - Trial = 15781/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.221 | DEBUG    | __main__:trials:29 - Trial = 15781/30000 | Total reward = 65.02
2022-01-26 14:17:42.225 | DEBUG    | __main__:trials:24 - Trial = 15782/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.226 | DEBUG    | __main__:trials:29 - Trial = 15782/30000 | Total reward = 57.08
2022-01-26 14:17:42.229 | DEBUG    | __main__:trials:24 - Trial = 15783/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.229 | DEBUG    | __main__:trials:29 - Trial = 15783/30000 | Total reward = 53.13
2022-01-26 14:17:42.233 | DEBUG    | __main__:trials:24 - Trial = 15784/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.235 | DEBUG    | __main__:trials:29 - Trial = 15784/30000 | Total reward = 40.13
2022-01-26 14:17:42.238 | DEBUG    | __main__:trials:24 - Trial = 15785/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.239 | DEBUG    | __main__:trials:29 - Trial = 15785/30000 | Total reward = 54.02
2022-01-26 14:17:42.243 | DEBUG    | __main__:trials:24 - Trial = 15786/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.244 | DEBUG    | __main__:trials:29 - Trial = 15786/30000 | Total reward = 42.05
2022-01-26 14:17:42.248 | DEBUG    | __main__:trials:24 - Trial = 15787/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.250 | DEBUG    | __main__:trials:29 - Trial = 15787/30000 | Total reward = 46.79
2022-01-26 14:17:42.254 | DEBUG    | __main__:trials:24 - Trial = 15788/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.255 | DEBUG    | __main__:trials:29 - Trial = 15788/30000 | Total reward = 53.41
2022-01-26 14:17:42.259 | DEBUG    | __main__:trials:24 - Trial = 15789/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.260 | DEBUG    | __main__:trials:29 - Trial = 15789/30000 | Total reward = 53.19
2022-01-26 14:17:42.264 | DEBUG    | __main__:trials:24 - Trial = 15790/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.266 | DEBUG    | __main__:trials:29 - Trial = 15790/30000 | Total reward = 28.91
2022-01-26 14:17:42.269 | DEBUG    | __main__:trials:24 - Trial = 15791/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.271 | DEBUG    | __main__:trials:29 - Trial = 15791/30000 | Total reward = 47.16
2022-01-26 14:17:42.274 | DEBUG    | __main__:trials:24 - Trial = 15792/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.276 | DEBUG    | __main__:trials:29 - Trial = 15792/30000 | Total reward = 52.50
2022-01-26 14:17:42.280 | DEBUG    | __main__:trials:24 - Trial = 15793/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.281 | DEBUG    | __main__:trials:29 - Trial = 15793/30000 | Total reward = 50.41
2022-01-26 14:17:42.285 | DEBUG    | __main__:trials:24 - Trial = 15794/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.286 | DEBUG    | __main__:trials:29 - Trial = 15794/30000 | Total reward = 43.87
2022-01-26 14:17:42.290 | DEBUG    | __main__:trials:24 - Trial = 15795/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.290 | DEBUG    | __main__:trials:29 - Trial = 15795/30000 | Total reward = 38.81
2022-01-26 14:17:42.294 | DEBUG    | __main__:trials:24 - Trial = 15796/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.295 | DEBUG    | __main__:trials:29 - Trial = 15796/30000 | Total reward = 51.48
2022-01-26 14:17:42.300 | DEBUG    | __main__:trials:24 - Trial = 15797/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.300 | DEBUG    | __main__:trials:29 - Trial = 15797/30000 | Total reward = 55.89
2022-01-26 14:17:42.304 | DEBUG    | __main__:trials:24 - Trial = 15798/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.306 | DEBUG    | __main__:trials:29 - Trial = 15798/30000 | Total reward = 52.28
2022-01-26 14:17:42.309 | DEBUG    | __main__:trials:24 - Trial = 15799/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.310 | DEBUG    | __main__:trials:29 - Trial = 15799/30000 | Total reward = 57.08
2022-01-26 14:17:42.313 | DEBUG    | __main__:trials:24 - Trial = 15800/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.314 | DEBUG    | __main__:trials:29 - Trial = 15800/30000 | Total reward = 60.58
2022-01-26 14:17:42.317 | DEBUG    | __main__:trials:24 - Trial = 15801/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.319 | DEBUG    | __main__:trials:29 - Trial = 15801/30000 | Total reward = 54.12
2022-01-26 14:17:42.322 | DEBUG    | __main__:trials:24 - Trial = 15802/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.323 | DEBUG    | __main__:trials:29 - Trial = 15802/30000 | Total reward = 60.16
2022-01-26 14:17:42.328 | DEBUG    | __main__:trials:24 - Trial = 15803/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.328 | DEBUG    | __main__:trials:29 - Trial = 15803/30000 | Total reward = 44.93
2022-01-26 14:17:42.332 | DEBUG    | __main__:trials:24 - Trial = 15804/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.334 | DEBUG    | __main__:trials:29 - Trial = 15804/30000 | Total reward = 46.51
2022-01-26 14:17:42.337 | DEBUG    | __main__:trials:24 - Trial = 15805/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.338 | DEBUG    | __main__:trials:29 - Trial = 15805/30000 | Total reward = 51.25
2022-01-26 14:17:42.343 | DEBUG    | __main__:trials:24 - Trial = 15806/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.343 | DEBUG    | __main__:trials:29 - Trial = 15806/30000 | Total reward = 59.60
2022-01-26 14:17:42.347 | DEBUG    | __main__:trials:24 - Trial = 15807/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.349 | DEBUG    | __main__:trials:29 - Trial = 15807/30000 | Total reward = 57.54
2022-01-26 14:17:42.352 | DEBUG    | __main__:trials:24 - Trial = 15808/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.354 | DEBUG    | __main__:trials:29 - Trial = 15808/30000 | Total reward = 55.51
2022-01-26 14:17:42.358 | DEBUG    | __main__:trials:24 - Trial = 15809/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.359 | DEBUG    | __main__:trials:29 - Trial = 15809/30000 | Total reward = 42.52
2022-01-26 14:17:42.363 | DEBUG    | __main__:trials:24 - Trial = 15810/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.364 | DEBUG    | __main__:trials:29 - Trial = 15810/30000 | Total reward = 47.13
2022-01-26 14:17:42.368 | DEBUG    | __main__:trials:24 - Trial = 15811/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.370 | DEBUG    | __main__:trials:29 - Trial = 15811/30000 | Total reward = 47.72
2022-01-26 14:17:42.373 | DEBUG    | __main__:trials:24 - Trial = 15812/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.374 | DEBUG    | __main__:trials:29 - Trial = 15812/30000 | Total reward = 50.52
2022-01-26 14:17:42.379 | DEBUG    | __main__:trials:24 - Trial = 15813/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.380 | DEBUG    | __main__:trials:29 - Trial = 15813/30000 | Total reward = 52.56
2022-01-26 14:17:42.384 | DEBUG    | __main__:trials:24 - Trial = 15814/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.385 | DEBUG    | __main__:trials:29 - Trial = 15814/30000 | Total reward = 63.43
2022-01-26 14:17:42.388 | DEBUG    | __main__:trials:24 - Trial = 15815/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.390 | DEBUG    | __main__:trials:29 - Trial = 15815/30000 | Total reward = 41.53
2022-01-26 14:17:42.394 | DEBUG    | __main__:trials:24 - Trial = 15816/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.394 | DEBUG    | __main__:trials:29 - Trial = 15816/30000 | Total reward = 51.67
2022-01-26 14:17:42.398 | DEBUG    | __main__:trials:24 - Trial = 15817/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.398 | DEBUG    | __main__:trials:29 - Trial = 15817/30000 | Total reward = 62.21
2022-01-26 14:17:42.402 | DEBUG    | __main__:trials:24 - Trial = 15818/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.403 | DEBUG    | __main__:trials:29 - Trial = 15818/30000 | Total reward = 57.08
2022-01-26 14:17:42.407 | DEBUG    | __main__:trials:24 - Trial = 15819/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.409 | DEBUG    | __main__:trials:29 - Trial = 15819/30000 | Total reward = 48.14
2022-01-26 14:17:42.412 | DEBUG    | __main__:trials:24 - Trial = 15820/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.413 | DEBUG    | __main__:trials:29 - Trial = 15820/30000 | Total reward = 49.40
2022-01-26 14:17:42.416 | DEBUG    | __main__:trials:24 - Trial = 15821/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.417 | DEBUG    | __main__:trials:29 - Trial = 15821/30000 | Total reward = 53.73
2022-01-26 14:17:42.420 | DEBUG    | __main__:trials:24 - Trial = 15822/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.421 | DEBUG    | __main__:trials:29 - Trial = 15822/30000 | Total reward = 60.32
2022-01-26 14:17:42.424 | DEBUG    | __main__:trials:24 - Trial = 15823/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.426 | DEBUG    | __main__:trials:29 - Trial = 15823/30000 | Total reward = 40.29
2022-01-26 14:17:42.430 | DEBUG    | __main__:trials:24 - Trial = 15824/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.431 | DEBUG    | __main__:trials:29 - Trial = 15824/30000 | Total reward = 35.52
2022-01-26 14:17:42.434 | DEBUG    | __main__:trials:24 - Trial = 15825/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.435 | DEBUG    | __main__:trials:29 - Trial = 15825/30000 | Total reward = 45.38
2022-01-26 14:17:42.438 | DEBUG    | __main__:trials:24 - Trial = 15826/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.439 | DEBUG    | __main__:trials:29 - Trial = 15826/30000 | Total reward = 47.21
2022-01-26 14:17:42.442 | DEBUG    | __main__:trials:24 - Trial = 15827/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.444 | DEBUG    | __main__:trials:29 - Trial = 15827/30000 | Total reward = 60.14
2022-01-26 14:17:42.448 | DEBUG    | __main__:trials:24 - Trial = 15828/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.449 | DEBUG    | __main__:trials:29 - Trial = 15828/30000 | Total reward = 44.59
2022-01-26 14:17:42.452 | DEBUG    | __main__:trials:24 - Trial = 15829/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.454 | DEBUG    | __main__:trials:29 - Trial = 15829/30000 | Total reward = 56.57
2022-01-26 14:17:42.457 | DEBUG    | __main__:trials:24 - Trial = 15830/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.458 | DEBUG    | __main__:trials:29 - Trial = 15830/30000 | Total reward = 57.95
2022-01-26 14:17:42.461 | DEBUG    | __main__:trials:24 - Trial = 15831/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.463 | DEBUG    | __main__:trials:29 - Trial = 15831/30000 | Total reward = 47.14
2022-01-26 14:17:42.466 | DEBUG    | __main__:trials:24 - Trial = 15832/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.467 | DEBUG    | __main__:trials:29 - Trial = 15832/30000 | Total reward = 48.49
2022-01-26 14:17:42.471 | DEBUG    | __main__:trials:24 - Trial = 15833/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.472 | DEBUG    | __main__:trials:29 - Trial = 15833/30000 | Total reward = 53.95
2022-01-26 14:17:42.475 | DEBUG    | __main__:trials:24 - Trial = 15834/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.477 | DEBUG    | __main__:trials:29 - Trial = 15834/30000 | Total reward = 49.33
2022-01-26 14:17:42.480 | DEBUG    | __main__:trials:24 - Trial = 15835/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.482 | DEBUG    | __main__:trials:29 - Trial = 15835/30000 | Total reward = 46.53
2022-01-26 14:17:42.485 | DEBUG    | __main__:trials:24 - Trial = 15836/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.485 | DEBUG    | __main__:trials:29 - Trial = 15836/30000 | Total reward = 52.49
2022-01-26 14:17:42.489 | DEBUG    | __main__:trials:24 - Trial = 15837/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.490 | DEBUG    | __main__:trials:29 - Trial = 15837/30000 | Total reward = 41.67
2022-01-26 14:17:42.493 | DEBUG    | __main__:trials:24 - Trial = 15838/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.495 | DEBUG    | __main__:trials:29 - Trial = 15838/30000 | Total reward = 59.09
2022-01-26 14:17:42.498 | DEBUG    | __main__:trials:24 - Trial = 15839/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.500 | DEBUG    | __main__:trials:29 - Trial = 15839/30000 | Total reward = 64.39
2022-01-26 14:17:42.503 | DEBUG    | __main__:trials:24 - Trial = 15840/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.504 | DEBUG    | __main__:trials:29 - Trial = 15840/30000 | Total reward = 43.79
2022-01-26 14:17:42.507 | DEBUG    | __main__:trials:24 - Trial = 15841/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.508 | DEBUG    | __main__:trials:29 - Trial = 15841/30000 | Total reward = 54.46
2022-01-26 14:17:42.511 | DEBUG    | __main__:trials:24 - Trial = 15842/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.513 | DEBUG    | __main__:trials:29 - Trial = 15842/30000 | Total reward = 41.89
2022-01-26 14:17:42.516 | DEBUG    | __main__:trials:24 - Trial = 15843/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.517 | DEBUG    | __main__:trials:29 - Trial = 15843/30000 | Total reward = 56.34
2022-01-26 14:17:42.521 | DEBUG    | __main__:trials:24 - Trial = 15844/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.522 | DEBUG    | __main__:trials:29 - Trial = 15844/30000 | Total reward = 46.29
2022-01-26 14:17:42.525 | DEBUG    | __main__:trials:24 - Trial = 15845/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.526 | DEBUG    | __main__:trials:29 - Trial = 15845/30000 | Total reward = 47.49
2022-01-26 14:17:42.530 | DEBUG    | __main__:trials:24 - Trial = 15846/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.532 | DEBUG    | __main__:trials:29 - Trial = 15846/30000 | Total reward = 61.37
2022-01-26 14:17:42.535 | DEBUG    | __main__:trials:24 - Trial = 15847/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.537 | DEBUG    | __main__:trials:29 - Trial = 15847/30000 | Total reward = 46.37
2022-01-26 14:17:42.540 | DEBUG    | __main__:trials:24 - Trial = 15848/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.541 | DEBUG    | __main__:trials:29 - Trial = 15848/30000 | Total reward = 60.21
2022-01-26 14:17:42.545 | DEBUG    | __main__:trials:24 - Trial = 15849/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.547 | DEBUG    | __main__:trials:29 - Trial = 15849/30000 | Total reward = 34.59
2022-01-26 14:17:42.550 | DEBUG    | __main__:trials:24 - Trial = 15850/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.552 | DEBUG    | __main__:trials:29 - Trial = 15850/30000 | Total reward = 48.69
2022-01-26 14:17:42.555 | DEBUG    | __main__:trials:24 - Trial = 15851/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.556 | DEBUG    | __main__:trials:29 - Trial = 15851/30000 | Total reward = 60.54
2022-01-26 14:17:42.559 | DEBUG    | __main__:trials:24 - Trial = 15852/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.560 | DEBUG    | __main__:trials:29 - Trial = 15852/30000 | Total reward = 64.36
2022-01-26 14:17:42.563 | DEBUG    | __main__:trials:24 - Trial = 15853/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.564 | DEBUG    | __main__:trials:29 - Trial = 15853/30000 | Total reward = 60.75
2022-01-26 14:17:42.567 | DEBUG    | __main__:trials:24 - Trial = 15854/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.569 | DEBUG    | __main__:trials:29 - Trial = 15854/30000 | Total reward = 48.13
2022-01-26 14:17:42.572 | DEBUG    | __main__:trials:24 - Trial = 15855/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.573 | DEBUG    | __main__:trials:29 - Trial = 15855/30000 | Total reward = 63.64
2022-01-26 14:17:42.577 | DEBUG    | __main__:trials:24 - Trial = 15856/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.578 | DEBUG    | __main__:trials:29 - Trial = 15856/30000 | Total reward = 57.37
2022-01-26 14:17:42.581 | DEBUG    | __main__:trials:24 - Trial = 15857/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.582 | DEBUG    | __main__:trials:29 - Trial = 15857/30000 | Total reward = 47.48
2022-01-26 14:17:42.585 | DEBUG    | __main__:trials:24 - Trial = 15858/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.586 | DEBUG    | __main__:trials:29 - Trial = 15858/30000 | Total reward = 61.23
2022-01-26 14:17:42.589 | DEBUG    | __main__:trials:24 - Trial = 15859/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.591 | DEBUG    | __main__:trials:29 - Trial = 15859/30000 | Total reward = 56.25
2022-01-26 14:17:42.593 | DEBUG    | __main__:trials:24 - Trial = 15860/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.595 | DEBUG    | __main__:trials:29 - Trial = 15860/30000 | Total reward = 58.42
2022-01-26 14:17:42.598 | DEBUG    | __main__:trials:24 - Trial = 15861/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.599 | DEBUG    | __main__:trials:29 - Trial = 15861/30000 | Total reward = 44.55
2022-01-26 14:17:42.603 | DEBUG    | __main__:trials:24 - Trial = 15862/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.604 | DEBUG    | __main__:trials:29 - Trial = 15862/30000 | Total reward = 60.69
2022-01-26 14:17:42.608 | DEBUG    | __main__:trials:24 - Trial = 15863/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.608 | DEBUG    | __main__:trials:29 - Trial = 15863/30000 | Total reward = 42.49
2022-01-26 14:17:42.612 | DEBUG    | __main__:trials:24 - Trial = 15864/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.613 | DEBUG    | __main__:trials:29 - Trial = 15864/30000 | Total reward = 54.04
2022-01-26 14:17:42.616 | DEBUG    | __main__:trials:24 - Trial = 15865/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.618 | DEBUG    | __main__:trials:29 - Trial = 15865/30000 | Total reward = 54.35
2022-01-26 14:17:42.622 | DEBUG    | __main__:trials:24 - Trial = 15866/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.623 | DEBUG    | __main__:trials:29 - Trial = 15866/30000 | Total reward = 51.01
2022-01-26 14:17:42.627 | DEBUG    | __main__:trials:24 - Trial = 15867/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.627 | DEBUG    | __main__:trials:29 - Trial = 15867/30000 | Total reward = 42.71
2022-01-26 14:17:42.631 | DEBUG    | __main__:trials:24 - Trial = 15868/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.633 | DEBUG    | __main__:trials:29 - Trial = 15868/30000 | Total reward = 46.23
2022-01-26 14:17:42.635 | DEBUG    | __main__:trials:24 - Trial = 15869/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.636 | DEBUG    | __main__:trials:29 - Trial = 15869/30000 | Total reward = 44.22
2022-01-26 14:17:42.639 | DEBUG    | __main__:trials:24 - Trial = 15870/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.640 | DEBUG    | __main__:trials:29 - Trial = 15870/30000 | Total reward = 41.75
2022-01-26 14:17:42.643 | DEBUG    | __main__:trials:24 - Trial = 15871/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.645 | DEBUG    | __main__:trials:29 - Trial = 15871/30000 | Total reward = 63.17
2022-01-26 14:17:42.648 | DEBUG    | __main__:trials:24 - Trial = 15872/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.648 | DEBUG    | __main__:trials:29 - Trial = 15872/30000 | Total reward = 31.84
2022-01-26 14:17:42.652 | DEBUG    | __main__:trials:24 - Trial = 15873/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.654 | DEBUG    | __main__:trials:29 - Trial = 15873/30000 | Total reward = 51.45
2022-01-26 14:17:42.656 | DEBUG    | __main__:trials:24 - Trial = 15874/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.657 | DEBUG    | __main__:trials:29 - Trial = 15874/30000 | Total reward = 41.13
2022-01-26 14:17:42.661 | DEBUG    | __main__:trials:24 - Trial = 15875/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.662 | DEBUG    | __main__:trials:29 - Trial = 15875/30000 | Total reward = 47.32
2022-01-26 14:17:42.665 | DEBUG    | __main__:trials:24 - Trial = 15876/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.666 | DEBUG    | __main__:trials:29 - Trial = 15876/30000 | Total reward = 47.36
2022-01-26 14:17:42.670 | DEBUG    | __main__:trials:24 - Trial = 15877/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.670 | DEBUG    | __main__:trials:29 - Trial = 15877/30000 | Total reward = 53.25
2022-01-26 14:17:42.675 | DEBUG    | __main__:trials:24 - Trial = 15878/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.676 | DEBUG    | __main__:trials:29 - Trial = 15878/30000 | Total reward = 59.23
2022-01-26 14:17:42.680 | DEBUG    | __main__:trials:24 - Trial = 15879/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.682 | DEBUG    | __main__:trials:29 - Trial = 15879/30000 | Total reward = 57.99
2022-01-26 14:17:42.686 | DEBUG    | __main__:trials:24 - Trial = 15880/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.686 | DEBUG    | __main__:trials:29 - Trial = 15880/30000 | Total reward = 57.08
2022-01-26 14:17:42.690 | DEBUG    | __main__:trials:24 - Trial = 15881/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.691 | DEBUG    | __main__:trials:29 - Trial = 15881/30000 | Total reward = 44.61
2022-01-26 14:17:42.695 | DEBUG    | __main__:trials:24 - Trial = 15882/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.696 | DEBUG    | __main__:trials:29 - Trial = 15882/30000 | Total reward = 46.90
2022-01-26 14:17:42.700 | DEBUG    | __main__:trials:24 - Trial = 15883/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.701 | DEBUG    | __main__:trials:29 - Trial = 15883/30000 | Total reward = 39.03
2022-01-26 14:17:42.705 | DEBUG    | __main__:trials:24 - Trial = 15884/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.707 | DEBUG    | __main__:trials:29 - Trial = 15884/30000 | Total reward = 45.67
2022-01-26 14:17:42.710 | DEBUG    | __main__:trials:24 - Trial = 15885/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.712 | DEBUG    | __main__:trials:29 - Trial = 15885/30000 | Total reward = 43.24
2022-01-26 14:17:42.715 | DEBUG    | __main__:trials:24 - Trial = 15886/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.717 | DEBUG    | __main__:trials:29 - Trial = 15886/30000 | Total reward = 49.60
2022-01-26 14:17:42.720 | DEBUG    | __main__:trials:24 - Trial = 15887/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.722 | DEBUG    | __main__:trials:29 - Trial = 15887/30000 | Total reward = 46.16
2022-01-26 14:17:42.725 | DEBUG    | __main__:trials:24 - Trial = 15888/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.726 | DEBUG    | __main__:trials:29 - Trial = 15888/30000 | Total reward = 45.32
2022-01-26 14:17:42.730 | DEBUG    | __main__:trials:24 - Trial = 15889/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.731 | DEBUG    | __main__:trials:29 - Trial = 15889/30000 | Total reward = 47.79
2022-01-26 14:17:42.735 | DEBUG    | __main__:trials:24 - Trial = 15890/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.736 | DEBUG    | __main__:trials:29 - Trial = 15890/30000 | Total reward = 43.66
2022-01-26 14:17:42.740 | DEBUG    | __main__:trials:24 - Trial = 15891/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.742 | DEBUG    | __main__:trials:29 - Trial = 15891/30000 | Total reward = 52.03
2022-01-26 14:17:42.745 | DEBUG    | __main__:trials:24 - Trial = 15892/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.746 | DEBUG    | __main__:trials:29 - Trial = 15892/30000 | Total reward = 57.00
2022-01-26 14:17:42.750 | DEBUG    | __main__:trials:24 - Trial = 15893/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.751 | DEBUG    | __main__:trials:29 - Trial = 15893/30000 | Total reward = 48.79
2022-01-26 14:17:42.755 | DEBUG    | __main__:trials:24 - Trial = 15894/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.756 | DEBUG    | __main__:trials:29 - Trial = 15894/30000 | Total reward = 40.63
2022-01-26 14:17:42.760 | DEBUG    | __main__:trials:24 - Trial = 15895/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.761 | DEBUG    | __main__:trials:29 - Trial = 15895/30000 | Total reward = 48.35
2022-01-26 14:17:42.765 | DEBUG    | __main__:trials:24 - Trial = 15896/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.766 | DEBUG    | __main__:trials:29 - Trial = 15896/30000 | Total reward = 45.07
2022-01-26 14:17:42.770 | DEBUG    | __main__:trials:24 - Trial = 15897/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.771 | DEBUG    | __main__:trials:29 - Trial = 15897/30000 | Total reward = 49.31
2022-01-26 14:17:42.774 | DEBUG    | __main__:trials:24 - Trial = 15898/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.776 | DEBUG    | __main__:trials:29 - Trial = 15898/30000 | Total reward = 55.79
2022-01-26 14:17:42.779 | DEBUG    | __main__:trials:24 - Trial = 15899/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.781 | DEBUG    | __main__:trials:29 - Trial = 15899/30000 | Total reward = 47.46
2022-01-26 14:17:42.784 | DEBUG    | __main__:trials:24 - Trial = 15900/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.786 | DEBUG    | __main__:trials:29 - Trial = 15900/30000 | Total reward = 50.43
2022-01-26 14:17:42.789 | DEBUG    | __main__:trials:24 - Trial = 15901/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.790 | DEBUG    | __main__:trials:29 - Trial = 15901/30000 | Total reward = 48.42
2022-01-26 14:17:42.794 | DEBUG    | __main__:trials:24 - Trial = 15902/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.795 | DEBUG    | __main__:trials:29 - Trial = 15902/30000 | Total reward = 41.93
2022-01-26 14:17:42.799 | DEBUG    | __main__:trials:24 - Trial = 15903/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.800 | DEBUG    | __main__:trials:29 - Trial = 15903/30000 | Total reward = 63.08
2022-01-26 14:17:42.803 | DEBUG    | __main__:trials:24 - Trial = 15904/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.804 | DEBUG    | __main__:trials:29 - Trial = 15904/30000 | Total reward = 43.75
2022-01-26 14:17:42.807 | DEBUG    | __main__:trials:24 - Trial = 15905/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.809 | DEBUG    | __main__:trials:29 - Trial = 15905/30000 | Total reward = 54.78
2022-01-26 14:17:42.813 | DEBUG    | __main__:trials:24 - Trial = 15906/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.814 | DEBUG    | __main__:trials:29 - Trial = 15906/30000 | Total reward = 42.12
2022-01-26 14:17:42.818 | DEBUG    | __main__:trials:24 - Trial = 15907/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.818 | DEBUG    | __main__:trials:29 - Trial = 15907/30000 | Total reward = 43.68
2022-01-26 14:17:42.822 | DEBUG    | __main__:trials:24 - Trial = 15908/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.822 | DEBUG    | __main__:trials:29 - Trial = 15908/30000 | Total reward = 49.84
2022-01-26 14:17:42.826 | DEBUG    | __main__:trials:24 - Trial = 15909/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.828 | DEBUG    | __main__:trials:29 - Trial = 15909/30000 | Total reward = 43.72
2022-01-26 14:17:42.830 | DEBUG    | __main__:trials:24 - Trial = 15910/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.832 | DEBUG    | __main__:trials:29 - Trial = 15910/30000 | Total reward = 50.16
2022-01-26 14:17:42.835 | DEBUG    | __main__:trials:24 - Trial = 15911/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.837 | DEBUG    | __main__:trials:29 - Trial = 15911/30000 | Total reward = 44.92
2022-01-26 14:17:42.840 | DEBUG    | __main__:trials:24 - Trial = 15912/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.841 | DEBUG    | __main__:trials:29 - Trial = 15912/30000 | Total reward = 41.27
2022-01-26 14:17:42.845 | DEBUG    | __main__:trials:24 - Trial = 15913/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.845 | DEBUG    | __main__:trials:29 - Trial = 15913/30000 | Total reward = 42.05
2022-01-26 14:17:42.849 | DEBUG    | __main__:trials:24 - Trial = 15914/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.850 | DEBUG    | __main__:trials:29 - Trial = 15914/30000 | Total reward = 44.75
2022-01-26 14:17:42.853 | DEBUG    | __main__:trials:24 - Trial = 15915/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.854 | DEBUG    | __main__:trials:29 - Trial = 15915/30000 | Total reward = 50.70
2022-01-26 14:17:42.857 | DEBUG    | __main__:trials:24 - Trial = 15916/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.859 | DEBUG    | __main__:trials:29 - Trial = 15916/30000 | Total reward = 51.90
2022-01-26 14:17:42.861 | DEBUG    | __main__:trials:26 - Trial = 15917/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:42.863 | DEBUG    | __main__:trials:29 - Trial = 15917/30000 | Total reward = 25.36
2022-01-26 14:17:42.867 | DEBUG    | __main__:trials:24 - Trial = 15918/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.869 | DEBUG    | __main__:trials:29 - Trial = 15918/30000 | Total reward = 52.37
2022-01-26 14:17:42.872 | DEBUG    | __main__:trials:24 - Trial = 15919/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.872 | DEBUG    | __main__:trials:29 - Trial = 15919/30000 | Total reward = 40.70
2022-01-26 14:17:42.876 | DEBUG    | __main__:trials:24 - Trial = 15920/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.876 | DEBUG    | __main__:trials:29 - Trial = 15920/30000 | Total reward = 50.15
2022-01-26 14:17:42.880 | DEBUG    | __main__:trials:24 - Trial = 15921/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.881 | DEBUG    | __main__:trials:29 - Trial = 15921/30000 | Total reward = 48.30
2022-01-26 14:17:42.885 | DEBUG    | __main__:trials:24 - Trial = 15922/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.886 | DEBUG    | __main__:trials:29 - Trial = 15922/30000 | Total reward = 37.56
2022-01-26 14:17:42.890 | DEBUG    | __main__:trials:24 - Trial = 15923/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.892 | DEBUG    | __main__:trials:29 - Trial = 15923/30000 | Total reward = 53.36
2022-01-26 14:17:42.895 | DEBUG    | __main__:trials:24 - Trial = 15924/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.897 | DEBUG    | __main__:trials:29 - Trial = 15924/30000 | Total reward = 52.96
2022-01-26 14:17:42.900 | DEBUG    | __main__:trials:24 - Trial = 15925/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.902 | DEBUG    | __main__:trials:29 - Trial = 15925/30000 | Total reward = 39.28
2022-01-26 14:17:42.906 | DEBUG    | __main__:trials:24 - Trial = 15926/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.906 | DEBUG    | __main__:trials:29 - Trial = 15926/30000 | Total reward = 47.80
2022-01-26 14:17:42.911 | DEBUG    | __main__:trials:24 - Trial = 15927/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.913 | DEBUG    | __main__:trials:29 - Trial = 15927/30000 | Total reward = 44.93
2022-01-26 14:17:42.915 | DEBUG    | __main__:trials:24 - Trial = 15928/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.917 | DEBUG    | __main__:trials:29 - Trial = 15928/30000 | Total reward = 42.86
2022-01-26 14:17:42.920 | DEBUG    | __main__:trials:24 - Trial = 15929/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.922 | DEBUG    | __main__:trials:29 - Trial = 15929/30000 | Total reward = 42.08
2022-01-26 14:17:42.925 | DEBUG    | __main__:trials:24 - Trial = 15930/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.926 | DEBUG    | __main__:trials:29 - Trial = 15930/30000 | Total reward = 39.88
2022-01-26 14:17:42.929 | DEBUG    | __main__:trials:24 - Trial = 15931/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.931 | DEBUG    | __main__:trials:29 - Trial = 15931/30000 | Total reward = 61.39
2022-01-26 14:17:42.935 | DEBUG    | __main__:trials:24 - Trial = 15932/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.938 | DEBUG    | __main__:trials:29 - Trial = 15932/30000 | Total reward = 53.53
2022-01-26 14:17:42.942 | DEBUG    | __main__:trials:24 - Trial = 15933/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.943 | DEBUG    | __main__:trials:29 - Trial = 15933/30000 | Total reward = 43.66
2022-01-26 14:17:42.947 | DEBUG    | __main__:trials:24 - Trial = 15934/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.948 | DEBUG    | __main__:trials:29 - Trial = 15934/30000 | Total reward = 39.21
2022-01-26 14:17:42.952 | DEBUG    | __main__:trials:24 - Trial = 15935/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.954 | DEBUG    | __main__:trials:29 - Trial = 15935/30000 | Total reward = 44.96
2022-01-26 14:17:42.956 | DEBUG    | __main__:trials:24 - Trial = 15936/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.958 | DEBUG    | __main__:trials:29 - Trial = 15936/30000 | Total reward = 45.65
2022-01-26 14:17:42.961 | DEBUG    | __main__:trials:24 - Trial = 15937/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.962 | DEBUG    | __main__:trials:29 - Trial = 15937/30000 | Total reward = 43.64
2022-01-26 14:17:42.965 | DEBUG    | __main__:trials:24 - Trial = 15938/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.966 | DEBUG    | __main__:trials:29 - Trial = 15938/30000 | Total reward = 44.93
2022-01-26 14:17:42.969 | DEBUG    | __main__:trials:24 - Trial = 15939/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.970 | DEBUG    | __main__:trials:29 - Trial = 15939/30000 | Total reward = 52.59
2022-01-26 14:17:42.974 | DEBUG    | __main__:trials:24 - Trial = 15940/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.975 | DEBUG    | __main__:trials:29 - Trial = 15940/30000 | Total reward = 51.66
2022-01-26 14:17:42.978 | DEBUG    | __main__:trials:24 - Trial = 15941/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.980 | DEBUG    | __main__:trials:29 - Trial = 15941/30000 | Total reward = 52.07
2022-01-26 14:17:42.984 | DEBUG    | __main__:trials:24 - Trial = 15942/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.985 | DEBUG    | __main__:trials:29 - Trial = 15942/30000 | Total reward = 43.31
2022-01-26 14:17:42.989 | DEBUG    | __main__:trials:24 - Trial = 15943/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.990 | DEBUG    | __main__:trials:29 - Trial = 15943/30000 | Total reward = 50.65
2022-01-26 14:17:42.993 | DEBUG    | __main__:trials:24 - Trial = 15944/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.994 | DEBUG    | __main__:trials:29 - Trial = 15944/30000 | Total reward = 53.83
2022-01-26 14:17:42.999 | DEBUG    | __main__:trials:24 - Trial = 15945/30000 | Max number of steps (20) reached
2022-01-26 14:17:42.999 | DEBUG    | __main__:trials:29 - Trial = 15945/30000 | Total reward = 53.44
2022-01-26 14:17:43.004 | DEBUG    | __main__:trials:24 - Trial = 15946/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.005 | DEBUG    | __main__:trials:29 - Trial = 15946/30000 | Total reward = 41.11
2022-01-26 14:17:43.009 | DEBUG    | __main__:trials:24 - Trial = 15947/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.010 | DEBUG    | __main__:trials:29 - Trial = 15947/30000 | Total reward = 47.04
2022-01-26 14:17:43.013 | DEBUG    | __main__:trials:26 - Trial = 15948/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:43.015 | DEBUG    | __main__:trials:29 - Trial = 15948/30000 | Total reward = 24.59
2022-01-26 14:17:43.018 | DEBUG    | __main__:trials:24 - Trial = 15949/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.020 | DEBUG    | __main__:trials:29 - Trial = 15949/30000 | Total reward = 42.48
2022-01-26 14:17:43.023 | DEBUG    | __main__:trials:24 - Trial = 15950/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.025 | DEBUG    | __main__:trials:29 - Trial = 15950/30000 | Total reward = 37.05
2022-01-26 14:17:43.029 | DEBUG    | __main__:trials:24 - Trial = 15951/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.030 | DEBUG    | __main__:trials:29 - Trial = 15951/30000 | Total reward = 37.32
2022-01-26 14:17:43.034 | DEBUG    | __main__:trials:24 - Trial = 15952/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.035 | DEBUG    | __main__:trials:29 - Trial = 15952/30000 | Total reward = 32.58
2022-01-26 14:17:43.039 | DEBUG    | __main__:trials:24 - Trial = 15953/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.040 | DEBUG    | __main__:trials:29 - Trial = 15953/30000 | Total reward = 50.42
2022-01-26 14:17:43.043 | DEBUG    | __main__:trials:26 - Trial = 15954/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:43.045 | DEBUG    | __main__:trials:29 - Trial = 15954/30000 | Total reward = 40.91
2022-01-26 14:17:43.048 | DEBUG    | __main__:trials:24 - Trial = 15955/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.050 | DEBUG    | __main__:trials:29 - Trial = 15955/30000 | Total reward = 65.01
2022-01-26 14:17:43.054 | DEBUG    | __main__:trials:24 - Trial = 15956/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.055 | DEBUG    | __main__:trials:29 - Trial = 15956/30000 | Total reward = 46.41
2022-01-26 14:17:43.059 | DEBUG    | __main__:trials:24 - Trial = 15957/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.060 | DEBUG    | __main__:trials:29 - Trial = 15957/30000 | Total reward = 41.94
2022-01-26 14:17:43.064 | DEBUG    | __main__:trials:24 - Trial = 15958/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.066 | DEBUG    | __main__:trials:29 - Trial = 15958/30000 | Total reward = 36.48
2022-01-26 14:17:43.069 | DEBUG    | __main__:trials:24 - Trial = 15959/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.071 | DEBUG    | __main__:trials:29 - Trial = 15959/30000 | Total reward = 41.66
2022-01-26 14:17:43.076 | DEBUG    | __main__:trials:24 - Trial = 15960/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.077 | DEBUG    | __main__:trials:29 - Trial = 15960/30000 | Total reward = 33.78
2022-01-26 14:17:43.081 | DEBUG    | __main__:trials:24 - Trial = 15961/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.083 | DEBUG    | __main__:trials:29 - Trial = 15961/30000 | Total reward = 37.49
2022-01-26 14:17:43.087 | DEBUG    | __main__:trials:24 - Trial = 15962/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.089 | DEBUG    | __main__:trials:29 - Trial = 15962/30000 | Total reward = 34.77
2022-01-26 14:17:43.093 | DEBUG    | __main__:trials:24 - Trial = 15963/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.094 | DEBUG    | __main__:trials:29 - Trial = 15963/30000 | Total reward = 55.26
2022-01-26 14:17:43.097 | DEBUG    | __main__:trials:24 - Trial = 15964/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.099 | DEBUG    | __main__:trials:29 - Trial = 15964/30000 | Total reward = 35.93
2022-01-26 14:17:43.102 | DEBUG    | __main__:trials:24 - Trial = 15965/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.104 | DEBUG    | __main__:trials:29 - Trial = 15965/30000 | Total reward = 52.30
2022-01-26 14:17:43.108 | DEBUG    | __main__:trials:24 - Trial = 15966/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.109 | DEBUG    | __main__:trials:29 - Trial = 15966/30000 | Total reward = 44.04
2022-01-26 14:17:43.112 | DEBUG    | __main__:trials:24 - Trial = 15967/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.114 | DEBUG    | __main__:trials:29 - Trial = 15967/30000 | Total reward = 40.16
2022-01-26 14:17:43.118 | DEBUG    | __main__:trials:24 - Trial = 15968/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.119 | DEBUG    | __main__:trials:29 - Trial = 15968/30000 | Total reward = 40.81
2022-01-26 14:17:43.123 | DEBUG    | __main__:trials:24 - Trial = 15969/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.124 | DEBUG    | __main__:trials:29 - Trial = 15969/30000 | Total reward = 41.34
2022-01-26 14:17:43.128 | DEBUG    | __main__:trials:24 - Trial = 15970/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.130 | DEBUG    | __main__:trials:29 - Trial = 15970/30000 | Total reward = 34.87
2022-01-26 14:17:43.133 | DEBUG    | __main__:trials:24 - Trial = 15971/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.135 | DEBUG    | __main__:trials:29 - Trial = 15971/30000 | Total reward = 44.40
2022-01-26 14:17:43.139 | DEBUG    | __main__:trials:24 - Trial = 15972/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.140 | DEBUG    | __main__:trials:29 - Trial = 15972/30000 | Total reward = 63.90
2022-01-26 14:17:43.144 | DEBUG    | __main__:trials:24 - Trial = 15973/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.144 | DEBUG    | __main__:trials:29 - Trial = 15973/30000 | Total reward = 50.77
2022-01-26 14:17:43.148 | DEBUG    | __main__:trials:24 - Trial = 15974/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.149 | DEBUG    | __main__:trials:29 - Trial = 15974/30000 | Total reward = 57.23
2022-01-26 14:17:43.152 | DEBUG    | __main__:trials:24 - Trial = 15975/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.153 | DEBUG    | __main__:trials:29 - Trial = 15975/30000 | Total reward = 38.19
2022-01-26 14:17:43.156 | DEBUG    | __main__:trials:24 - Trial = 15976/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.157 | DEBUG    | __main__:trials:29 - Trial = 15976/30000 | Total reward = 41.19
2022-01-26 14:17:43.160 | DEBUG    | __main__:trials:24 - Trial = 15977/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.161 | DEBUG    | __main__:trials:29 - Trial = 15977/30000 | Total reward = 34.85
2022-01-26 14:17:43.165 | DEBUG    | __main__:trials:24 - Trial = 15978/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.166 | DEBUG    | __main__:trials:29 - Trial = 15978/30000 | Total reward = 58.70
2022-01-26 14:17:43.170 | DEBUG    | __main__:trials:24 - Trial = 15979/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.171 | DEBUG    | __main__:trials:29 - Trial = 15979/30000 | Total reward = 51.94
2022-01-26 14:17:43.175 | DEBUG    | __main__:trials:24 - Trial = 15980/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.177 | DEBUG    | __main__:trials:29 - Trial = 15980/30000 | Total reward = 51.47
2022-01-26 14:17:43.180 | DEBUG    | __main__:trials:24 - Trial = 15981/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.182 | DEBUG    | __main__:trials:29 - Trial = 15981/30000 | Total reward = 37.46
2022-01-26 14:17:43.185 | DEBUG    | __main__:trials:24 - Trial = 15982/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.187 | DEBUG    | __main__:trials:29 - Trial = 15982/30000 | Total reward = 57.64
2022-01-26 14:17:43.191 | DEBUG    | __main__:trials:24 - Trial = 15983/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.192 | DEBUG    | __main__:trials:29 - Trial = 15983/30000 | Total reward = 45.87
2022-01-26 14:17:43.197 | DEBUG    | __main__:trials:24 - Trial = 15984/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.198 | DEBUG    | __main__:trials:29 - Trial = 15984/30000 | Total reward = 55.50
2022-01-26 14:17:43.202 | DEBUG    | __main__:trials:24 - Trial = 15985/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.203 | DEBUG    | __main__:trials:29 - Trial = 15985/30000 | Total reward = 41.23
2022-01-26 14:17:43.207 | DEBUG    | __main__:trials:24 - Trial = 15986/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.209 | DEBUG    | __main__:trials:29 - Trial = 15986/30000 | Total reward = 41.92
2022-01-26 14:17:43.212 | DEBUG    | __main__:trials:24 - Trial = 15987/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.213 | DEBUG    | __main__:trials:29 - Trial = 15987/30000 | Total reward = 48.17
2022-01-26 14:17:43.216 | DEBUG    | __main__:trials:24 - Trial = 15988/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.218 | DEBUG    | __main__:trials:29 - Trial = 15988/30000 | Total reward = 50.94
2022-01-26 14:17:43.221 | DEBUG    | __main__:trials:24 - Trial = 15989/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.221 | DEBUG    | __main__:trials:29 - Trial = 15989/30000 | Total reward = 45.01
2022-01-26 14:17:43.225 | DEBUG    | __main__:trials:24 - Trial = 15990/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.227 | DEBUG    | __main__:trials:29 - Trial = 15990/30000 | Total reward = 47.20
2022-01-26 14:17:43.231 | DEBUG    | __main__:trials:24 - Trial = 15991/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.232 | DEBUG    | __main__:trials:29 - Trial = 15991/30000 | Total reward = 51.18
2022-01-26 14:17:43.235 | DEBUG    | __main__:trials:24 - Trial = 15992/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.237 | DEBUG    | __main__:trials:29 - Trial = 15992/30000 | Total reward = 47.98
2022-01-26 14:17:43.240 | DEBUG    | __main__:trials:24 - Trial = 15993/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.241 | DEBUG    | __main__:trials:29 - Trial = 15993/30000 | Total reward = 49.04
2022-01-26 14:17:43.245 | DEBUG    | __main__:trials:24 - Trial = 15994/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.247 | DEBUG    | __main__:trials:29 - Trial = 15994/30000 | Total reward = 51.21
2022-01-26 14:17:43.250 | DEBUG    | __main__:trials:24 - Trial = 15995/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.252 | DEBUG    | __main__:trials:29 - Trial = 15995/30000 | Total reward = 48.59
2022-01-26 14:17:43.256 | DEBUG    | __main__:trials:24 - Trial = 15996/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.257 | DEBUG    | __main__:trials:29 - Trial = 15996/30000 | Total reward = 49.97
2022-01-26 14:17:43.261 | DEBUG    | __main__:trials:24 - Trial = 15997/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.261 | DEBUG    | __main__:trials:29 - Trial = 15997/30000 | Total reward = 53.40
2022-01-26 14:17:43.266 | DEBUG    | __main__:trials:24 - Trial = 15998/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.267 | DEBUG    | __main__:trials:29 - Trial = 15998/30000 | Total reward = 52.65
2022-01-26 14:17:43.270 | DEBUG    | __main__:trials:24 - Trial = 15999/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.272 | DEBUG    | __main__:trials:29 - Trial = 15999/30000 | Total reward = 51.14
2022-01-26 14:17:43.275 | DEBUG    | __main__:trials:24 - Trial = 16000/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.276 | DEBUG    | __main__:trials:29 - Trial = 16000/30000 | Total reward = 39.29
2022-01-26 14:17:43.280 | DEBUG    | __main__:trials:24 - Trial = 16001/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.281 | DEBUG    | __main__:trials:29 - Trial = 16001/30000 | Total reward = 61.86
2022-01-26 14:17:43.285 | DEBUG    | __main__:trials:24 - Trial = 16002/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.286 | DEBUG    | __main__:trials:29 - Trial = 16002/30000 | Total reward = 59.40
2022-01-26 14:17:43.290 | DEBUG    | __main__:trials:24 - Trial = 16003/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.291 | DEBUG    | __main__:trials:29 - Trial = 16003/30000 | Total reward = 53.06
2022-01-26 14:17:43.295 | DEBUG    | __main__:trials:24 - Trial = 16004/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.297 | DEBUG    | __main__:trials:29 - Trial = 16004/30000 | Total reward = 51.32
2022-01-26 14:17:43.300 | DEBUG    | __main__:trials:24 - Trial = 16005/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.301 | DEBUG    | __main__:trials:29 - Trial = 16005/30000 | Total reward = 50.61
2022-01-26 14:17:43.304 | DEBUG    | __main__:trials:24 - Trial = 16006/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.306 | DEBUG    | __main__:trials:29 - Trial = 16006/30000 | Total reward = 37.92
2022-01-26 14:17:43.309 | DEBUG    | __main__:trials:24 - Trial = 16007/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.309 | DEBUG    | __main__:trials:29 - Trial = 16007/30000 | Total reward = 45.44
2022-01-26 14:17:43.313 | DEBUG    | __main__:trials:24 - Trial = 16008/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.314 | DEBUG    | __main__:trials:29 - Trial = 16008/30000 | Total reward = 44.73
2022-01-26 14:17:43.318 | DEBUG    | __main__:trials:24 - Trial = 16009/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.318 | DEBUG    | __main__:trials:29 - Trial = 16009/30000 | Total reward = 51.32
2022-01-26 14:17:43.323 | DEBUG    | __main__:trials:24 - Trial = 16010/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.324 | DEBUG    | __main__:trials:29 - Trial = 16010/30000 | Total reward = 50.29
2022-01-26 14:17:43.328 | DEBUG    | __main__:trials:24 - Trial = 16011/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.329 | DEBUG    | __main__:trials:29 - Trial = 16011/30000 | Total reward = 63.65
2022-01-26 14:17:43.333 | DEBUG    | __main__:trials:24 - Trial = 16012/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.334 | DEBUG    | __main__:trials:29 - Trial = 16012/30000 | Total reward = 53.14
2022-01-26 14:17:43.338 | DEBUG    | __main__:trials:24 - Trial = 16013/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.339 | DEBUG    | __main__:trials:29 - Trial = 16013/30000 | Total reward = 34.07
2022-01-26 14:17:43.343 | DEBUG    | __main__:trials:24 - Trial = 16014/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.344 | DEBUG    | __main__:trials:29 - Trial = 16014/30000 | Total reward = 43.98
2022-01-26 14:17:43.348 | DEBUG    | __main__:trials:24 - Trial = 16015/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.349 | DEBUG    | __main__:trials:29 - Trial = 16015/30000 | Total reward = 62.22
2022-01-26 14:17:43.352 | DEBUG    | __main__:trials:24 - Trial = 16016/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.354 | DEBUG    | __main__:trials:29 - Trial = 16016/30000 | Total reward = 47.85
2022-01-26 14:17:43.358 | DEBUG    | __main__:trials:24 - Trial = 16017/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.359 | DEBUG    | __main__:trials:29 - Trial = 16017/30000 | Total reward = 44.35
2022-01-26 14:17:43.363 | DEBUG    | __main__:trials:24 - Trial = 16018/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.364 | DEBUG    | __main__:trials:29 - Trial = 16018/30000 | Total reward = 45.94
2022-01-26 14:17:43.368 | DEBUG    | __main__:trials:24 - Trial = 16019/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.370 | DEBUG    | __main__:trials:29 - Trial = 16019/30000 | Total reward = 35.95
2022-01-26 14:17:43.374 | DEBUG    | __main__:trials:24 - Trial = 16020/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.374 | DEBUG    | __main__:trials:29 - Trial = 16020/30000 | Total reward = 39.10
2022-01-26 14:17:43.379 | DEBUG    | __main__:trials:24 - Trial = 16021/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.380 | DEBUG    | __main__:trials:29 - Trial = 16021/30000 | Total reward = 38.57
2022-01-26 14:17:43.384 | DEBUG    | __main__:trials:24 - Trial = 16022/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.386 | DEBUG    | __main__:trials:29 - Trial = 16022/30000 | Total reward = 49.67
2022-01-26 14:17:43.389 | DEBUG    | __main__:trials:24 - Trial = 16023/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.391 | DEBUG    | __main__:trials:29 - Trial = 16023/30000 | Total reward = 47.79
2022-01-26 14:17:43.394 | DEBUG    | __main__:trials:24 - Trial = 16024/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.396 | DEBUG    | __main__:trials:29 - Trial = 16024/30000 | Total reward = 53.69
2022-01-26 14:17:43.399 | DEBUG    | __main__:trials:24 - Trial = 16025/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.400 | DEBUG    | __main__:trials:29 - Trial = 16025/30000 | Total reward = 51.58
2022-01-26 14:17:43.404 | DEBUG    | __main__:trials:24 - Trial = 16026/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.405 | DEBUG    | __main__:trials:29 - Trial = 16026/30000 | Total reward = 53.42
2022-01-26 14:17:43.408 | DEBUG    | __main__:trials:24 - Trial = 16027/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.409 | DEBUG    | __main__:trials:29 - Trial = 16027/30000 | Total reward = 41.53
2022-01-26 14:17:43.412 | DEBUG    | __main__:trials:24 - Trial = 16028/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.414 | DEBUG    | __main__:trials:29 - Trial = 16028/30000 | Total reward = 35.95
2022-01-26 14:17:43.417 | DEBUG    | __main__:trials:24 - Trial = 16029/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.419 | DEBUG    | __main__:trials:29 - Trial = 16029/30000 | Total reward = 52.75
2022-01-26 14:17:43.422 | DEBUG    | __main__:trials:24 - Trial = 16030/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.423 | DEBUG    | __main__:trials:29 - Trial = 16030/30000 | Total reward = 47.82
2022-01-26 14:17:43.427 | DEBUG    | __main__:trials:24 - Trial = 16031/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.428 | DEBUG    | __main__:trials:29 - Trial = 16031/30000 | Total reward = 46.88
2022-01-26 14:17:43.432 | DEBUG    | __main__:trials:24 - Trial = 16032/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.434 | DEBUG    | __main__:trials:29 - Trial = 16032/30000 | Total reward = 47.55
2022-01-26 14:17:43.437 | DEBUG    | __main__:trials:24 - Trial = 16033/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.439 | DEBUG    | __main__:trials:29 - Trial = 16033/30000 | Total reward = 47.54
2022-01-26 14:17:43.443 | DEBUG    | __main__:trials:24 - Trial = 16034/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.443 | DEBUG    | __main__:trials:29 - Trial = 16034/30000 | Total reward = 50.22
2022-01-26 14:17:43.448 | DEBUG    | __main__:trials:24 - Trial = 16035/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.449 | DEBUG    | __main__:trials:29 - Trial = 16035/30000 | Total reward = 58.73
2022-01-26 14:17:43.453 | DEBUG    | __main__:trials:24 - Trial = 16036/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.454 | DEBUG    | __main__:trials:29 - Trial = 16036/30000 | Total reward = 51.06
2022-01-26 14:17:43.458 | DEBUG    | __main__:trials:24 - Trial = 16037/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.458 | DEBUG    | __main__:trials:29 - Trial = 16037/30000 | Total reward = 50.80
2022-01-26 14:17:43.462 | DEBUG    | __main__:trials:24 - Trial = 16038/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.463 | DEBUG    | __main__:trials:29 - Trial = 16038/30000 | Total reward = 53.79
2022-01-26 14:17:43.468 | DEBUG    | __main__:trials:24 - Trial = 16039/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.468 | DEBUG    | __main__:trials:29 - Trial = 16039/30000 | Total reward = 41.04
2022-01-26 14:17:43.472 | DEBUG    | __main__:trials:24 - Trial = 16040/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.474 | DEBUG    | __main__:trials:29 - Trial = 16040/30000 | Total reward = 42.89
2022-01-26 14:17:43.477 | DEBUG    | __main__:trials:24 - Trial = 16041/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.478 | DEBUG    | __main__:trials:29 - Trial = 16041/30000 | Total reward = 55.78
2022-01-26 14:17:43.482 | DEBUG    | __main__:trials:24 - Trial = 16042/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.484 | DEBUG    | __main__:trials:29 - Trial = 16042/30000 | Total reward = 25.93
2022-01-26 14:17:43.487 | DEBUG    | __main__:trials:24 - Trial = 16043/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.489 | DEBUG    | __main__:trials:29 - Trial = 16043/30000 | Total reward = 45.72
2022-01-26 14:17:43.492 | DEBUG    | __main__:trials:24 - Trial = 16044/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.493 | DEBUG    | __main__:trials:29 - Trial = 16044/30000 | Total reward = 51.69
2022-01-26 14:17:43.497 | DEBUG    | __main__:trials:24 - Trial = 16045/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.498 | DEBUG    | __main__:trials:29 - Trial = 16045/30000 | Total reward = 56.66
2022-01-26 14:17:43.502 | DEBUG    | __main__:trials:24 - Trial = 16046/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.503 | DEBUG    | __main__:trials:29 - Trial = 16046/30000 | Total reward = 45.83
2022-01-26 14:17:43.507 | DEBUG    | __main__:trials:24 - Trial = 16047/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.509 | DEBUG    | __main__:trials:29 - Trial = 16047/30000 | Total reward = 42.85
2022-01-26 14:17:43.512 | DEBUG    | __main__:trials:24 - Trial = 16048/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.514 | DEBUG    | __main__:trials:29 - Trial = 16048/30000 | Total reward = 34.57
2022-01-26 14:17:43.517 | DEBUG    | __main__:trials:24 - Trial = 16049/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.518 | DEBUG    | __main__:trials:29 - Trial = 16049/30000 | Total reward = 52.72
2022-01-26 14:17:43.521 | DEBUG    | __main__:trials:24 - Trial = 16050/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.522 | DEBUG    | __main__:trials:29 - Trial = 16050/30000 | Total reward = 52.66
2022-01-26 14:17:43.525 | DEBUG    | __main__:trials:24 - Trial = 16051/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.527 | DEBUG    | __main__:trials:29 - Trial = 16051/30000 | Total reward = 54.69
2022-01-26 14:17:43.530 | DEBUG    | __main__:trials:24 - Trial = 16052/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.532 | DEBUG    | __main__:trials:29 - Trial = 16052/30000 | Total reward = 41.51
2022-01-26 14:17:43.536 | DEBUG    | __main__:trials:24 - Trial = 16053/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.537 | DEBUG    | __main__:trials:29 - Trial = 16053/30000 | Total reward = 47.26
2022-01-26 14:17:43.540 | DEBUG    | __main__:trials:24 - Trial = 16054/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.542 | DEBUG    | __main__:trials:29 - Trial = 16054/30000 | Total reward = 36.77
2022-01-26 14:17:43.544 | DEBUG    | __main__:trials:24 - Trial = 16055/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.546 | DEBUG    | __main__:trials:29 - Trial = 16055/30000 | Total reward = 39.61
2022-01-26 14:17:43.550 | DEBUG    | __main__:trials:24 - Trial = 16056/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.551 | DEBUG    | __main__:trials:29 - Trial = 16056/30000 | Total reward = 37.60
2022-01-26 14:17:43.555 | DEBUG    | __main__:trials:24 - Trial = 16057/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.556 | DEBUG    | __main__:trials:29 - Trial = 16057/30000 | Total reward = 44.48
2022-01-26 14:17:43.560 | DEBUG    | __main__:trials:24 - Trial = 16058/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.562 | DEBUG    | __main__:trials:29 - Trial = 16058/30000 | Total reward = 52.66
2022-01-26 14:17:43.565 | DEBUG    | __main__:trials:24 - Trial = 16059/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.566 | DEBUG    | __main__:trials:29 - Trial = 16059/30000 | Total reward = 42.27
2022-01-26 14:17:43.570 | DEBUG    | __main__:trials:24 - Trial = 16060/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.571 | DEBUG    | __main__:trials:29 - Trial = 16060/30000 | Total reward = 51.32
2022-01-26 14:17:43.576 | DEBUG    | __main__:trials:24 - Trial = 16061/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.576 | DEBUG    | __main__:trials:29 - Trial = 16061/30000 | Total reward = 51.79
2022-01-26 14:17:43.581 | DEBUG    | __main__:trials:24 - Trial = 16062/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.583 | DEBUG    | __main__:trials:29 - Trial = 16062/30000 | Total reward = 41.71
2022-01-26 14:17:43.587 | DEBUG    | __main__:trials:24 - Trial = 16063/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.588 | DEBUG    | __main__:trials:29 - Trial = 16063/30000 | Total reward = 36.49
2022-01-26 14:17:43.592 | DEBUG    | __main__:trials:24 - Trial = 16064/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.593 | DEBUG    | __main__:trials:29 - Trial = 16064/30000 | Total reward = 57.40
2022-01-26 14:17:43.596 | DEBUG    | __main__:trials:24 - Trial = 16065/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.597 | DEBUG    | __main__:trials:29 - Trial = 16065/30000 | Total reward = 58.68
2022-01-26 14:17:43.601 | DEBUG    | __main__:trials:24 - Trial = 16066/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.601 | DEBUG    | __main__:trials:29 - Trial = 16066/30000 | Total reward = 54.55
2022-01-26 14:17:43.605 | DEBUG    | __main__:trials:24 - Trial = 16067/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.606 | DEBUG    | __main__:trials:29 - Trial = 16067/30000 | Total reward = 51.73
2022-01-26 14:17:43.609 | DEBUG    | __main__:trials:24 - Trial = 16068/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.610 | DEBUG    | __main__:trials:29 - Trial = 16068/30000 | Total reward = 52.02
2022-01-26 14:17:43.613 | DEBUG    | __main__:trials:24 - Trial = 16069/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.614 | DEBUG    | __main__:trials:29 - Trial = 16069/30000 | Total reward = 65.48
2022-01-26 14:17:43.617 | DEBUG    | __main__:trials:24 - Trial = 16070/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.618 | DEBUG    | __main__:trials:29 - Trial = 16070/30000 | Total reward = 47.86
2022-01-26 14:17:43.621 | DEBUG    | __main__:trials:24 - Trial = 16071/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.622 | DEBUG    | __main__:trials:29 - Trial = 16071/30000 | Total reward = 40.38
2022-01-26 14:17:43.625 | DEBUG    | __main__:trials:24 - Trial = 16072/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.627 | DEBUG    | __main__:trials:29 - Trial = 16072/30000 | Total reward = 49.67
2022-01-26 14:17:43.630 | DEBUG    | __main__:trials:24 - Trial = 16073/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.630 | DEBUG    | __main__:trials:29 - Trial = 16073/30000 | Total reward = 51.32
2022-01-26 14:17:43.634 | DEBUG    | __main__:trials:24 - Trial = 16074/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.636 | DEBUG    | __main__:trials:29 - Trial = 16074/30000 | Total reward = 47.77
2022-01-26 14:17:43.640 | DEBUG    | __main__:trials:24 - Trial = 16075/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.641 | DEBUG    | __main__:trials:29 - Trial = 16075/30000 | Total reward = 40.76
2022-01-26 14:17:43.645 | DEBUG    | __main__:trials:24 - Trial = 16076/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.647 | DEBUG    | __main__:trials:29 - Trial = 16076/30000 | Total reward = 57.38
2022-01-26 14:17:43.650 | DEBUG    | __main__:trials:24 - Trial = 16077/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.651 | DEBUG    | __main__:trials:29 - Trial = 16077/30000 | Total reward = 46.68
2022-01-26 14:17:43.656 | DEBUG    | __main__:trials:24 - Trial = 16078/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.657 | DEBUG    | __main__:trials:29 - Trial = 16078/30000 | Total reward = 21.91
2022-01-26 14:17:43.660 | DEBUG    | __main__:trials:24 - Trial = 16079/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.662 | DEBUG    | __main__:trials:29 - Trial = 16079/30000 | Total reward = 53.31
2022-01-26 14:17:43.665 | DEBUG    | __main__:trials:24 - Trial = 16080/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.666 | DEBUG    | __main__:trials:29 - Trial = 16080/30000 | Total reward = 51.32
2022-01-26 14:17:43.669 | DEBUG    | __main__:trials:24 - Trial = 16081/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.671 | DEBUG    | __main__:trials:29 - Trial = 16081/30000 | Total reward = 45.63
2022-01-26 14:17:43.674 | DEBUG    | __main__:trials:24 - Trial = 16082/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.675 | DEBUG    | __main__:trials:29 - Trial = 16082/30000 | Total reward = 47.94
2022-01-26 14:17:43.678 | DEBUG    | __main__:trials:24 - Trial = 16083/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.679 | DEBUG    | __main__:trials:29 - Trial = 16083/30000 | Total reward = 50.97
2022-01-26 14:17:43.683 | DEBUG    | __main__:trials:24 - Trial = 16084/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.684 | DEBUG    | __main__:trials:29 - Trial = 16084/30000 | Total reward = 22.52
2022-01-26 14:17:43.687 | DEBUG    | __main__:trials:24 - Trial = 16085/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.688 | DEBUG    | __main__:trials:29 - Trial = 16085/30000 | Total reward = 52.40
2022-01-26 14:17:43.691 | DEBUG    | __main__:trials:24 - Trial = 16086/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.693 | DEBUG    | __main__:trials:29 - Trial = 16086/30000 | Total reward = 51.73
2022-01-26 14:17:43.696 | DEBUG    | __main__:trials:24 - Trial = 16087/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.698 | DEBUG    | __main__:trials:29 - Trial = 16087/30000 | Total reward = 51.52
2022-01-26 14:17:43.701 | DEBUG    | __main__:trials:24 - Trial = 16088/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.703 | DEBUG    | __main__:trials:29 - Trial = 16088/30000 | Total reward = 43.10
2022-01-26 14:17:43.706 | DEBUG    | __main__:trials:24 - Trial = 16089/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.708 | DEBUG    | __main__:trials:29 - Trial = 16089/30000 | Total reward = 48.00
2022-01-26 14:17:43.712 | DEBUG    | __main__:trials:24 - Trial = 16090/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.713 | DEBUG    | __main__:trials:29 - Trial = 16090/30000 | Total reward = 42.30
2022-01-26 14:17:43.716 | DEBUG    | __main__:trials:24 - Trial = 16091/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.718 | DEBUG    | __main__:trials:29 - Trial = 16091/30000 | Total reward = 45.65
2022-01-26 14:17:43.721 | DEBUG    | __main__:trials:24 - Trial = 16092/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.722 | DEBUG    | __main__:trials:29 - Trial = 16092/30000 | Total reward = 49.42
2022-01-26 14:17:43.726 | DEBUG    | __main__:trials:24 - Trial = 16093/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.728 | DEBUG    | __main__:trials:29 - Trial = 16093/30000 | Total reward = 42.40
2022-01-26 14:17:43.732 | DEBUG    | __main__:trials:24 - Trial = 16094/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.733 | DEBUG    | __main__:trials:29 - Trial = 16094/30000 | Total reward = 51.50
2022-01-26 14:17:43.737 | DEBUG    | __main__:trials:24 - Trial = 16095/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.738 | DEBUG    | __main__:trials:29 - Trial = 16095/30000 | Total reward = 32.03
2022-01-26 14:17:43.742 | DEBUG    | __main__:trials:24 - Trial = 16096/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.743 | DEBUG    | __main__:trials:29 - Trial = 16096/30000 | Total reward = 54.41
2022-01-26 14:17:43.747 | DEBUG    | __main__:trials:24 - Trial = 16097/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.748 | DEBUG    | __main__:trials:29 - Trial = 16097/30000 | Total reward = 55.32
2022-01-26 14:17:43.752 | DEBUG    | __main__:trials:24 - Trial = 16098/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.753 | DEBUG    | __main__:trials:29 - Trial = 16098/30000 | Total reward = 51.32
2022-01-26 14:17:43.756 | DEBUG    | __main__:trials:24 - Trial = 16099/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.758 | DEBUG    | __main__:trials:29 - Trial = 16099/30000 | Total reward = 60.14
2022-01-26 14:17:43.761 | DEBUG    | __main__:trials:24 - Trial = 16100/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.761 | DEBUG    | __main__:trials:29 - Trial = 16100/30000 | Total reward = 49.38
2022-01-26 14:17:43.766 | DEBUG    | __main__:trials:24 - Trial = 16101/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.766 | DEBUG    | __main__:trials:29 - Trial = 16101/30000 | Total reward = 45.34
2022-01-26 14:17:43.771 | DEBUG    | __main__:trials:24 - Trial = 16102/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.772 | DEBUG    | __main__:trials:29 - Trial = 16102/30000 | Total reward = 43.94
2022-01-26 14:17:43.776 | DEBUG    | __main__:trials:24 - Trial = 16103/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.776 | DEBUG    | __main__:trials:29 - Trial = 16103/30000 | Total reward = 34.80
2022-01-26 14:17:43.780 | DEBUG    | __main__:trials:24 - Trial = 16104/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.781 | DEBUG    | __main__:trials:29 - Trial = 16104/30000 | Total reward = 48.41
2022-01-26 14:17:43.784 | DEBUG    | __main__:trials:24 - Trial = 16105/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.786 | DEBUG    | __main__:trials:29 - Trial = 16105/30000 | Total reward = 51.86
2022-01-26 14:17:43.789 | DEBUG    | __main__:trials:24 - Trial = 16106/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.790 | DEBUG    | __main__:trials:29 - Trial = 16106/30000 | Total reward = 42.20
2022-01-26 14:17:43.794 | DEBUG    | __main__:trials:24 - Trial = 16107/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.795 | DEBUG    | __main__:trials:29 - Trial = 16107/30000 | Total reward = 54.03
2022-01-26 14:17:43.799 | DEBUG    | __main__:trials:24 - Trial = 16108/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.801 | DEBUG    | __main__:trials:29 - Trial = 16108/30000 | Total reward = 54.89
2022-01-26 14:17:43.804 | DEBUG    | __main__:trials:24 - Trial = 16109/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.806 | DEBUG    | __main__:trials:29 - Trial = 16109/30000 | Total reward = 57.77
2022-01-26 14:17:43.809 | DEBUG    | __main__:trials:24 - Trial = 16110/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.810 | DEBUG    | __main__:trials:29 - Trial = 16110/30000 | Total reward = 59.48
2022-01-26 14:17:43.814 | DEBUG    | __main__:trials:24 - Trial = 16111/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.816 | DEBUG    | __main__:trials:29 - Trial = 16111/30000 | Total reward = 53.65
2022-01-26 14:17:43.820 | DEBUG    | __main__:trials:24 - Trial = 16112/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.821 | DEBUG    | __main__:trials:29 - Trial = 16112/30000 | Total reward = 50.93
2022-01-26 14:17:43.825 | DEBUG    | __main__:trials:24 - Trial = 16113/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.826 | DEBUG    | __main__:trials:29 - Trial = 16113/30000 | Total reward = 60.99
2022-01-26 14:17:43.830 | DEBUG    | __main__:trials:24 - Trial = 16114/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.831 | DEBUG    | __main__:trials:29 - Trial = 16114/30000 | Total reward = 53.18
2022-01-26 14:17:43.835 | DEBUG    | __main__:trials:24 - Trial = 16115/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.837 | DEBUG    | __main__:trials:29 - Trial = 16115/30000 | Total reward = 58.55
2022-01-26 14:17:43.840 | DEBUG    | __main__:trials:24 - Trial = 16116/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.841 | DEBUG    | __main__:trials:29 - Trial = 16116/30000 | Total reward = 57.04
2022-01-26 14:17:43.845 | DEBUG    | __main__:trials:24 - Trial = 16117/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.847 | DEBUG    | __main__:trials:29 - Trial = 16117/30000 | Total reward = 43.86
2022-01-26 14:17:43.851 | DEBUG    | __main__:trials:24 - Trial = 16118/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.852 | DEBUG    | __main__:trials:29 - Trial = 16118/30000 | Total reward = 35.60
2022-01-26 14:17:43.855 | DEBUG    | __main__:trials:24 - Trial = 16119/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.857 | DEBUG    | __main__:trials:29 - Trial = 16119/30000 | Total reward = 37.42
2022-01-26 14:17:43.860 | DEBUG    | __main__:trials:24 - Trial = 16120/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.862 | DEBUG    | __main__:trials:29 - Trial = 16120/30000 | Total reward = 55.86
2022-01-26 14:17:43.865 | DEBUG    | __main__:trials:24 - Trial = 16121/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.867 | DEBUG    | __main__:trials:29 - Trial = 16121/30000 | Total reward = 40.29
2022-01-26 14:17:43.871 | DEBUG    | __main__:trials:24 - Trial = 16122/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.872 | DEBUG    | __main__:trials:29 - Trial = 16122/30000 | Total reward = 51.32
2022-01-26 14:17:43.876 | DEBUG    | __main__:trials:24 - Trial = 16123/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.877 | DEBUG    | __main__:trials:29 - Trial = 16123/30000 | Total reward = 50.73
2022-01-26 14:17:43.880 | DEBUG    | __main__:trials:24 - Trial = 16124/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.882 | DEBUG    | __main__:trials:29 - Trial = 16124/30000 | Total reward = 45.67
2022-01-26 14:17:43.885 | DEBUG    | __main__:trials:24 - Trial = 16125/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.886 | DEBUG    | __main__:trials:29 - Trial = 16125/30000 | Total reward = 60.07
2022-01-26 14:17:43.891 | DEBUG    | __main__:trials:24 - Trial = 16126/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.892 | DEBUG    | __main__:trials:29 - Trial = 16126/30000 | Total reward = 19.87
2022-01-26 14:17:43.896 | DEBUG    | __main__:trials:24 - Trial = 16127/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.897 | DEBUG    | __main__:trials:29 - Trial = 16127/30000 | Total reward = 34.79
2022-01-26 14:17:43.900 | DEBUG    | __main__:trials:24 - Trial = 16128/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.902 | DEBUG    | __main__:trials:29 - Trial = 16128/30000 | Total reward = 62.28
2022-01-26 14:17:43.906 | DEBUG    | __main__:trials:24 - Trial = 16129/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.907 | DEBUG    | __main__:trials:29 - Trial = 16129/30000 | Total reward = 54.91
2022-01-26 14:17:43.911 | DEBUG    | __main__:trials:24 - Trial = 16130/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.912 | DEBUG    | __main__:trials:29 - Trial = 16130/30000 | Total reward = 56.46
2022-01-26 14:17:43.915 | DEBUG    | __main__:trials:24 - Trial = 16131/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.917 | DEBUG    | __main__:trials:29 - Trial = 16131/30000 | Total reward = 52.13
2022-01-26 14:17:43.920 | DEBUG    | __main__:trials:24 - Trial = 16132/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.921 | DEBUG    | __main__:trials:29 - Trial = 16132/30000 | Total reward = 50.91
2022-01-26 14:17:43.925 | DEBUG    | __main__:trials:24 - Trial = 16133/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.926 | DEBUG    | __main__:trials:29 - Trial = 16133/30000 | Total reward = 47.37
2022-01-26 14:17:43.929 | DEBUG    | __main__:trials:26 - Trial = 16134/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:43.930 | DEBUG    | __main__:trials:29 - Trial = 16134/30000 | Total reward = 24.85
2022-01-26 14:17:43.934 | DEBUG    | __main__:trials:24 - Trial = 16135/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.934 | DEBUG    | __main__:trials:29 - Trial = 16135/30000 | Total reward = 47.54
2022-01-26 14:17:43.938 | DEBUG    | __main__:trials:24 - Trial = 16136/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.940 | DEBUG    | __main__:trials:29 - Trial = 16136/30000 | Total reward = 51.73
2022-01-26 14:17:43.943 | DEBUG    | __main__:trials:24 - Trial = 16137/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.943 | DEBUG    | __main__:trials:29 - Trial = 16137/30000 | Total reward = 51.76
2022-01-26 14:17:43.947 | DEBUG    | __main__:trials:24 - Trial = 16138/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.948 | DEBUG    | __main__:trials:29 - Trial = 16138/30000 | Total reward = 49.85
2022-01-26 14:17:43.952 | DEBUG    | __main__:trials:24 - Trial = 16139/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.954 | DEBUG    | __main__:trials:29 - Trial = 16139/30000 | Total reward = 56.80
2022-01-26 14:17:43.957 | DEBUG    | __main__:trials:24 - Trial = 16140/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.958 | DEBUG    | __main__:trials:29 - Trial = 16140/30000 | Total reward = 47.59
2022-01-26 14:17:43.963 | DEBUG    | __main__:trials:24 - Trial = 16141/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.964 | DEBUG    | __main__:trials:29 - Trial = 16141/30000 | Total reward = 35.43
2022-01-26 14:17:43.967 | DEBUG    | __main__:trials:24 - Trial = 16142/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.969 | DEBUG    | __main__:trials:29 - Trial = 16142/30000 | Total reward = 36.57
2022-01-26 14:17:43.972 | DEBUG    | __main__:trials:24 - Trial = 16143/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.974 | DEBUG    | __main__:trials:29 - Trial = 16143/30000 | Total reward = 52.09
2022-01-26 14:17:43.978 | DEBUG    | __main__:trials:24 - Trial = 16144/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.979 | DEBUG    | __main__:trials:29 - Trial = 16144/30000 | Total reward = 60.62
2022-01-26 14:17:43.983 | DEBUG    | __main__:trials:24 - Trial = 16145/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.985 | DEBUG    | __main__:trials:29 - Trial = 16145/30000 | Total reward = 57.33
2022-01-26 14:17:43.988 | DEBUG    | __main__:trials:24 - Trial = 16146/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.990 | DEBUG    | __main__:trials:29 - Trial = 16146/30000 | Total reward = 57.27
2022-01-26 14:17:43.994 | DEBUG    | __main__:trials:24 - Trial = 16147/30000 | Max number of steps (20) reached
2022-01-26 14:17:43.995 | DEBUG    | __main__:trials:29 - Trial = 16147/30000 | Total reward = 45.91
2022-01-26 14:17:43.999 | DEBUG    | __main__:trials:24 - Trial = 16148/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.000 | DEBUG    | __main__:trials:29 - Trial = 16148/30000 | Total reward = 53.71
2022-01-26 14:17:44.004 | DEBUG    | __main__:trials:24 - Trial = 16149/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.005 | DEBUG    | __main__:trials:29 - Trial = 16149/30000 | Total reward = 42.05
2022-01-26 14:17:44.009 | DEBUG    | __main__:trials:24 - Trial = 16150/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.010 | DEBUG    | __main__:trials:29 - Trial = 16150/30000 | Total reward = 45.10
2022-01-26 14:17:44.014 | DEBUG    | __main__:trials:24 - Trial = 16151/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.015 | DEBUG    | __main__:trials:29 - Trial = 16151/30000 | Total reward = 50.22
2022-01-26 14:17:44.019 | DEBUG    | __main__:trials:24 - Trial = 16152/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.020 | DEBUG    | __main__:trials:29 - Trial = 16152/30000 | Total reward = 46.81
2022-01-26 14:17:44.024 | DEBUG    | __main__:trials:24 - Trial = 16153/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.026 | DEBUG    | __main__:trials:29 - Trial = 16153/30000 | Total reward = 50.48
2022-01-26 14:17:44.029 | DEBUG    | __main__:trials:24 - Trial = 16154/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.030 | DEBUG    | __main__:trials:29 - Trial = 16154/30000 | Total reward = 51.32
2022-01-26 14:17:44.035 | DEBUG    | __main__:trials:24 - Trial = 16155/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.036 | DEBUG    | __main__:trials:29 - Trial = 16155/30000 | Total reward = 59.78
2022-01-26 14:17:44.040 | DEBUG    | __main__:trials:24 - Trial = 16156/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.041 | DEBUG    | __main__:trials:29 - Trial = 16156/30000 | Total reward = 20.57
2022-01-26 14:17:44.044 | DEBUG    | __main__:trials:24 - Trial = 16157/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.046 | DEBUG    | __main__:trials:29 - Trial = 16157/30000 | Total reward = 49.95
2022-01-26 14:17:44.049 | DEBUG    | __main__:trials:24 - Trial = 16158/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.050 | DEBUG    | __main__:trials:29 - Trial = 16158/30000 | Total reward = 51.52
2022-01-26 14:17:44.053 | DEBUG    | __main__:trials:24 - Trial = 16159/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.054 | DEBUG    | __main__:trials:29 - Trial = 16159/30000 | Total reward = 41.98
2022-01-26 14:17:44.058 | DEBUG    | __main__:trials:24 - Trial = 16160/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.059 | DEBUG    | __main__:trials:29 - Trial = 16160/30000 | Total reward = 44.94
2022-01-26 14:17:44.063 | DEBUG    | __main__:trials:24 - Trial = 16161/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.065 | DEBUG    | __main__:trials:29 - Trial = 16161/30000 | Total reward = 48.08
2022-01-26 14:17:44.068 | DEBUG    | __main__:trials:24 - Trial = 16162/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.071 | DEBUG    | __main__:trials:29 - Trial = 16162/30000 | Total reward = 52.34
2022-01-26 14:17:44.074 | DEBUG    | __main__:trials:24 - Trial = 16163/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.075 | DEBUG    | __main__:trials:29 - Trial = 16163/30000 | Total reward = 60.71
2022-01-26 14:17:44.079 | DEBUG    | __main__:trials:24 - Trial = 16164/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.081 | DEBUG    | __main__:trials:29 - Trial = 16164/30000 | Total reward = 52.56
2022-01-26 14:17:44.085 | DEBUG    | __main__:trials:24 - Trial = 16165/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.086 | DEBUG    | __main__:trials:29 - Trial = 16165/30000 | Total reward = 52.49
2022-01-26 14:17:44.089 | DEBUG    | __main__:trials:24 - Trial = 16166/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.091 | DEBUG    | __main__:trials:29 - Trial = 16166/30000 | Total reward = 51.14
2022-01-26 14:17:44.094 | DEBUG    | __main__:trials:24 - Trial = 16167/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.095 | DEBUG    | __main__:trials:29 - Trial = 16167/30000 | Total reward = 52.15
2022-01-26 14:17:44.099 | DEBUG    | __main__:trials:24 - Trial = 16168/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.099 | DEBUG    | __main__:trials:29 - Trial = 16168/30000 | Total reward = 53.18
2022-01-26 14:17:44.103 | DEBUG    | __main__:trials:24 - Trial = 16169/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.104 | DEBUG    | __main__:trials:29 - Trial = 16169/30000 | Total reward = 47.80
2022-01-26 14:17:44.107 | DEBUG    | __main__:trials:24 - Trial = 16170/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.109 | DEBUG    | __main__:trials:29 - Trial = 16170/30000 | Total reward = 48.14
2022-01-26 14:17:44.112 | DEBUG    | __main__:trials:24 - Trial = 16171/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.114 | DEBUG    | __main__:trials:29 - Trial = 16171/30000 | Total reward = 51.32
2022-01-26 14:17:44.118 | DEBUG    | __main__:trials:24 - Trial = 16172/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.118 | DEBUG    | __main__:trials:29 - Trial = 16172/30000 | Total reward = 51.06
2022-01-26 14:17:44.123 | DEBUG    | __main__:trials:24 - Trial = 16173/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.123 | DEBUG    | __main__:trials:29 - Trial = 16173/30000 | Total reward = 56.86
2022-01-26 14:17:44.128 | DEBUG    | __main__:trials:24 - Trial = 16174/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.128 | DEBUG    | __main__:trials:29 - Trial = 16174/30000 | Total reward = 43.94
2022-01-26 14:17:44.132 | DEBUG    | __main__:trials:24 - Trial = 16175/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.134 | DEBUG    | __main__:trials:29 - Trial = 16175/30000 | Total reward = 63.05
2022-01-26 14:17:44.138 | DEBUG    | __main__:trials:24 - Trial = 16176/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.139 | DEBUG    | __main__:trials:29 - Trial = 16176/30000 | Total reward = 49.72
2022-01-26 14:17:44.143 | DEBUG    | __main__:trials:24 - Trial = 16177/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.144 | DEBUG    | __main__:trials:29 - Trial = 16177/30000 | Total reward = 50.44
2022-01-26 14:17:44.148 | DEBUG    | __main__:trials:24 - Trial = 16178/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.150 | DEBUG    | __main__:trials:29 - Trial = 16178/30000 | Total reward = 61.82
2022-01-26 14:17:44.154 | DEBUG    | __main__:trials:24 - Trial = 16179/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.155 | DEBUG    | __main__:trials:29 - Trial = 16179/30000 | Total reward = 51.21
2022-01-26 14:17:44.158 | DEBUG    | __main__:trials:24 - Trial = 16180/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.160 | DEBUG    | __main__:trials:29 - Trial = 16180/30000 | Total reward = 51.32
2022-01-26 14:17:44.164 | DEBUG    | __main__:trials:24 - Trial = 16181/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.164 | DEBUG    | __main__:trials:29 - Trial = 16181/30000 | Total reward = 51.34
2022-01-26 14:17:44.168 | DEBUG    | __main__:trials:24 - Trial = 16182/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.170 | DEBUG    | __main__:trials:29 - Trial = 16182/30000 | Total reward = 51.73
2022-01-26 14:17:44.174 | DEBUG    | __main__:trials:24 - Trial = 16183/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.175 | DEBUG    | __main__:trials:29 - Trial = 16183/30000 | Total reward = 49.85
2022-01-26 14:17:44.179 | DEBUG    | __main__:trials:24 - Trial = 16184/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.180 | DEBUG    | __main__:trials:29 - Trial = 16184/30000 | Total reward = 47.54
2022-01-26 14:17:44.184 | DEBUG    | __main__:trials:24 - Trial = 16185/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.185 | DEBUG    | __main__:trials:29 - Trial = 16185/30000 | Total reward = 57.84
2022-01-26 14:17:44.189 | DEBUG    | __main__:trials:24 - Trial = 16186/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.189 | DEBUG    | __main__:trials:29 - Trial = 16186/30000 | Total reward = 56.23
2022-01-26 14:17:44.194 | DEBUG    | __main__:trials:24 - Trial = 16187/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.196 | DEBUG    | __main__:trials:29 - Trial = 16187/30000 | Total reward = 56.37
2022-01-26 14:17:44.199 | DEBUG    | __main__:trials:24 - Trial = 16188/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.201 | DEBUG    | __main__:trials:29 - Trial = 16188/30000 | Total reward = 57.71
2022-01-26 14:17:44.204 | DEBUG    | __main__:trials:24 - Trial = 16189/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.205 | DEBUG    | __main__:trials:29 - Trial = 16189/30000 | Total reward = 48.06
2022-01-26 14:17:44.208 | DEBUG    | __main__:trials:24 - Trial = 16190/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.209 | DEBUG    | __main__:trials:29 - Trial = 16190/30000 | Total reward = 51.73
2022-01-26 14:17:44.212 | DEBUG    | __main__:trials:24 - Trial = 16191/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.214 | DEBUG    | __main__:trials:29 - Trial = 16191/30000 | Total reward = 54.42
2022-01-26 14:17:44.218 | DEBUG    | __main__:trials:24 - Trial = 16192/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.219 | DEBUG    | __main__:trials:29 - Trial = 16192/30000 | Total reward = 37.63
2022-01-26 14:17:44.223 | DEBUG    | __main__:trials:24 - Trial = 16193/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.225 | DEBUG    | __main__:trials:29 - Trial = 16193/30000 | Total reward = 50.67
2022-01-26 14:17:44.228 | DEBUG    | __main__:trials:24 - Trial = 16194/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.229 | DEBUG    | __main__:trials:29 - Trial = 16194/30000 | Total reward = 59.36
2022-01-26 14:17:44.233 | DEBUG    | __main__:trials:24 - Trial = 16195/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.234 | DEBUG    | __main__:trials:29 - Trial = 16195/30000 | Total reward = 56.79
2022-01-26 14:17:44.238 | DEBUG    | __main__:trials:24 - Trial = 16196/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.239 | DEBUG    | __main__:trials:29 - Trial = 16196/30000 | Total reward = 52.11
2022-01-26 14:17:44.243 | DEBUG    | __main__:trials:24 - Trial = 16197/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.244 | DEBUG    | __main__:trials:29 - Trial = 16197/30000 | Total reward = 53.50
2022-01-26 14:17:44.248 | DEBUG    | __main__:trials:24 - Trial = 16198/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.250 | DEBUG    | __main__:trials:29 - Trial = 16198/30000 | Total reward = 47.82
2022-01-26 14:17:44.253 | DEBUG    | __main__:trials:24 - Trial = 16199/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.254 | DEBUG    | __main__:trials:29 - Trial = 16199/30000 | Total reward = 51.38
2022-01-26 14:17:44.258 | DEBUG    | __main__:trials:24 - Trial = 16200/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.259 | DEBUG    | __main__:trials:29 - Trial = 16200/30000 | Total reward = 56.73
2022-01-26 14:17:44.263 | DEBUG    | __main__:trials:24 - Trial = 16201/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.263 | DEBUG    | __main__:trials:29 - Trial = 16201/30000 | Total reward = 39.95
2022-01-26 14:17:44.267 | DEBUG    | __main__:trials:24 - Trial = 16202/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.269 | DEBUG    | __main__:trials:29 - Trial = 16202/30000 | Total reward = 38.92
2022-01-26 14:17:44.273 | DEBUG    | __main__:trials:24 - Trial = 16203/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.273 | DEBUG    | __main__:trials:29 - Trial = 16203/30000 | Total reward = 45.92
2022-01-26 14:17:44.277 | DEBUG    | __main__:trials:24 - Trial = 16204/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.278 | DEBUG    | __main__:trials:29 - Trial = 16204/30000 | Total reward = 58.23
2022-01-26 14:17:44.281 | DEBUG    | __main__:trials:24 - Trial = 16205/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.283 | DEBUG    | __main__:trials:29 - Trial = 16205/30000 | Total reward = 51.83
2022-01-26 14:17:44.286 | DEBUG    | __main__:trials:24 - Trial = 16206/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.287 | DEBUG    | __main__:trials:29 - Trial = 16206/30000 | Total reward = 53.05
2022-01-26 14:17:44.291 | DEBUG    | __main__:trials:24 - Trial = 16207/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.293 | DEBUG    | __main__:trials:29 - Trial = 16207/30000 | Total reward = 50.28
2022-01-26 14:17:44.296 | DEBUG    | __main__:trials:24 - Trial = 16208/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.298 | DEBUG    | __main__:trials:29 - Trial = 16208/30000 | Total reward = 42.29
2022-01-26 14:17:44.301 | DEBUG    | __main__:trials:24 - Trial = 16209/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.303 | DEBUG    | __main__:trials:29 - Trial = 16209/30000 | Total reward = 60.89
2022-01-26 14:17:44.307 | DEBUG    | __main__:trials:24 - Trial = 16210/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.308 | DEBUG    | __main__:trials:29 - Trial = 16210/30000 | Total reward = 62.11
2022-01-26 14:17:44.312 | DEBUG    | __main__:trials:24 - Trial = 16211/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.314 | DEBUG    | __main__:trials:29 - Trial = 16211/30000 | Total reward = 51.14
2022-01-26 14:17:44.317 | DEBUG    | __main__:trials:24 - Trial = 16212/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.319 | DEBUG    | __main__:trials:29 - Trial = 16212/30000 | Total reward = 62.97
2022-01-26 14:17:44.323 | DEBUG    | __main__:trials:24 - Trial = 16213/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.323 | DEBUG    | __main__:trials:29 - Trial = 16213/30000 | Total reward = 47.59
2022-01-26 14:17:44.328 | DEBUG    | __main__:trials:24 - Trial = 16214/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.330 | DEBUG    | __main__:trials:29 - Trial = 16214/30000 | Total reward = 40.45
2022-01-26 14:17:44.333 | DEBUG    | __main__:trials:24 - Trial = 16215/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.335 | DEBUG    | __main__:trials:29 - Trial = 16215/30000 | Total reward = 54.61
2022-01-26 14:17:44.339 | DEBUG    | __main__:trials:24 - Trial = 16216/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.340 | DEBUG    | __main__:trials:29 - Trial = 16216/30000 | Total reward = 39.28
2022-01-26 14:17:44.343 | DEBUG    | __main__:trials:24 - Trial = 16217/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.345 | DEBUG    | __main__:trials:29 - Trial = 16217/30000 | Total reward = 51.32
2022-01-26 14:17:44.349 | DEBUG    | __main__:trials:24 - Trial = 16218/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.351 | DEBUG    | __main__:trials:29 - Trial = 16218/30000 | Total reward = 51.90
2022-01-26 14:17:44.353 | DEBUG    | __main__:trials:26 - Trial = 16219/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.355 | DEBUG    | __main__:trials:29 - Trial = 16219/30000 | Total reward = 22.58
2022-01-26 14:17:44.358 | DEBUG    | __main__:trials:24 - Trial = 16220/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.360 | DEBUG    | __main__:trials:29 - Trial = 16220/30000 | Total reward = 52.84
2022-01-26 14:17:44.363 | DEBUG    | __main__:trials:24 - Trial = 16221/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.365 | DEBUG    | __main__:trials:29 - Trial = 16221/30000 | Total reward = 51.32
2022-01-26 14:17:44.368 | DEBUG    | __main__:trials:24 - Trial = 16222/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.370 | DEBUG    | __main__:trials:29 - Trial = 16222/30000 | Total reward = 53.65
2022-01-26 14:17:44.373 | DEBUG    | __main__:trials:24 - Trial = 16223/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.374 | DEBUG    | __main__:trials:29 - Trial = 16223/30000 | Total reward = 48.72
2022-01-26 14:17:44.377 | DEBUG    | __main__:trials:24 - Trial = 16224/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.378 | DEBUG    | __main__:trials:29 - Trial = 16224/30000 | Total reward = 47.03
2022-01-26 14:17:44.381 | DEBUG    | __main__:trials:24 - Trial = 16225/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.383 | DEBUG    | __main__:trials:29 - Trial = 16225/30000 | Total reward = 56.33
2022-01-26 14:17:44.387 | DEBUG    | __main__:trials:24 - Trial = 16226/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.387 | DEBUG    | __main__:trials:29 - Trial = 16226/30000 | Total reward = 31.81
2022-01-26 14:17:44.392 | DEBUG    | __main__:trials:24 - Trial = 16227/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.392 | DEBUG    | __main__:trials:29 - Trial = 16227/30000 | Total reward = 55.93
2022-01-26 14:17:44.396 | DEBUG    | __main__:trials:24 - Trial = 16228/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.397 | DEBUG    | __main__:trials:29 - Trial = 16228/30000 | Total reward = 58.06
2022-01-26 14:17:44.401 | DEBUG    | __main__:trials:24 - Trial = 16229/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.403 | DEBUG    | __main__:trials:29 - Trial = 16229/30000 | Total reward = 9.02
2022-01-26 14:17:44.406 | DEBUG    | __main__:trials:24 - Trial = 16230/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.408 | DEBUG    | __main__:trials:29 - Trial = 16230/30000 | Total reward = 50.66
2022-01-26 14:17:44.412 | DEBUG    | __main__:trials:24 - Trial = 16231/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.413 | DEBUG    | __main__:trials:29 - Trial = 16231/30000 | Total reward = 52.25
2022-01-26 14:17:44.417 | DEBUG    | __main__:trials:24 - Trial = 16232/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.418 | DEBUG    | __main__:trials:29 - Trial = 16232/30000 | Total reward = 46.43
2022-01-26 14:17:44.422 | DEBUG    | __main__:trials:24 - Trial = 16233/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.423 | DEBUG    | __main__:trials:29 - Trial = 16233/30000 | Total reward = 42.58
2022-01-26 14:17:44.426 | DEBUG    | __main__:trials:24 - Trial = 16234/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.428 | DEBUG    | __main__:trials:29 - Trial = 16234/30000 | Total reward = 53.05
2022-01-26 14:17:44.431 | DEBUG    | __main__:trials:24 - Trial = 16235/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.432 | DEBUG    | __main__:trials:29 - Trial = 16235/30000 | Total reward = 51.73
2022-01-26 14:17:44.435 | DEBUG    | __main__:trials:24 - Trial = 16236/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.437 | DEBUG    | __main__:trials:29 - Trial = 16236/30000 | Total reward = 61.18
2022-01-26 14:17:44.441 | DEBUG    | __main__:trials:26 - Trial = 16237/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.442 | DEBUG    | __main__:trials:29 - Trial = 16237/30000 | Total reward = 27.52
2022-01-26 14:17:44.445 | DEBUG    | __main__:trials:24 - Trial = 16238/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.446 | DEBUG    | __main__:trials:29 - Trial = 16238/30000 | Total reward = 52.35
2022-01-26 14:17:44.449 | DEBUG    | __main__:trials:24 - Trial = 16239/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.450 | DEBUG    | __main__:trials:29 - Trial = 16239/30000 | Total reward = 40.63
2022-01-26 14:17:44.453 | DEBUG    | __main__:trials:24 - Trial = 16240/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.454 | DEBUG    | __main__:trials:29 - Trial = 16240/30000 | Total reward = 23.71
2022-01-26 14:17:44.457 | DEBUG    | __main__:trials:24 - Trial = 16241/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.459 | DEBUG    | __main__:trials:29 - Trial = 16241/30000 | Total reward = 39.61
2022-01-26 14:17:44.462 | DEBUG    | __main__:trials:24 - Trial = 16242/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.464 | DEBUG    | __main__:trials:29 - Trial = 16242/30000 | Total reward = 50.88
2022-01-26 14:17:44.468 | DEBUG    | __main__:trials:24 - Trial = 16243/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.469 | DEBUG    | __main__:trials:29 - Trial = 16243/30000 | Total reward = 38.39
2022-01-26 14:17:44.472 | DEBUG    | __main__:trials:24 - Trial = 16244/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.474 | DEBUG    | __main__:trials:29 - Trial = 16244/30000 | Total reward = 52.46
2022-01-26 14:17:44.477 | DEBUG    | __main__:trials:24 - Trial = 16245/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.478 | DEBUG    | __main__:trials:29 - Trial = 16245/30000 | Total reward = 32.44
2022-01-26 14:17:44.482 | DEBUG    | __main__:trials:24 - Trial = 16246/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.484 | DEBUG    | __main__:trials:29 - Trial = 16246/30000 | Total reward = 49.61
2022-01-26 14:17:44.486 | DEBUG    | __main__:trials:26 - Trial = 16247/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.488 | DEBUG    | __main__:trials:29 - Trial = 16247/30000 | Total reward = 22.83
2022-01-26 14:17:44.491 | DEBUG    | __main__:trials:24 - Trial = 16248/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.493 | DEBUG    | __main__:trials:29 - Trial = 16248/30000 | Total reward = 43.78
2022-01-26 14:17:44.496 | DEBUG    | __main__:trials:24 - Trial = 16249/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.498 | DEBUG    | __main__:trials:29 - Trial = 16249/30000 | Total reward = 44.32
2022-01-26 14:17:44.502 | DEBUG    | __main__:trials:24 - Trial = 16250/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.503 | DEBUG    | __main__:trials:29 - Trial = 16250/30000 | Total reward = 38.79
2022-01-26 14:17:44.507 | DEBUG    | __main__:trials:24 - Trial = 16251/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.508 | DEBUG    | __main__:trials:29 - Trial = 16251/30000 | Total reward = 35.46
2022-01-26 14:17:44.512 | DEBUG    | __main__:trials:24 - Trial = 16252/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.513 | DEBUG    | __main__:trials:29 - Trial = 16252/30000 | Total reward = 49.70
2022-01-26 14:17:44.517 | DEBUG    | __main__:trials:24 - Trial = 16253/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.517 | DEBUG    | __main__:trials:29 - Trial = 16253/30000 | Total reward = 36.93
2022-01-26 14:17:44.523 | DEBUG    | __main__:trials:24 - Trial = 16254/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.524 | DEBUG    | __main__:trials:29 - Trial = 16254/30000 | Total reward = 47.30
2022-01-26 14:17:44.528 | DEBUG    | __main__:trials:24 - Trial = 16255/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.530 | DEBUG    | __main__:trials:29 - Trial = 16255/30000 | Total reward = 51.43
2022-01-26 14:17:44.533 | DEBUG    | __main__:trials:24 - Trial = 16256/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.535 | DEBUG    | __main__:trials:29 - Trial = 16256/30000 | Total reward = 48.52
2022-01-26 14:17:44.539 | DEBUG    | __main__:trials:24 - Trial = 16257/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.540 | DEBUG    | __main__:trials:29 - Trial = 16257/30000 | Total reward = 30.71
2022-01-26 14:17:44.544 | DEBUG    | __main__:trials:24 - Trial = 16258/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.545 | DEBUG    | __main__:trials:29 - Trial = 16258/30000 | Total reward = 39.48
2022-01-26 14:17:44.549 | DEBUG    | __main__:trials:24 - Trial = 16259/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.551 | DEBUG    | __main__:trials:29 - Trial = 16259/30000 | Total reward = 59.28
2022-01-26 14:17:44.554 | DEBUG    | __main__:trials:26 - Trial = 16260/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.555 | DEBUG    | __main__:trials:29 - Trial = 16260/30000 | Total reward = 30.28
2022-01-26 14:17:44.559 | DEBUG    | __main__:trials:24 - Trial = 16261/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.560 | DEBUG    | __main__:trials:29 - Trial = 16261/30000 | Total reward = 43.52
2022-01-26 14:17:44.564 | DEBUG    | __main__:trials:24 - Trial = 16262/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.565 | DEBUG    | __main__:trials:29 - Trial = 16262/30000 | Total reward = 52.34
2022-01-26 14:17:44.569 | DEBUG    | __main__:trials:24 - Trial = 16263/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.570 | DEBUG    | __main__:trials:29 - Trial = 16263/30000 | Total reward = 43.83
2022-01-26 14:17:44.574 | DEBUG    | __main__:trials:24 - Trial = 16264/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.576 | DEBUG    | __main__:trials:29 - Trial = 16264/30000 | Total reward = 49.05
2022-01-26 14:17:44.580 | DEBUG    | __main__:trials:24 - Trial = 16265/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.580 | DEBUG    | __main__:trials:29 - Trial = 16265/30000 | Total reward = 44.32
2022-01-26 14:17:44.584 | DEBUG    | __main__:trials:24 - Trial = 16266/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.586 | DEBUG    | __main__:trials:29 - Trial = 16266/30000 | Total reward = 41.36
2022-01-26 14:17:44.590 | DEBUG    | __main__:trials:24 - Trial = 16267/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.591 | DEBUG    | __main__:trials:29 - Trial = 16267/30000 | Total reward = 50.86
2022-01-26 14:17:44.595 | DEBUG    | __main__:trials:24 - Trial = 16268/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.597 | DEBUG    | __main__:trials:29 - Trial = 16268/30000 | Total reward = 47.78
2022-01-26 14:17:44.600 | DEBUG    | __main__:trials:24 - Trial = 16269/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.602 | DEBUG    | __main__:trials:29 - Trial = 16269/30000 | Total reward = 47.91
2022-01-26 14:17:44.606 | DEBUG    | __main__:trials:24 - Trial = 16270/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.607 | DEBUG    | __main__:trials:29 - Trial = 16270/30000 | Total reward = 63.71
2022-01-26 14:17:44.610 | DEBUG    | __main__:trials:24 - Trial = 16271/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.612 | DEBUG    | __main__:trials:29 - Trial = 16271/30000 | Total reward = 43.54
2022-01-26 14:17:44.616 | DEBUG    | __main__:trials:24 - Trial = 16272/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.617 | DEBUG    | __main__:trials:29 - Trial = 16272/30000 | Total reward = 38.14
2022-01-26 14:17:44.621 | DEBUG    | __main__:trials:24 - Trial = 16273/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.622 | DEBUG    | __main__:trials:29 - Trial = 16273/30000 | Total reward = 35.16
2022-01-26 14:17:44.626 | DEBUG    | __main__:trials:24 - Trial = 16274/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.627 | DEBUG    | __main__:trials:29 - Trial = 16274/30000 | Total reward = 43.41
2022-01-26 14:17:44.631 | DEBUG    | __main__:trials:24 - Trial = 16275/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.632 | DEBUG    | __main__:trials:29 - Trial = 16275/30000 | Total reward = 33.15
2022-01-26 14:17:44.636 | DEBUG    | __main__:trials:26 - Trial = 16276/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.638 | DEBUG    | __main__:trials:29 - Trial = 16276/30000 | Total reward = 38.15
2022-01-26 14:17:44.641 | DEBUG    | __main__:trials:24 - Trial = 16277/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.643 | DEBUG    | __main__:trials:29 - Trial = 16277/30000 | Total reward = 38.73
2022-01-26 14:17:44.646 | DEBUG    | __main__:trials:24 - Trial = 16278/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.648 | DEBUG    | __main__:trials:29 - Trial = 16278/30000 | Total reward = 40.72
2022-01-26 14:17:44.651 | DEBUG    | __main__:trials:24 - Trial = 16279/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.652 | DEBUG    | __main__:trials:29 - Trial = 16279/30000 | Total reward = 54.80
2022-01-26 14:17:44.656 | DEBUG    | __main__:trials:24 - Trial = 16280/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.658 | DEBUG    | __main__:trials:29 - Trial = 16280/30000 | Total reward = 50.65
2022-01-26 14:17:44.661 | DEBUG    | __main__:trials:24 - Trial = 16281/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.663 | DEBUG    | __main__:trials:29 - Trial = 16281/30000 | Total reward = 45.34
2022-01-26 14:17:44.666 | DEBUG    | __main__:trials:24 - Trial = 16282/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.667 | DEBUG    | __main__:trials:29 - Trial = 16282/30000 | Total reward = 47.22
2022-01-26 14:17:44.670 | DEBUG    | __main__:trials:24 - Trial = 16283/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.672 | DEBUG    | __main__:trials:29 - Trial = 16283/30000 | Total reward = 26.10
2022-01-26 14:17:44.675 | DEBUG    | __main__:trials:24 - Trial = 16284/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.677 | DEBUG    | __main__:trials:29 - Trial = 16284/30000 | Total reward = 52.47
2022-01-26 14:17:44.680 | DEBUG    | __main__:trials:24 - Trial = 16285/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.682 | DEBUG    | __main__:trials:29 - Trial = 16285/30000 | Total reward = 54.26
2022-01-26 14:17:44.686 | DEBUG    | __main__:trials:24 - Trial = 16286/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.687 | DEBUG    | __main__:trials:29 - Trial = 16286/30000 | Total reward = 44.13
2022-01-26 14:17:44.691 | DEBUG    | __main__:trials:24 - Trial = 16287/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.692 | DEBUG    | __main__:trials:29 - Trial = 16287/30000 | Total reward = 40.88
2022-01-26 14:17:44.696 | DEBUG    | __main__:trials:24 - Trial = 16288/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.697 | DEBUG    | __main__:trials:29 - Trial = 16288/30000 | Total reward = 40.07
2022-01-26 14:17:44.701 | DEBUG    | __main__:trials:24 - Trial = 16289/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.702 | DEBUG    | __main__:trials:29 - Trial = 16289/30000 | Total reward = 52.77
2022-01-26 14:17:44.706 | DEBUG    | __main__:trials:24 - Trial = 16290/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.706 | DEBUG    | __main__:trials:29 - Trial = 16290/30000 | Total reward = 40.99
2022-01-26 14:17:44.711 | DEBUG    | __main__:trials:24 - Trial = 16291/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.711 | DEBUG    | __main__:trials:29 - Trial = 16291/30000 | Total reward = 46.94
2022-01-26 14:17:44.716 | DEBUG    | __main__:trials:24 - Trial = 16292/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.717 | DEBUG    | __main__:trials:29 - Trial = 16292/30000 | Total reward = 40.37
2022-01-26 14:17:44.721 | DEBUG    | __main__:trials:24 - Trial = 16293/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.723 | DEBUG    | __main__:trials:29 - Trial = 16293/30000 | Total reward = 35.14
2022-01-26 14:17:44.726 | DEBUG    | __main__:trials:24 - Trial = 16294/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.728 | DEBUG    | __main__:trials:29 - Trial = 16294/30000 | Total reward = 60.07
2022-01-26 14:17:44.732 | DEBUG    | __main__:trials:24 - Trial = 16295/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.733 | DEBUG    | __main__:trials:29 - Trial = 16295/30000 | Total reward = 43.86
2022-01-26 14:17:44.737 | DEBUG    | __main__:trials:24 - Trial = 16296/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.738 | DEBUG    | __main__:trials:29 - Trial = 16296/30000 | Total reward = 42.03
2022-01-26 14:17:44.742 | DEBUG    | __main__:trials:24 - Trial = 16297/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.744 | DEBUG    | __main__:trials:29 - Trial = 16297/30000 | Total reward = 33.53
2022-01-26 14:17:44.746 | DEBUG    | __main__:trials:24 - Trial = 16298/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.748 | DEBUG    | __main__:trials:29 - Trial = 16298/30000 | Total reward = 39.18
2022-01-26 14:17:44.751 | DEBUG    | __main__:trials:24 - Trial = 16299/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.753 | DEBUG    | __main__:trials:29 - Trial = 16299/30000 | Total reward = 34.92
2022-01-26 14:17:44.756 | DEBUG    | __main__:trials:24 - Trial = 16300/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.758 | DEBUG    | __main__:trials:29 - Trial = 16300/30000 | Total reward = 37.42
2022-01-26 14:17:44.761 | DEBUG    | __main__:trials:24 - Trial = 16301/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.762 | DEBUG    | __main__:trials:29 - Trial = 16301/30000 | Total reward = 48.06
2022-01-26 14:17:44.765 | DEBUG    | __main__:trials:24 - Trial = 16302/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.766 | DEBUG    | __main__:trials:29 - Trial = 16302/30000 | Total reward = 40.10
2022-01-26 14:17:44.769 | DEBUG    | __main__:trials:24 - Trial = 16303/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.771 | DEBUG    | __main__:trials:29 - Trial = 16303/30000 | Total reward = 44.00
2022-01-26 14:17:44.774 | DEBUG    | __main__:trials:24 - Trial = 16304/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.775 | DEBUG    | __main__:trials:29 - Trial = 16304/30000 | Total reward = 56.93
2022-01-26 14:17:44.780 | DEBUG    | __main__:trials:24 - Trial = 16305/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.781 | DEBUG    | __main__:trials:29 - Trial = 16305/30000 | Total reward = 40.10
2022-01-26 14:17:44.785 | DEBUG    | __main__:trials:24 - Trial = 16306/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.786 | DEBUG    | __main__:trials:29 - Trial = 16306/30000 | Total reward = 61.75
2022-01-26 14:17:44.790 | DEBUG    | __main__:trials:24 - Trial = 16307/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.790 | DEBUG    | __main__:trials:29 - Trial = 16307/30000 | Total reward = 46.38
2022-01-26 14:17:44.794 | DEBUG    | __main__:trials:24 - Trial = 16308/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.796 | DEBUG    | __main__:trials:29 - Trial = 16308/30000 | Total reward = 52.76
2022-01-26 14:17:44.799 | DEBUG    | __main__:trials:24 - Trial = 16309/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.800 | DEBUG    | __main__:trials:29 - Trial = 16309/30000 | Total reward = 40.84
2022-01-26 14:17:44.804 | DEBUG    | __main__:trials:24 - Trial = 16310/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.805 | DEBUG    | __main__:trials:29 - Trial = 16310/30000 | Total reward = 39.48
2022-01-26 14:17:44.809 | DEBUG    | __main__:trials:24 - Trial = 16311/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.810 | DEBUG    | __main__:trials:29 - Trial = 16311/30000 | Total reward = 41.36
2022-01-26 14:17:44.814 | DEBUG    | __main__:trials:24 - Trial = 16312/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.816 | DEBUG    | __main__:trials:29 - Trial = 16312/30000 | Total reward = 35.44
2022-01-26 14:17:44.819 | DEBUG    | __main__:trials:24 - Trial = 16313/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.820 | DEBUG    | __main__:trials:29 - Trial = 16313/30000 | Total reward = 34.64
2022-01-26 14:17:44.823 | DEBUG    | __main__:trials:24 - Trial = 16314/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.825 | DEBUG    | __main__:trials:29 - Trial = 16314/30000 | Total reward = 43.83
2022-01-26 14:17:44.828 | DEBUG    | __main__:trials:24 - Trial = 16315/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.830 | DEBUG    | __main__:trials:29 - Trial = 16315/30000 | Total reward = 41.58
2022-01-26 14:17:44.834 | DEBUG    | __main__:trials:24 - Trial = 16316/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.835 | DEBUG    | __main__:trials:29 - Trial = 16316/30000 | Total reward = 35.59
2022-01-26 14:17:44.839 | DEBUG    | __main__:trials:24 - Trial = 16317/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.840 | DEBUG    | __main__:trials:29 - Trial = 16317/30000 | Total reward = 47.75
2022-01-26 14:17:44.844 | DEBUG    | __main__:trials:24 - Trial = 16318/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.846 | DEBUG    | __main__:trials:29 - Trial = 16318/30000 | Total reward = 48.69
2022-01-26 14:17:44.849 | DEBUG    | __main__:trials:24 - Trial = 16319/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.851 | DEBUG    | __main__:trials:29 - Trial = 16319/30000 | Total reward = 53.45
2022-01-26 14:17:44.854 | DEBUG    | __main__:trials:24 - Trial = 16320/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.855 | DEBUG    | __main__:trials:29 - Trial = 16320/30000 | Total reward = 51.43
2022-01-26 14:17:44.858 | DEBUG    | __main__:trials:24 - Trial = 16321/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.860 | DEBUG    | __main__:trials:29 - Trial = 16321/30000 | Total reward = 39.42
2022-01-26 14:17:44.864 | DEBUG    | __main__:trials:24 - Trial = 16322/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.865 | DEBUG    | __main__:trials:29 - Trial = 16322/30000 | Total reward = 65.29
2022-01-26 14:17:44.869 | DEBUG    | __main__:trials:24 - Trial = 16323/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.870 | DEBUG    | __main__:trials:29 - Trial = 16323/30000 | Total reward = 42.20
2022-01-26 14:17:44.873 | DEBUG    | __main__:trials:24 - Trial = 16324/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.874 | DEBUG    | __main__:trials:29 - Trial = 16324/30000 | Total reward = 52.07
2022-01-26 14:17:44.878 | DEBUG    | __main__:trials:24 - Trial = 16325/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.879 | DEBUG    | __main__:trials:29 - Trial = 16325/30000 | Total reward = 54.06
2022-01-26 14:17:44.882 | DEBUG    | __main__:trials:24 - Trial = 16326/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.884 | DEBUG    | __main__:trials:29 - Trial = 16326/30000 | Total reward = 43.17
2022-01-26 14:17:44.887 | DEBUG    | __main__:trials:24 - Trial = 16327/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.888 | DEBUG    | __main__:trials:29 - Trial = 16327/30000 | Total reward = 39.46
2022-01-26 14:17:44.891 | DEBUG    | __main__:trials:24 - Trial = 16328/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.893 | DEBUG    | __main__:trials:29 - Trial = 16328/30000 | Total reward = 53.87
2022-01-26 14:17:44.896 | DEBUG    | __main__:trials:24 - Trial = 16329/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.897 | DEBUG    | __main__:trials:29 - Trial = 16329/30000 | Total reward = 50.32
2022-01-26 14:17:44.901 | DEBUG    | __main__:trials:26 - Trial = 16330/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.903 | DEBUG    | __main__:trials:29 - Trial = 16330/30000 | Total reward = 34.60
2022-01-26 14:17:44.907 | DEBUG    | __main__:trials:24 - Trial = 16331/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.908 | DEBUG    | __main__:trials:29 - Trial = 16331/30000 | Total reward = 47.91
2022-01-26 14:17:44.912 | DEBUG    | __main__:trials:24 - Trial = 16332/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.913 | DEBUG    | __main__:trials:29 - Trial = 16332/30000 | Total reward = 61.55
2022-01-26 14:17:44.917 | DEBUG    | __main__:trials:24 - Trial = 16333/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.918 | DEBUG    | __main__:trials:29 - Trial = 16333/30000 | Total reward = 37.31
2022-01-26 14:17:44.922 | DEBUG    | __main__:trials:24 - Trial = 16334/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.924 | DEBUG    | __main__:trials:29 - Trial = 16334/30000 | Total reward = 51.29
2022-01-26 14:17:44.927 | DEBUG    | __main__:trials:24 - Trial = 16335/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.928 | DEBUG    | __main__:trials:29 - Trial = 16335/30000 | Total reward = 41.72
2022-01-26 14:17:44.931 | DEBUG    | __main__:trials:24 - Trial = 16336/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.933 | DEBUG    | __main__:trials:29 - Trial = 16336/30000 | Total reward = 43.34
2022-01-26 14:17:44.936 | DEBUG    | __main__:trials:24 - Trial = 16337/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.937 | DEBUG    | __main__:trials:29 - Trial = 16337/30000 | Total reward = 38.98
2022-01-26 14:17:44.940 | DEBUG    | __main__:trials:24 - Trial = 16338/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.942 | DEBUG    | __main__:trials:29 - Trial = 16338/30000 | Total reward = 34.99
2022-01-26 14:17:44.946 | DEBUG    | __main__:trials:24 - Trial = 16339/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.947 | DEBUG    | __main__:trials:29 - Trial = 16339/30000 | Total reward = 40.44
2022-01-26 14:17:44.951 | DEBUG    | __main__:trials:24 - Trial = 16340/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.952 | DEBUG    | __main__:trials:29 - Trial = 16340/30000 | Total reward = 37.66
2022-01-26 14:17:44.956 | DEBUG    | __main__:trials:24 - Trial = 16341/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.958 | DEBUG    | __main__:trials:29 - Trial = 16341/30000 | Total reward = 38.33
2022-01-26 14:17:44.961 | DEBUG    | __main__:trials:24 - Trial = 16342/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.962 | DEBUG    | __main__:trials:29 - Trial = 16342/30000 | Total reward = 42.67
2022-01-26 14:17:44.965 | DEBUG    | __main__:trials:26 - Trial = 16343/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:44.966 | DEBUG    | __main__:trials:29 - Trial = 16343/30000 | Total reward = 25.11
2022-01-26 14:17:44.970 | DEBUG    | __main__:trials:24 - Trial = 16344/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.972 | DEBUG    | __main__:trials:29 - Trial = 16344/30000 | Total reward = 54.23
2022-01-26 14:17:44.975 | DEBUG    | __main__:trials:24 - Trial = 16345/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.977 | DEBUG    | __main__:trials:29 - Trial = 16345/30000 | Total reward = 54.87
2022-01-26 14:17:44.980 | DEBUG    | __main__:trials:24 - Trial = 16346/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.982 | DEBUG    | __main__:trials:29 - Trial = 16346/30000 | Total reward = 52.37
2022-01-26 14:17:44.985 | DEBUG    | __main__:trials:24 - Trial = 16347/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.987 | DEBUG    | __main__:trials:29 - Trial = 16347/30000 | Total reward = 39.62
2022-01-26 14:17:44.990 | DEBUG    | __main__:trials:24 - Trial = 16348/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.991 | DEBUG    | __main__:trials:29 - Trial = 16348/30000 | Total reward = 38.99
2022-01-26 14:17:44.995 | DEBUG    | __main__:trials:24 - Trial = 16349/30000 | Max number of steps (20) reached
2022-01-26 14:17:44.997 | DEBUG    | __main__:trials:29 - Trial = 16349/30000 | Total reward = 35.61
2022-01-26 14:17:45.000 | DEBUG    | __main__:trials:24 - Trial = 16350/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.002 | DEBUG    | __main__:trials:29 - Trial = 16350/30000 | Total reward = 51.85
2022-01-26 14:17:45.005 | DEBUG    | __main__:trials:24 - Trial = 16351/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.007 | DEBUG    | __main__:trials:29 - Trial = 16351/30000 | Total reward = 44.08
2022-01-26 14:17:45.010 | DEBUG    | __main__:trials:24 - Trial = 16352/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.011 | DEBUG    | __main__:trials:29 - Trial = 16352/30000 | Total reward = 45.51
2022-01-26 14:17:45.015 | DEBUG    | __main__:trials:24 - Trial = 16353/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.017 | DEBUG    | __main__:trials:29 - Trial = 16353/30000 | Total reward = 39.41
2022-01-26 14:17:45.020 | DEBUG    | __main__:trials:26 - Trial = 16354/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.021 | DEBUG    | __main__:trials:29 - Trial = 16354/30000 | Total reward = 14.36
2022-01-26 14:17:45.024 | DEBUG    | __main__:trials:26 - Trial = 16355/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.025 | DEBUG    | __main__:trials:29 - Trial = 16355/30000 | Total reward = 22.62
2022-01-26 14:17:45.028 | DEBUG    | __main__:trials:24 - Trial = 16356/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.030 | DEBUG    | __main__:trials:29 - Trial = 16356/30000 | Total reward = 40.85
2022-01-26 14:17:45.033 | DEBUG    | __main__:trials:24 - Trial = 16357/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.035 | DEBUG    | __main__:trials:29 - Trial = 16357/30000 | Total reward = 62.23
2022-01-26 14:17:45.038 | DEBUG    | __main__:trials:24 - Trial = 16358/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.039 | DEBUG    | __main__:trials:29 - Trial = 16358/30000 | Total reward = 39.23
2022-01-26 14:17:45.043 | DEBUG    | __main__:trials:24 - Trial = 16359/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.044 | DEBUG    | __main__:trials:29 - Trial = 16359/30000 | Total reward = 35.07
2022-01-26 14:17:45.047 | DEBUG    | __main__:trials:24 - Trial = 16360/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.049 | DEBUG    | __main__:trials:29 - Trial = 16360/30000 | Total reward = 34.36
2022-01-26 14:17:45.052 | DEBUG    | __main__:trials:24 - Trial = 16361/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.053 | DEBUG    | __main__:trials:29 - Trial = 16361/30000 | Total reward = 39.50
2022-01-26 14:17:45.058 | DEBUG    | __main__:trials:24 - Trial = 16362/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.059 | DEBUG    | __main__:trials:29 - Trial = 16362/30000 | Total reward = 40.87
2022-01-26 14:17:45.063 | DEBUG    | __main__:trials:24 - Trial = 16363/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.064 | DEBUG    | __main__:trials:29 - Trial = 16363/30000 | Total reward = 61.33
2022-01-26 14:17:45.068 | DEBUG    | __main__:trials:24 - Trial = 16364/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.069 | DEBUG    | __main__:trials:29 - Trial = 16364/30000 | Total reward = 45.63
2022-01-26 14:17:45.072 | DEBUG    | __main__:trials:24 - Trial = 16365/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.074 | DEBUG    | __main__:trials:29 - Trial = 16365/30000 | Total reward = 63.78
2022-01-26 14:17:45.078 | DEBUG    | __main__:trials:24 - Trial = 16366/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.078 | DEBUG    | __main__:trials:29 - Trial = 16366/30000 | Total reward = 53.36
2022-01-26 14:17:45.083 | DEBUG    | __main__:trials:24 - Trial = 16367/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.083 | DEBUG    | __main__:trials:29 - Trial = 16367/30000 | Total reward = 43.27
2022-01-26 14:17:45.088 | DEBUG    | __main__:trials:24 - Trial = 16368/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.089 | DEBUG    | __main__:trials:29 - Trial = 16368/30000 | Total reward = 40.46
2022-01-26 14:17:45.093 | DEBUG    | __main__:trials:24 - Trial = 16369/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.094 | DEBUG    | __main__:trials:29 - Trial = 16369/30000 | Total reward = 39.67
2022-01-26 14:17:45.097 | DEBUG    | __main__:trials:24 - Trial = 16370/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.098 | DEBUG    | __main__:trials:29 - Trial = 16370/30000 | Total reward = 44.68
2022-01-26 14:17:45.102 | DEBUG    | __main__:trials:24 - Trial = 16371/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.103 | DEBUG    | __main__:trials:29 - Trial = 16371/30000 | Total reward = 53.20
2022-01-26 14:17:45.107 | DEBUG    | __main__:trials:24 - Trial = 16372/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.108 | DEBUG    | __main__:trials:29 - Trial = 16372/30000 | Total reward = 47.94
2022-01-26 14:17:45.112 | DEBUG    | __main__:trials:24 - Trial = 16373/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.113 | DEBUG    | __main__:trials:29 - Trial = 16373/30000 | Total reward = 35.08
2022-01-26 14:17:45.117 | DEBUG    | __main__:trials:24 - Trial = 16374/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.118 | DEBUG    | __main__:trials:29 - Trial = 16374/30000 | Total reward = 40.68
2022-01-26 14:17:45.121 | DEBUG    | __main__:trials:24 - Trial = 16375/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.122 | DEBUG    | __main__:trials:29 - Trial = 16375/30000 | Total reward = 47.62
2022-01-26 14:17:45.127 | DEBUG    | __main__:trials:24 - Trial = 16376/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.128 | DEBUG    | __main__:trials:29 - Trial = 16376/30000 | Total reward = 41.01
2022-01-26 14:17:45.132 | DEBUG    | __main__:trials:24 - Trial = 16377/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.132 | DEBUG    | __main__:trials:29 - Trial = 16377/30000 | Total reward = 55.17
2022-01-26 14:17:45.136 | DEBUG    | __main__:trials:24 - Trial = 16378/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.137 | DEBUG    | __main__:trials:29 - Trial = 16378/30000 | Total reward = 36.81
2022-01-26 14:17:45.141 | DEBUG    | __main__:trials:24 - Trial = 16379/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.142 | DEBUG    | __main__:trials:29 - Trial = 16379/30000 | Total reward = 65.16
2022-01-26 14:17:45.146 | DEBUG    | __main__:trials:24 - Trial = 16380/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.146 | DEBUG    | __main__:trials:29 - Trial = 16380/30000 | Total reward = 33.92
2022-01-26 14:17:45.150 | DEBUG    | __main__:trials:24 - Trial = 16381/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.151 | DEBUG    | __main__:trials:29 - Trial = 16381/30000 | Total reward = 35.99
2022-01-26 14:17:45.155 | DEBUG    | __main__:trials:24 - Trial = 16382/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.156 | DEBUG    | __main__:trials:29 - Trial = 16382/30000 | Total reward = 44.10
2022-01-26 14:17:45.159 | DEBUG    | __main__:trials:24 - Trial = 16383/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.161 | DEBUG    | __main__:trials:29 - Trial = 16383/30000 | Total reward = 47.88
2022-01-26 14:17:45.164 | DEBUG    | __main__:trials:24 - Trial = 16384/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.165 | DEBUG    | __main__:trials:29 - Trial = 16384/30000 | Total reward = 41.74
2022-01-26 14:17:45.169 | DEBUG    | __main__:trials:24 - Trial = 16385/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.170 | DEBUG    | __main__:trials:29 - Trial = 16385/30000 | Total reward = 57.96
2022-01-26 14:17:45.173 | DEBUG    | __main__:trials:24 - Trial = 16386/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.174 | DEBUG    | __main__:trials:29 - Trial = 16386/30000 | Total reward = 56.07
2022-01-26 14:17:45.177 | DEBUG    | __main__:trials:24 - Trial = 16387/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.178 | DEBUG    | __main__:trials:29 - Trial = 16387/30000 | Total reward = 33.68
2022-01-26 14:17:45.182 | DEBUG    | __main__:trials:24 - Trial = 16388/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.184 | DEBUG    | __main__:trials:29 - Trial = 16388/30000 | Total reward = 41.45
2022-01-26 14:17:45.187 | DEBUG    | __main__:trials:24 - Trial = 16389/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.189 | DEBUG    | __main__:trials:29 - Trial = 16389/30000 | Total reward = 45.75
2022-01-26 14:17:45.193 | DEBUG    | __main__:trials:24 - Trial = 16390/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.195 | DEBUG    | __main__:trials:29 - Trial = 16390/30000 | Total reward = 46.40
2022-01-26 14:17:45.198 | DEBUG    | __main__:trials:24 - Trial = 16391/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.200 | DEBUG    | __main__:trials:29 - Trial = 16391/30000 | Total reward = 43.90
2022-01-26 14:17:45.203 | DEBUG    | __main__:trials:24 - Trial = 16392/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.204 | DEBUG    | __main__:trials:29 - Trial = 16392/30000 | Total reward = 42.51
2022-01-26 14:17:45.209 | DEBUG    | __main__:trials:24 - Trial = 16393/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.210 | DEBUG    | __main__:trials:29 - Trial = 16393/30000 | Total reward = 36.91
2022-01-26 14:17:45.213 | DEBUG    | __main__:trials:26 - Trial = 16394/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.214 | DEBUG    | __main__:trials:29 - Trial = 16394/30000 | Total reward = 20.76
2022-01-26 14:17:45.218 | DEBUG    | __main__:trials:24 - Trial = 16395/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.219 | DEBUG    | __main__:trials:29 - Trial = 16395/30000 | Total reward = 45.90
2022-01-26 14:17:45.223 | DEBUG    | __main__:trials:24 - Trial = 16396/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.225 | DEBUG    | __main__:trials:29 - Trial = 16396/30000 | Total reward = 47.63
2022-01-26 14:17:45.228 | DEBUG    | __main__:trials:24 - Trial = 16397/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.229 | DEBUG    | __main__:trials:29 - Trial = 16397/30000 | Total reward = 35.40
2022-01-26 14:17:45.233 | DEBUG    | __main__:trials:24 - Trial = 16398/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.234 | DEBUG    | __main__:trials:29 - Trial = 16398/30000 | Total reward = 46.91
2022-01-26 14:17:45.238 | DEBUG    | __main__:trials:24 - Trial = 16399/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.239 | DEBUG    | __main__:trials:29 - Trial = 16399/30000 | Total reward = 56.79
2022-01-26 14:17:45.243 | DEBUG    | __main__:trials:24 - Trial = 16400/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.244 | DEBUG    | __main__:trials:29 - Trial = 16400/30000 | Total reward = 33.94
2022-01-26 14:17:45.248 | DEBUG    | __main__:trials:24 - Trial = 16401/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.250 | DEBUG    | __main__:trials:29 - Trial = 16401/30000 | Total reward = 31.05
2022-01-26 14:17:45.253 | DEBUG    | __main__:trials:24 - Trial = 16402/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.254 | DEBUG    | __main__:trials:29 - Trial = 16402/30000 | Total reward = 57.71
2022-01-26 14:17:45.258 | DEBUG    | __main__:trials:24 - Trial = 16403/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.258 | DEBUG    | __main__:trials:29 - Trial = 16403/30000 | Total reward = 36.19
2022-01-26 14:17:45.263 | DEBUG    | __main__:trials:24 - Trial = 16404/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.264 | DEBUG    | __main__:trials:29 - Trial = 16404/30000 | Total reward = 52.37
2022-01-26 14:17:45.268 | DEBUG    | __main__:trials:24 - Trial = 16405/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.270 | DEBUG    | __main__:trials:29 - Trial = 16405/30000 | Total reward = 46.30
2022-01-26 14:17:45.273 | DEBUG    | __main__:trials:24 - Trial = 16406/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.275 | DEBUG    | __main__:trials:29 - Trial = 16406/30000 | Total reward = 56.51
2022-01-26 14:17:45.278 | DEBUG    | __main__:trials:24 - Trial = 16407/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.279 | DEBUG    | __main__:trials:29 - Trial = 16407/30000 | Total reward = 55.31
2022-01-26 14:17:45.283 | DEBUG    | __main__:trials:24 - Trial = 16408/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.283 | DEBUG    | __main__:trials:29 - Trial = 16408/30000 | Total reward = 42.92
2022-01-26 14:17:45.287 | DEBUG    | __main__:trials:24 - Trial = 16409/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.288 | DEBUG    | __main__:trials:29 - Trial = 16409/30000 | Total reward = 41.26
2022-01-26 14:17:45.291 | DEBUG    | __main__:trials:24 - Trial = 16410/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.292 | DEBUG    | __main__:trials:29 - Trial = 16410/30000 | Total reward = 53.98
2022-01-26 14:17:45.295 | DEBUG    | __main__:trials:24 - Trial = 16411/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.297 | DEBUG    | __main__:trials:29 - Trial = 16411/30000 | Total reward = 43.35
2022-01-26 14:17:45.300 | DEBUG    | __main__:trials:24 - Trial = 16412/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.301 | DEBUG    | __main__:trials:29 - Trial = 16412/30000 | Total reward = 38.76
2022-01-26 14:17:45.305 | DEBUG    | __main__:trials:24 - Trial = 16413/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.306 | DEBUG    | __main__:trials:29 - Trial = 16413/30000 | Total reward = 50.27
2022-01-26 14:17:45.310 | DEBUG    | __main__:trials:24 - Trial = 16414/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.311 | DEBUG    | __main__:trials:29 - Trial = 16414/30000 | Total reward = 45.88
2022-01-26 14:17:45.314 | DEBUG    | __main__:trials:24 - Trial = 16415/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.315 | DEBUG    | __main__:trials:29 - Trial = 16415/30000 | Total reward = 44.10
2022-01-26 14:17:45.318 | DEBUG    | __main__:trials:24 - Trial = 16416/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.320 | DEBUG    | __main__:trials:29 - Trial = 16416/30000 | Total reward = 35.44
2022-01-26 14:17:45.323 | DEBUG    | __main__:trials:24 - Trial = 16417/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.324 | DEBUG    | __main__:trials:29 - Trial = 16417/30000 | Total reward = 44.59
2022-01-26 14:17:45.327 | DEBUG    | __main__:trials:24 - Trial = 16418/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.329 | DEBUG    | __main__:trials:29 - Trial = 16418/30000 | Total reward = 37.11
2022-01-26 14:17:45.332 | DEBUG    | __main__:trials:24 - Trial = 16419/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.333 | DEBUG    | __main__:trials:29 - Trial = 16419/30000 | Total reward = 53.33
2022-01-26 14:17:45.337 | DEBUG    | __main__:trials:24 - Trial = 16420/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.338 | DEBUG    | __main__:trials:29 - Trial = 16420/30000 | Total reward = 51.62
2022-01-26 14:17:45.341 | DEBUG    | __main__:trials:24 - Trial = 16421/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.342 | DEBUG    | __main__:trials:29 - Trial = 16421/30000 | Total reward = 51.59
2022-01-26 14:17:45.346 | DEBUG    | __main__:trials:26 - Trial = 16422/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.346 | DEBUG    | __main__:trials:29 - Trial = 16422/30000 | Total reward = 29.57
2022-01-26 14:17:45.350 | DEBUG    | __main__:trials:24 - Trial = 16423/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.351 | DEBUG    | __main__:trials:29 - Trial = 16423/30000 | Total reward = 42.43
2022-01-26 14:17:45.355 | DEBUG    | __main__:trials:24 - Trial = 16424/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.356 | DEBUG    | __main__:trials:29 - Trial = 16424/30000 | Total reward = 41.77
2022-01-26 14:17:45.360 | DEBUG    | __main__:trials:24 - Trial = 16425/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.360 | DEBUG    | __main__:trials:29 - Trial = 16425/30000 | Total reward = 38.80
2022-01-26 14:17:45.365 | DEBUG    | __main__:trials:24 - Trial = 16426/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.366 | DEBUG    | __main__:trials:29 - Trial = 16426/30000 | Total reward = 41.73
2022-01-26 14:17:45.369 | DEBUG    | __main__:trials:24 - Trial = 16427/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.371 | DEBUG    | __main__:trials:29 - Trial = 16427/30000 | Total reward = 44.43
2022-01-26 14:17:45.375 | DEBUG    | __main__:trials:24 - Trial = 16428/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.375 | DEBUG    | __main__:trials:29 - Trial = 16428/30000 | Total reward = 40.03
2022-01-26 14:17:45.380 | DEBUG    | __main__:trials:24 - Trial = 16429/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.381 | DEBUG    | __main__:trials:29 - Trial = 16429/30000 | Total reward = 40.89
2022-01-26 14:17:45.384 | DEBUG    | __main__:trials:24 - Trial = 16430/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.385 | DEBUG    | __main__:trials:29 - Trial = 16430/30000 | Total reward = 36.25
2022-01-26 14:17:45.388 | DEBUG    | __main__:trials:24 - Trial = 16431/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.389 | DEBUG    | __main__:trials:29 - Trial = 16431/30000 | Total reward = 40.37
2022-01-26 14:17:45.392 | DEBUG    | __main__:trials:24 - Trial = 16432/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.393 | DEBUG    | __main__:trials:29 - Trial = 16432/30000 | Total reward = 55.24
2022-01-26 14:17:45.397 | DEBUG    | __main__:trials:24 - Trial = 16433/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.397 | DEBUG    | __main__:trials:29 - Trial = 16433/30000 | Total reward = 46.27
2022-01-26 14:17:45.401 | DEBUG    | __main__:trials:24 - Trial = 16434/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.402 | DEBUG    | __main__:trials:29 - Trial = 16434/30000 | Total reward = 56.02
2022-01-26 14:17:45.405 | DEBUG    | __main__:trials:24 - Trial = 16435/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.406 | DEBUG    | __main__:trials:29 - Trial = 16435/30000 | Total reward = 60.52
2022-01-26 14:17:45.408 | DEBUG    | __main__:trials:26 - Trial = 16436/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.410 | DEBUG    | __main__:trials:29 - Trial = 16436/30000 | Total reward = 19.09
2022-01-26 14:17:45.413 | DEBUG    | __main__:trials:24 - Trial = 16437/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.414 | DEBUG    | __main__:trials:29 - Trial = 16437/30000 | Total reward = 42.20
2022-01-26 14:17:45.417 | DEBUG    | __main__:trials:24 - Trial = 16438/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.417 | DEBUG    | __main__:trials:29 - Trial = 16438/30000 | Total reward = 43.17
2022-01-26 14:17:45.420 | DEBUG    | __main__:trials:24 - Trial = 16439/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.421 | DEBUG    | __main__:trials:29 - Trial = 16439/30000 | Total reward = 64.02
2022-01-26 14:17:45.425 | DEBUG    | __main__:trials:24 - Trial = 16440/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.425 | DEBUG    | __main__:trials:29 - Trial = 16440/30000 | Total reward = 54.23
2022-01-26 14:17:45.429 | DEBUG    | __main__:trials:24 - Trial = 16441/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.430 | DEBUG    | __main__:trials:29 - Trial = 16441/30000 | Total reward = 41.26
2022-01-26 14:17:45.433 | DEBUG    | __main__:trials:24 - Trial = 16442/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.434 | DEBUG    | __main__:trials:29 - Trial = 16442/30000 | Total reward = 35.69
2022-01-26 14:17:45.437 | DEBUG    | __main__:trials:24 - Trial = 16443/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.438 | DEBUG    | __main__:trials:29 - Trial = 16443/30000 | Total reward = 46.62
2022-01-26 14:17:45.441 | DEBUG    | __main__:trials:24 - Trial = 16444/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.443 | DEBUG    | __main__:trials:29 - Trial = 16444/30000 | Total reward = 34.30
2022-01-26 14:17:45.446 | DEBUG    | __main__:trials:24 - Trial = 16445/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.447 | DEBUG    | __main__:trials:29 - Trial = 16445/30000 | Total reward = 56.81
2022-01-26 14:17:45.449 | DEBUG    | __main__:trials:24 - Trial = 16446/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.450 | DEBUG    | __main__:trials:29 - Trial = 16446/30000 | Total reward = 36.89
2022-01-26 14:17:45.454 | DEBUG    | __main__:trials:24 - Trial = 16447/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.456 | DEBUG    | __main__:trials:29 - Trial = 16447/30000 | Total reward = 52.26
2022-01-26 14:17:45.458 | DEBUG    | __main__:trials:24 - Trial = 16448/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.460 | DEBUG    | __main__:trials:29 - Trial = 16448/30000 | Total reward = 63.32
2022-01-26 14:17:45.464 | DEBUG    | __main__:trials:24 - Trial = 16449/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.464 | DEBUG    | __main__:trials:29 - Trial = 16449/30000 | Total reward = 44.10
2022-01-26 14:17:45.467 | DEBUG    | __main__:trials:26 - Trial = 16450/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.469 | DEBUG    | __main__:trials:29 - Trial = 16450/30000 | Total reward = 23.79
2022-01-26 14:17:45.472 | DEBUG    | __main__:trials:24 - Trial = 16451/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.472 | DEBUG    | __main__:trials:29 - Trial = 16451/30000 | Total reward = 42.42
2022-01-26 14:17:45.476 | DEBUG    | __main__:trials:24 - Trial = 16452/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.477 | DEBUG    | __main__:trials:29 - Trial = 16452/30000 | Total reward = 53.82
2022-01-26 14:17:45.480 | DEBUG    | __main__:trials:24 - Trial = 16453/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.482 | DEBUG    | __main__:trials:29 - Trial = 16453/30000 | Total reward = 37.22
2022-01-26 14:17:45.485 | DEBUG    | __main__:trials:24 - Trial = 16454/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.486 | DEBUG    | __main__:trials:29 - Trial = 16454/30000 | Total reward = 49.10
2022-01-26 14:17:45.489 | DEBUG    | __main__:trials:24 - Trial = 16455/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.491 | DEBUG    | __main__:trials:29 - Trial = 16455/30000 | Total reward = 46.01
2022-01-26 14:17:45.493 | DEBUG    | __main__:trials:24 - Trial = 16456/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.494 | DEBUG    | __main__:trials:29 - Trial = 16456/30000 | Total reward = 54.48
2022-01-26 14:17:45.497 | DEBUG    | __main__:trials:24 - Trial = 16457/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.498 | DEBUG    | __main__:trials:29 - Trial = 16457/30000 | Total reward = 42.08
2022-01-26 14:17:45.501 | DEBUG    | __main__:trials:24 - Trial = 16458/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.503 | DEBUG    | __main__:trials:29 - Trial = 16458/30000 | Total reward = 56.43
2022-01-26 14:17:45.506 | DEBUG    | __main__:trials:24 - Trial = 16459/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.508 | DEBUG    | __main__:trials:29 - Trial = 16459/30000 | Total reward = 47.46
2022-01-26 14:17:45.510 | DEBUG    | __main__:trials:24 - Trial = 16460/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.511 | DEBUG    | __main__:trials:29 - Trial = 16460/30000 | Total reward = 36.87
2022-01-26 14:17:45.514 | DEBUG    | __main__:trials:24 - Trial = 16461/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.516 | DEBUG    | __main__:trials:29 - Trial = 16461/30000 | Total reward = 53.58
2022-01-26 14:17:45.519 | DEBUG    | __main__:trials:24 - Trial = 16462/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.521 | DEBUG    | __main__:trials:29 - Trial = 16462/30000 | Total reward = 47.87
2022-01-26 14:17:45.524 | DEBUG    | __main__:trials:24 - Trial = 16463/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.525 | DEBUG    | __main__:trials:29 - Trial = 16463/30000 | Total reward = 40.35
2022-01-26 14:17:45.528 | DEBUG    | __main__:trials:24 - Trial = 16464/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.530 | DEBUG    | __main__:trials:29 - Trial = 16464/30000 | Total reward = 54.83
2022-01-26 14:17:45.533 | DEBUG    | __main__:trials:24 - Trial = 16465/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.535 | DEBUG    | __main__:trials:29 - Trial = 16465/30000 | Total reward = 24.89
2022-01-26 14:17:45.538 | DEBUG    | __main__:trials:24 - Trial = 16466/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.539 | DEBUG    | __main__:trials:29 - Trial = 16466/30000 | Total reward = 62.43
2022-01-26 14:17:45.542 | DEBUG    | __main__:trials:24 - Trial = 16467/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.543 | DEBUG    | __main__:trials:29 - Trial = 16467/30000 | Total reward = 40.43
2022-01-26 14:17:45.546 | DEBUG    | __main__:trials:24 - Trial = 16468/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.548 | DEBUG    | __main__:trials:29 - Trial = 16468/30000 | Total reward = 47.20
2022-01-26 14:17:45.551 | DEBUG    | __main__:trials:24 - Trial = 16469/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.553 | DEBUG    | __main__:trials:29 - Trial = 16469/30000 | Total reward = 46.95
2022-01-26 14:17:45.556 | DEBUG    | __main__:trials:24 - Trial = 16470/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.556 | DEBUG    | __main__:trials:29 - Trial = 16470/30000 | Total reward = 53.64
2022-01-26 14:17:45.559 | DEBUG    | __main__:trials:24 - Trial = 16471/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.561 | DEBUG    | __main__:trials:29 - Trial = 16471/30000 | Total reward = 46.39
2022-01-26 14:17:45.564 | DEBUG    | __main__:trials:24 - Trial = 16472/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.565 | DEBUG    | __main__:trials:29 - Trial = 16472/30000 | Total reward = 45.83
2022-01-26 14:17:45.568 | DEBUG    | __main__:trials:24 - Trial = 16473/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.569 | DEBUG    | __main__:trials:29 - Trial = 16473/30000 | Total reward = 51.57
2022-01-26 14:17:45.573 | DEBUG    | __main__:trials:24 - Trial = 16474/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.573 | DEBUG    | __main__:trials:29 - Trial = 16474/30000 | Total reward = 38.82
2022-01-26 14:17:45.577 | DEBUG    | __main__:trials:24 - Trial = 16475/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.577 | DEBUG    | __main__:trials:29 - Trial = 16475/30000 | Total reward = 51.54
2022-01-26 14:17:45.581 | DEBUG    | __main__:trials:24 - Trial = 16476/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.582 | DEBUG    | __main__:trials:29 - Trial = 16476/30000 | Total reward = 46.39
2022-01-26 14:17:45.585 | DEBUG    | __main__:trials:24 - Trial = 16477/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.587 | DEBUG    | __main__:trials:29 - Trial = 16477/30000 | Total reward = 35.17
2022-01-26 14:17:45.590 | DEBUG    | __main__:trials:24 - Trial = 16478/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.591 | DEBUG    | __main__:trials:29 - Trial = 16478/30000 | Total reward = 49.01
2022-01-26 14:17:45.594 | DEBUG    | __main__:trials:24 - Trial = 16479/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.596 | DEBUG    | __main__:trials:29 - Trial = 16479/30000 | Total reward = 52.88
2022-01-26 14:17:45.598 | DEBUG    | __main__:trials:24 - Trial = 16480/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.600 | DEBUG    | __main__:trials:29 - Trial = 16480/30000 | Total reward = 52.26
2022-01-26 14:17:45.603 | DEBUG    | __main__:trials:24 - Trial = 16481/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.604 | DEBUG    | __main__:trials:29 - Trial = 16481/30000 | Total reward = 51.56
2022-01-26 14:17:45.608 | DEBUG    | __main__:trials:24 - Trial = 16482/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.609 | DEBUG    | __main__:trials:29 - Trial = 16482/30000 | Total reward = 45.56
2022-01-26 14:17:45.612 | DEBUG    | __main__:trials:24 - Trial = 16483/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.613 | DEBUG    | __main__:trials:29 - Trial = 16483/30000 | Total reward = 51.67
2022-01-26 14:17:45.616 | DEBUG    | __main__:trials:24 - Trial = 16484/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.617 | DEBUG    | __main__:trials:29 - Trial = 16484/30000 | Total reward = 41.47
2022-01-26 14:17:45.620 | DEBUG    | __main__:trials:24 - Trial = 16485/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.621 | DEBUG    | __main__:trials:29 - Trial = 16485/30000 | Total reward = 56.66
2022-01-26 14:17:45.624 | DEBUG    | __main__:trials:24 - Trial = 16486/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.625 | DEBUG    | __main__:trials:29 - Trial = 16486/30000 | Total reward = 44.89
2022-01-26 14:17:45.628 | DEBUG    | __main__:trials:24 - Trial = 16487/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.630 | DEBUG    | __main__:trials:29 - Trial = 16487/30000 | Total reward = 32.65
2022-01-26 14:17:45.633 | DEBUG    | __main__:trials:24 - Trial = 16488/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.634 | DEBUG    | __main__:trials:29 - Trial = 16488/30000 | Total reward = 36.69
2022-01-26 14:17:45.637 | DEBUG    | __main__:trials:24 - Trial = 16489/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.638 | DEBUG    | __main__:trials:29 - Trial = 16489/30000 | Total reward = 63.17
2022-01-26 14:17:45.641 | DEBUG    | __main__:trials:24 - Trial = 16490/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.642 | DEBUG    | __main__:trials:29 - Trial = 16490/30000 | Total reward = 38.47
2022-01-26 14:17:45.645 | DEBUG    | __main__:trials:24 - Trial = 16491/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.646 | DEBUG    | __main__:trials:29 - Trial = 16491/30000 | Total reward = 43.32
2022-01-26 14:17:45.650 | DEBUG    | __main__:trials:24 - Trial = 16492/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.650 | DEBUG    | __main__:trials:29 - Trial = 16492/30000 | Total reward = 39.24
2022-01-26 14:17:45.653 | DEBUG    | __main__:trials:24 - Trial = 16493/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.655 | DEBUG    | __main__:trials:29 - Trial = 16493/30000 | Total reward = 46.00
2022-01-26 14:17:45.658 | DEBUG    | __main__:trials:24 - Trial = 16494/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.660 | DEBUG    | __main__:trials:29 - Trial = 16494/30000 | Total reward = 38.53
2022-01-26 14:17:45.663 | DEBUG    | __main__:trials:24 - Trial = 16495/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.664 | DEBUG    | __main__:trials:29 - Trial = 16495/30000 | Total reward = 40.89
2022-01-26 14:17:45.668 | DEBUG    | __main__:trials:24 - Trial = 16496/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.668 | DEBUG    | __main__:trials:29 - Trial = 16496/30000 | Total reward = 64.39
2022-01-26 14:17:45.672 | DEBUG    | __main__:trials:24 - Trial = 16497/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.673 | DEBUG    | __main__:trials:29 - Trial = 16497/30000 | Total reward = 39.03
2022-01-26 14:17:45.676 | DEBUG    | __main__:trials:24 - Trial = 16498/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.677 | DEBUG    | __main__:trials:29 - Trial = 16498/30000 | Total reward = 54.00
2022-01-26 14:17:45.680 | DEBUG    | __main__:trials:24 - Trial = 16499/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.681 | DEBUG    | __main__:trials:29 - Trial = 16499/30000 | Total reward = 47.75
2022-01-26 14:17:45.684 | DEBUG    | __main__:trials:24 - Trial = 16500/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.685 | DEBUG    | __main__:trials:29 - Trial = 16500/30000 | Total reward = 47.29
2022-01-26 14:17:45.688 | DEBUG    | __main__:trials:24 - Trial = 16501/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.689 | DEBUG    | __main__:trials:29 - Trial = 16501/30000 | Total reward = 46.78
2022-01-26 14:17:45.692 | DEBUG    | __main__:trials:24 - Trial = 16502/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.694 | DEBUG    | __main__:trials:29 - Trial = 16502/30000 | Total reward = 46.75
2022-01-26 14:17:45.697 | DEBUG    | __main__:trials:26 - Trial = 16503/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.698 | DEBUG    | __main__:trials:29 - Trial = 16503/30000 | Total reward = 34.79
2022-01-26 14:17:45.702 | DEBUG    | __main__:trials:24 - Trial = 16504/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.703 | DEBUG    | __main__:trials:29 - Trial = 16504/30000 | Total reward = 42.68
2022-01-26 14:17:45.707 | DEBUG    | __main__:trials:24 - Trial = 16505/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.707 | DEBUG    | __main__:trials:29 - Trial = 16505/30000 | Total reward = 32.65
2022-01-26 14:17:45.710 | DEBUG    | __main__:trials:26 - Trial = 16506/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:45.712 | DEBUG    | __main__:trials:29 - Trial = 16506/30000 | Total reward = 19.74
2022-01-26 14:17:45.715 | DEBUG    | __main__:trials:24 - Trial = 16507/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.717 | DEBUG    | __main__:trials:29 - Trial = 16507/30000 | Total reward = 45.10
2022-01-26 14:17:45.720 | DEBUG    | __main__:trials:24 - Trial = 16508/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.721 | DEBUG    | __main__:trials:29 - Trial = 16508/30000 | Total reward = 42.48
2022-01-26 14:17:45.725 | DEBUG    | __main__:trials:24 - Trial = 16509/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.726 | DEBUG    | __main__:trials:29 - Trial = 16509/30000 | Total reward = 45.63
2022-01-26 14:17:45.730 | DEBUG    | __main__:trials:24 - Trial = 16510/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.732 | DEBUG    | __main__:trials:29 - Trial = 16510/30000 | Total reward = 53.02
2022-01-26 14:17:45.735 | DEBUG    | __main__:trials:24 - Trial = 16511/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.737 | DEBUG    | __main__:trials:29 - Trial = 16511/30000 | Total reward = 39.62
2022-01-26 14:17:45.740 | DEBUG    | __main__:trials:24 - Trial = 16512/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.741 | DEBUG    | __main__:trials:29 - Trial = 16512/30000 | Total reward = 64.96
2022-01-26 14:17:45.745 | DEBUG    | __main__:trials:24 - Trial = 16513/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.746 | DEBUG    | __main__:trials:29 - Trial = 16513/30000 | Total reward = 52.57
2022-01-26 14:17:45.749 | DEBUG    | __main__:trials:24 - Trial = 16514/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.750 | DEBUG    | __main__:trials:29 - Trial = 16514/30000 | Total reward = 46.39
2022-01-26 14:17:45.753 | DEBUG    | __main__:trials:24 - Trial = 16515/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.754 | DEBUG    | __main__:trials:29 - Trial = 16515/30000 | Total reward = 32.18
2022-01-26 14:17:45.757 | DEBUG    | __main__:trials:24 - Trial = 16516/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.759 | DEBUG    | __main__:trials:29 - Trial = 16516/30000 | Total reward = 36.42
2022-01-26 14:17:45.761 | DEBUG    | __main__:trials:24 - Trial = 16517/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.763 | DEBUG    | __main__:trials:29 - Trial = 16517/30000 | Total reward = 30.19
2022-01-26 14:17:45.766 | DEBUG    | __main__:trials:24 - Trial = 16518/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.768 | DEBUG    | __main__:trials:29 - Trial = 16518/30000 | Total reward = 51.27
2022-01-26 14:17:45.771 | DEBUG    | __main__:trials:24 - Trial = 16519/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.772 | DEBUG    | __main__:trials:29 - Trial = 16519/30000 | Total reward = 56.29
2022-01-26 14:17:45.776 | DEBUG    | __main__:trials:24 - Trial = 16520/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.777 | DEBUG    | __main__:trials:29 - Trial = 16520/30000 | Total reward = 51.75
2022-01-26 14:17:45.780 | DEBUG    | __main__:trials:24 - Trial = 16521/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.781 | DEBUG    | __main__:trials:29 - Trial = 16521/30000 | Total reward = 40.13
2022-01-26 14:17:45.784 | DEBUG    | __main__:trials:24 - Trial = 16522/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.786 | DEBUG    | __main__:trials:29 - Trial = 16522/30000 | Total reward = 55.71
2022-01-26 14:17:45.790 | DEBUG    | __main__:trials:24 - Trial = 16523/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.792 | DEBUG    | __main__:trials:29 - Trial = 16523/30000 | Total reward = 53.25
2022-01-26 14:17:45.795 | DEBUG    | __main__:trials:24 - Trial = 16524/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.797 | DEBUG    | __main__:trials:29 - Trial = 16524/30000 | Total reward = 52.84
2022-01-26 14:17:45.800 | DEBUG    | __main__:trials:24 - Trial = 16525/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.801 | DEBUG    | __main__:trials:29 - Trial = 16525/30000 | Total reward = 61.17
2022-01-26 14:17:45.805 | DEBUG    | __main__:trials:24 - Trial = 16526/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.807 | DEBUG    | __main__:trials:29 - Trial = 16526/30000 | Total reward = 40.93
2022-01-26 14:17:45.810 | DEBUG    | __main__:trials:24 - Trial = 16527/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.811 | DEBUG    | __main__:trials:29 - Trial = 16527/30000 | Total reward = 26.46
2022-01-26 14:17:45.815 | DEBUG    | __main__:trials:24 - Trial = 16528/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.815 | DEBUG    | __main__:trials:29 - Trial = 16528/30000 | Total reward = 45.90
2022-01-26 14:17:45.819 | DEBUG    | __main__:trials:24 - Trial = 16529/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.820 | DEBUG    | __main__:trials:29 - Trial = 16529/30000 | Total reward = 46.30
2022-01-26 14:17:45.823 | DEBUG    | __main__:trials:24 - Trial = 16530/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.824 | DEBUG    | __main__:trials:29 - Trial = 16530/30000 | Total reward = 47.30
2022-01-26 14:17:45.827 | DEBUG    | __main__:trials:24 - Trial = 16531/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.829 | DEBUG    | __main__:trials:29 - Trial = 16531/30000 | Total reward = 38.65
2022-01-26 14:17:45.832 | DEBUG    | __main__:trials:24 - Trial = 16532/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.834 | DEBUG    | __main__:trials:29 - Trial = 16532/30000 | Total reward = 33.71
2022-01-26 14:17:45.838 | DEBUG    | __main__:trials:24 - Trial = 16533/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.839 | DEBUG    | __main__:trials:29 - Trial = 16533/30000 | Total reward = 65.72
2022-01-26 14:17:45.843 | DEBUG    | __main__:trials:24 - Trial = 16534/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.844 | DEBUG    | __main__:trials:29 - Trial = 16534/30000 | Total reward = 42.59
2022-01-26 14:17:45.848 | DEBUG    | __main__:trials:24 - Trial = 16535/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.850 | DEBUG    | __main__:trials:29 - Trial = 16535/30000 | Total reward = 53.15
2022-01-26 14:17:45.853 | DEBUG    | __main__:trials:24 - Trial = 16536/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.855 | DEBUG    | __main__:trials:29 - Trial = 16536/30000 | Total reward = 44.38
2022-01-26 14:17:45.858 | DEBUG    | __main__:trials:24 - Trial = 16537/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.860 | DEBUG    | __main__:trials:29 - Trial = 16537/30000 | Total reward = 46.72
2022-01-26 14:17:45.863 | DEBUG    | __main__:trials:24 - Trial = 16538/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.865 | DEBUG    | __main__:trials:29 - Trial = 16538/30000 | Total reward = 47.16
2022-01-26 14:17:45.868 | DEBUG    | __main__:trials:24 - Trial = 16539/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.869 | DEBUG    | __main__:trials:29 - Trial = 16539/30000 | Total reward = 54.46
2022-01-26 14:17:45.873 | DEBUG    | __main__:trials:24 - Trial = 16540/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.875 | DEBUG    | __main__:trials:29 - Trial = 16540/30000 | Total reward = 48.36
2022-01-26 14:17:45.877 | DEBUG    | __main__:trials:24 - Trial = 16541/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.879 | DEBUG    | __main__:trials:29 - Trial = 16541/30000 | Total reward = 36.67
2022-01-26 14:17:45.883 | DEBUG    | __main__:trials:24 - Trial = 16542/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.884 | DEBUG    | __main__:trials:29 - Trial = 16542/30000 | Total reward = 42.29
2022-01-26 14:17:45.888 | DEBUG    | __main__:trials:24 - Trial = 16543/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.889 | DEBUG    | __main__:trials:29 - Trial = 16543/30000 | Total reward = 43.83
2022-01-26 14:17:45.893 | DEBUG    | __main__:trials:24 - Trial = 16544/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.894 | DEBUG    | __main__:trials:29 - Trial = 16544/30000 | Total reward = 36.08
2022-01-26 14:17:45.898 | DEBUG    | __main__:trials:24 - Trial = 16545/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.899 | DEBUG    | __main__:trials:29 - Trial = 16545/30000 | Total reward = 42.94
2022-01-26 14:17:45.903 | DEBUG    | __main__:trials:24 - Trial = 16546/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.904 | DEBUG    | __main__:trials:29 - Trial = 16546/30000 | Total reward = 55.26
2022-01-26 14:17:45.908 | DEBUG    | __main__:trials:24 - Trial = 16547/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.909 | DEBUG    | __main__:trials:29 - Trial = 16547/30000 | Total reward = 50.46
2022-01-26 14:17:45.913 | DEBUG    | __main__:trials:24 - Trial = 16548/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.915 | DEBUG    | __main__:trials:29 - Trial = 16548/30000 | Total reward = 38.31
2022-01-26 14:17:45.918 | DEBUG    | __main__:trials:24 - Trial = 16549/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.920 | DEBUG    | __main__:trials:29 - Trial = 16549/30000 | Total reward = 52.07
2022-01-26 14:17:45.922 | DEBUG    | __main__:trials:24 - Trial = 16550/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.924 | DEBUG    | __main__:trials:29 - Trial = 16550/30000 | Total reward = 49.78
2022-01-26 14:17:45.928 | DEBUG    | __main__:trials:24 - Trial = 16551/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.929 | DEBUG    | __main__:trials:29 - Trial = 16551/30000 | Total reward = 48.95
2022-01-26 14:17:45.933 | DEBUG    | __main__:trials:24 - Trial = 16552/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.934 | DEBUG    | __main__:trials:29 - Trial = 16552/30000 | Total reward = 42.55
2022-01-26 14:17:45.938 | DEBUG    | __main__:trials:24 - Trial = 16553/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.939 | DEBUG    | __main__:trials:29 - Trial = 16553/30000 | Total reward = 41.99
2022-01-26 14:17:45.943 | DEBUG    | __main__:trials:24 - Trial = 16554/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.944 | DEBUG    | __main__:trials:29 - Trial = 16554/30000 | Total reward = 45.38
2022-01-26 14:17:45.948 | DEBUG    | __main__:trials:24 - Trial = 16555/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.949 | DEBUG    | __main__:trials:29 - Trial = 16555/30000 | Total reward = 61.72
2022-01-26 14:17:45.953 | DEBUG    | __main__:trials:24 - Trial = 16556/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.955 | DEBUG    | __main__:trials:29 - Trial = 16556/30000 | Total reward = 50.70
2022-01-26 14:17:45.959 | DEBUG    | __main__:trials:24 - Trial = 16557/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.960 | DEBUG    | __main__:trials:29 - Trial = 16557/30000 | Total reward = 40.25
2022-01-26 14:17:45.964 | DEBUG    | __main__:trials:24 - Trial = 16558/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.965 | DEBUG    | __main__:trials:29 - Trial = 16558/30000 | Total reward = 33.06
2022-01-26 14:17:45.969 | DEBUG    | __main__:trials:24 - Trial = 16559/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.969 | DEBUG    | __main__:trials:29 - Trial = 16559/30000 | Total reward = 30.84
2022-01-26 14:17:45.973 | DEBUG    | __main__:trials:24 - Trial = 16560/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.974 | DEBUG    | __main__:trials:29 - Trial = 16560/30000 | Total reward = 44.71
2022-01-26 14:17:45.978 | DEBUG    | __main__:trials:24 - Trial = 16561/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.979 | DEBUG    | __main__:trials:29 - Trial = 16561/30000 | Total reward = 41.81
2022-01-26 14:17:45.983 | DEBUG    | __main__:trials:24 - Trial = 16562/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.984 | DEBUG    | __main__:trials:29 - Trial = 16562/30000 | Total reward = 46.92
2022-01-26 14:17:45.988 | DEBUG    | __main__:trials:24 - Trial = 16563/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.989 | DEBUG    | __main__:trials:29 - Trial = 16563/30000 | Total reward = 50.21
2022-01-26 14:17:45.992 | DEBUG    | __main__:trials:24 - Trial = 16564/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.994 | DEBUG    | __main__:trials:29 - Trial = 16564/30000 | Total reward = 51.58
2022-01-26 14:17:45.997 | DEBUG    | __main__:trials:24 - Trial = 16565/30000 | Max number of steps (20) reached
2022-01-26 14:17:45.999 | DEBUG    | __main__:trials:29 - Trial = 16565/30000 | Total reward = 38.63
2022-01-26 14:17:46.002 | DEBUG    | __main__:trials:24 - Trial = 16566/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.004 | DEBUG    | __main__:trials:29 - Trial = 16566/30000 | Total reward = 37.38
2022-01-26 14:17:46.007 | DEBUG    | __main__:trials:24 - Trial = 16567/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.009 | DEBUG    | __main__:trials:29 - Trial = 16567/30000 | Total reward = 46.92
2022-01-26 14:17:46.013 | DEBUG    | __main__:trials:24 - Trial = 16568/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.014 | DEBUG    | __main__:trials:29 - Trial = 16568/30000 | Total reward = 39.74
2022-01-26 14:17:46.017 | DEBUG    | __main__:trials:24 - Trial = 16569/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.018 | DEBUG    | __main__:trials:29 - Trial = 16569/30000 | Total reward = 23.46
2022-01-26 14:17:46.021 | DEBUG    | __main__:trials:24 - Trial = 16570/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.023 | DEBUG    | __main__:trials:29 - Trial = 16570/30000 | Total reward = 27.26
2022-01-26 14:17:46.025 | DEBUG    | __main__:trials:24 - Trial = 16571/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.027 | DEBUG    | __main__:trials:29 - Trial = 16571/30000 | Total reward = 40.65
2022-01-26 14:17:46.030 | DEBUG    | __main__:trials:24 - Trial = 16572/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.031 | DEBUG    | __main__:trials:29 - Trial = 16572/30000 | Total reward = 47.29
2022-01-26 14:17:46.034 | DEBUG    | __main__:trials:24 - Trial = 16573/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.035 | DEBUG    | __main__:trials:29 - Trial = 16573/30000 | Total reward = 40.56
2022-01-26 14:17:46.040 | DEBUG    | __main__:trials:24 - Trial = 16574/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.040 | DEBUG    | __main__:trials:29 - Trial = 16574/30000 | Total reward = 46.18
2022-01-26 14:17:46.045 | DEBUG    | __main__:trials:24 - Trial = 16575/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.046 | DEBUG    | __main__:trials:29 - Trial = 16575/30000 | Total reward = 41.83
2022-01-26 14:17:46.050 | DEBUG    | __main__:trials:24 - Trial = 16576/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.051 | DEBUG    | __main__:trials:29 - Trial = 16576/30000 | Total reward = 51.48
2022-01-26 14:17:46.055 | DEBUG    | __main__:trials:24 - Trial = 16577/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.057 | DEBUG    | __main__:trials:29 - Trial = 16577/30000 | Total reward = 50.43
2022-01-26 14:17:46.059 | DEBUG    | __main__:trials:26 - Trial = 16578/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.061 | DEBUG    | __main__:trials:29 - Trial = 16578/30000 | Total reward = 18.09
2022-01-26 14:17:46.065 | DEBUG    | __main__:trials:24 - Trial = 16579/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.066 | DEBUG    | __main__:trials:29 - Trial = 16579/30000 | Total reward = 51.32
2022-01-26 14:17:46.070 | DEBUG    | __main__:trials:24 - Trial = 16580/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.071 | DEBUG    | __main__:trials:29 - Trial = 16580/30000 | Total reward = 45.70
2022-01-26 14:17:46.074 | DEBUG    | __main__:trials:24 - Trial = 16581/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.076 | DEBUG    | __main__:trials:29 - Trial = 16581/30000 | Total reward = 38.16
2022-01-26 14:17:46.079 | DEBUG    | __main__:trials:24 - Trial = 16582/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.080 | DEBUG    | __main__:trials:29 - Trial = 16582/30000 | Total reward = 47.06
2022-01-26 14:17:46.084 | DEBUG    | __main__:trials:24 - Trial = 16583/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.085 | DEBUG    | __main__:trials:29 - Trial = 16583/30000 | Total reward = 65.65
2022-01-26 14:17:46.088 | DEBUG    | __main__:trials:24 - Trial = 16584/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.089 | DEBUG    | __main__:trials:29 - Trial = 16584/30000 | Total reward = 57.61
2022-01-26 14:17:46.092 | DEBUG    | __main__:trials:24 - Trial = 16585/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.094 | DEBUG    | __main__:trials:29 - Trial = 16585/30000 | Total reward = 55.82
2022-01-26 14:17:46.097 | DEBUG    | __main__:trials:24 - Trial = 16586/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.098 | DEBUG    | __main__:trials:29 - Trial = 16586/30000 | Total reward = 52.86
2022-01-26 14:17:46.102 | DEBUG    | __main__:trials:24 - Trial = 16587/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.103 | DEBUG    | __main__:trials:29 - Trial = 16587/30000 | Total reward = 47.19
2022-01-26 14:17:46.107 | DEBUG    | __main__:trials:24 - Trial = 16588/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.108 | DEBUG    | __main__:trials:29 - Trial = 16588/30000 | Total reward = 41.04
2022-01-26 14:17:46.112 | DEBUG    | __main__:trials:24 - Trial = 16589/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.113 | DEBUG    | __main__:trials:29 - Trial = 16589/30000 | Total reward = 42.53
2022-01-26 14:17:46.117 | DEBUG    | __main__:trials:24 - Trial = 16590/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.118 | DEBUG    | __main__:trials:29 - Trial = 16590/30000 | Total reward = 53.31
2022-01-26 14:17:46.122 | DEBUG    | __main__:trials:24 - Trial = 16591/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.123 | DEBUG    | __main__:trials:29 - Trial = 16591/30000 | Total reward = 51.10
2022-01-26 14:17:46.127 | DEBUG    | __main__:trials:24 - Trial = 16592/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.127 | DEBUG    | __main__:trials:29 - Trial = 16592/30000 | Total reward = 49.67
2022-01-26 14:17:46.131 | DEBUG    | __main__:trials:24 - Trial = 16593/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.133 | DEBUG    | __main__:trials:29 - Trial = 16593/30000 | Total reward = 62.02
2022-01-26 14:17:46.136 | DEBUG    | __main__:trials:24 - Trial = 16594/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.137 | DEBUG    | __main__:trials:29 - Trial = 16594/30000 | Total reward = 40.20
2022-01-26 14:17:46.142 | DEBUG    | __main__:trials:24 - Trial = 16595/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.142 | DEBUG    | __main__:trials:29 - Trial = 16595/30000 | Total reward = 31.73
2022-01-26 14:17:46.146 | DEBUG    | __main__:trials:24 - Trial = 16596/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.147 | DEBUG    | __main__:trials:29 - Trial = 16596/30000 | Total reward = 55.98
2022-01-26 14:17:46.151 | DEBUG    | __main__:trials:24 - Trial = 16597/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.152 | DEBUG    | __main__:trials:29 - Trial = 16597/30000 | Total reward = 40.95
2022-01-26 14:17:46.156 | DEBUG    | __main__:trials:24 - Trial = 16598/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.157 | DEBUG    | __main__:trials:29 - Trial = 16598/30000 | Total reward = 34.07
2022-01-26 14:17:46.160 | DEBUG    | __main__:trials:24 - Trial = 16599/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.162 | DEBUG    | __main__:trials:29 - Trial = 16599/30000 | Total reward = 39.56
2022-01-26 14:17:46.165 | DEBUG    | __main__:trials:24 - Trial = 16600/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.166 | DEBUG    | __main__:trials:29 - Trial = 16600/30000 | Total reward = 46.63
2022-01-26 14:17:46.169 | DEBUG    | __main__:trials:24 - Trial = 16601/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.170 | DEBUG    | __main__:trials:29 - Trial = 16601/30000 | Total reward = 35.54
2022-01-26 14:17:46.173 | DEBUG    | __main__:trials:24 - Trial = 16602/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.175 | DEBUG    | __main__:trials:29 - Trial = 16602/30000 | Total reward = 52.96
2022-01-26 14:17:46.178 | DEBUG    | __main__:trials:24 - Trial = 16603/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.179 | DEBUG    | __main__:trials:29 - Trial = 16603/30000 | Total reward = 53.06
2022-01-26 14:17:46.183 | DEBUG    | __main__:trials:24 - Trial = 16604/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.185 | DEBUG    | __main__:trials:29 - Trial = 16604/30000 | Total reward = 57.43
2022-01-26 14:17:46.188 | DEBUG    | __main__:trials:24 - Trial = 16605/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.190 | DEBUG    | __main__:trials:29 - Trial = 16605/30000 | Total reward = 44.27
2022-01-26 14:17:46.193 | DEBUG    | __main__:trials:24 - Trial = 16606/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.195 | DEBUG    | __main__:trials:29 - Trial = 16606/30000 | Total reward = 43.51
2022-01-26 14:17:46.198 | DEBUG    | __main__:trials:24 - Trial = 16607/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.199 | DEBUG    | __main__:trials:29 - Trial = 16607/30000 | Total reward = 45.84
2022-01-26 14:17:46.203 | DEBUG    | __main__:trials:24 - Trial = 16608/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.205 | DEBUG    | __main__:trials:29 - Trial = 16608/30000 | Total reward = 52.10
2022-01-26 14:17:46.208 | DEBUG    | __main__:trials:24 - Trial = 16609/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.210 | DEBUG    | __main__:trials:29 - Trial = 16609/30000 | Total reward = 38.85
2022-01-26 14:17:46.213 | DEBUG    | __main__:trials:24 - Trial = 16610/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.214 | DEBUG    | __main__:trials:29 - Trial = 16610/30000 | Total reward = 53.35
2022-01-26 14:17:46.217 | DEBUG    | __main__:trials:24 - Trial = 16611/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.219 | DEBUG    | __main__:trials:29 - Trial = 16611/30000 | Total reward = 43.87
2022-01-26 14:17:46.222 | DEBUG    | __main__:trials:24 - Trial = 16612/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.223 | DEBUG    | __main__:trials:29 - Trial = 16612/30000 | Total reward = 41.29
2022-01-26 14:17:46.227 | DEBUG    | __main__:trials:24 - Trial = 16613/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.229 | DEBUG    | __main__:trials:29 - Trial = 16613/30000 | Total reward = 43.29
2022-01-26 14:17:46.231 | DEBUG    | __main__:trials:24 - Trial = 16614/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.233 | DEBUG    | __main__:trials:29 - Trial = 16614/30000 | Total reward = 56.46
2022-01-26 14:17:46.236 | DEBUG    | __main__:trials:24 - Trial = 16615/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.238 | DEBUG    | __main__:trials:29 - Trial = 16615/30000 | Total reward = 38.44
2022-01-26 14:17:46.242 | DEBUG    | __main__:trials:24 - Trial = 16616/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.243 | DEBUG    | __main__:trials:29 - Trial = 16616/30000 | Total reward = 53.35
2022-01-26 14:17:46.247 | DEBUG    | __main__:trials:24 - Trial = 16617/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.248 | DEBUG    | __main__:trials:29 - Trial = 16617/30000 | Total reward = 54.49
2022-01-26 14:17:46.251 | DEBUG    | __main__:trials:24 - Trial = 16618/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.253 | DEBUG    | __main__:trials:29 - Trial = 16618/30000 | Total reward = 39.62
2022-01-26 14:17:46.256 | DEBUG    | __main__:trials:24 - Trial = 16619/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.257 | DEBUG    | __main__:trials:29 - Trial = 16619/30000 | Total reward = 40.44
2022-01-26 14:17:46.261 | DEBUG    | __main__:trials:24 - Trial = 16620/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.263 | DEBUG    | __main__:trials:29 - Trial = 16620/30000 | Total reward = 39.71
2022-01-26 14:17:46.266 | DEBUG    | __main__:trials:24 - Trial = 16621/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.267 | DEBUG    | __main__:trials:29 - Trial = 16621/30000 | Total reward = 46.65
2022-01-26 14:17:46.271 | DEBUG    | __main__:trials:24 - Trial = 16622/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.272 | DEBUG    | __main__:trials:29 - Trial = 16622/30000 | Total reward = 59.00
2022-01-26 14:17:46.278 | DEBUG    | __main__:trials:24 - Trial = 16623/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.280 | DEBUG    | __main__:trials:29 - Trial = 16623/30000 | Total reward = 42.21
2022-01-26 14:17:46.283 | DEBUG    | __main__:trials:24 - Trial = 16624/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.285 | DEBUG    | __main__:trials:29 - Trial = 16624/30000 | Total reward = 51.78
2022-01-26 14:17:46.288 | DEBUG    | __main__:trials:26 - Trial = 16625/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.289 | DEBUG    | __main__:trials:29 - Trial = 16625/30000 | Total reward = 25.19
2022-01-26 14:17:46.293 | DEBUG    | __main__:trials:24 - Trial = 16626/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.294 | DEBUG    | __main__:trials:29 - Trial = 16626/30000 | Total reward = 46.78
2022-01-26 14:17:46.298 | DEBUG    | __main__:trials:24 - Trial = 16627/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.300 | DEBUG    | __main__:trials:29 - Trial = 16627/30000 | Total reward = 46.91
2022-01-26 14:17:46.303 | DEBUG    | __main__:trials:24 - Trial = 16628/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.305 | DEBUG    | __main__:trials:29 - Trial = 16628/30000 | Total reward = 57.41
2022-01-26 14:17:46.309 | DEBUG    | __main__:trials:24 - Trial = 16629/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.310 | DEBUG    | __main__:trials:29 - Trial = 16629/30000 | Total reward = 28.72
2022-01-26 14:17:46.313 | DEBUG    | __main__:trials:24 - Trial = 16630/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.315 | DEBUG    | __main__:trials:29 - Trial = 16630/30000 | Total reward = 34.96
2022-01-26 14:17:46.319 | DEBUG    | __main__:trials:24 - Trial = 16631/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.320 | DEBUG    | __main__:trials:29 - Trial = 16631/30000 | Total reward = 42.49
2022-01-26 14:17:46.323 | DEBUG    | __main__:trials:24 - Trial = 16632/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.324 | DEBUG    | __main__:trials:29 - Trial = 16632/30000 | Total reward = 48.87
2022-01-26 14:17:46.327 | DEBUG    | __main__:trials:24 - Trial = 16633/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.329 | DEBUG    | __main__:trials:29 - Trial = 16633/30000 | Total reward = 61.18
2022-01-26 14:17:46.332 | DEBUG    | __main__:trials:24 - Trial = 16634/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.334 | DEBUG    | __main__:trials:29 - Trial = 16634/30000 | Total reward = 37.17
2022-01-26 14:17:46.338 | DEBUG    | __main__:trials:24 - Trial = 16635/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.339 | DEBUG    | __main__:trials:29 - Trial = 16635/30000 | Total reward = 47.55
2022-01-26 14:17:46.342 | DEBUG    | __main__:trials:26 - Trial = 16636/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.344 | DEBUG    | __main__:trials:29 - Trial = 16636/30000 | Total reward = 20.23
2022-01-26 14:17:46.347 | DEBUG    | __main__:trials:24 - Trial = 16637/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.349 | DEBUG    | __main__:trials:29 - Trial = 16637/30000 | Total reward = 45.48
2022-01-26 14:17:46.351 | DEBUG    | __main__:trials:26 - Trial = 16638/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.353 | DEBUG    | __main__:trials:29 - Trial = 16638/30000 | Total reward = 12.92
2022-01-26 14:17:46.356 | DEBUG    | __main__:trials:24 - Trial = 16639/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.357 | DEBUG    | __main__:trials:29 - Trial = 16639/30000 | Total reward = 36.90
2022-01-26 14:17:46.361 | DEBUG    | __main__:trials:24 - Trial = 16640/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.361 | DEBUG    | __main__:trials:29 - Trial = 16640/30000 | Total reward = 54.05
2022-01-26 14:17:46.365 | DEBUG    | __main__:trials:24 - Trial = 16641/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.365 | DEBUG    | __main__:trials:29 - Trial = 16641/30000 | Total reward = 51.39
2022-01-26 14:17:46.369 | DEBUG    | __main__:trials:24 - Trial = 16642/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.371 | DEBUG    | __main__:trials:29 - Trial = 16642/30000 | Total reward = 35.11
2022-01-26 14:17:46.374 | DEBUG    | __main__:trials:24 - Trial = 16643/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.376 | DEBUG    | __main__:trials:29 - Trial = 16643/30000 | Total reward = 42.70
2022-01-26 14:17:46.379 | DEBUG    | __main__:trials:24 - Trial = 16644/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.380 | DEBUG    | __main__:trials:29 - Trial = 16644/30000 | Total reward = 61.24
2022-01-26 14:17:46.384 | DEBUG    | __main__:trials:24 - Trial = 16645/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.385 | DEBUG    | __main__:trials:29 - Trial = 16645/30000 | Total reward = 48.06
2022-01-26 14:17:46.389 | DEBUG    | __main__:trials:24 - Trial = 16646/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.390 | DEBUG    | __main__:trials:29 - Trial = 16646/30000 | Total reward = 56.48
2022-01-26 14:17:46.394 | DEBUG    | __main__:trials:24 - Trial = 16647/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.395 | DEBUG    | __main__:trials:29 - Trial = 16647/30000 | Total reward = 41.25
2022-01-26 14:17:46.398 | DEBUG    | __main__:trials:24 - Trial = 16648/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.400 | DEBUG    | __main__:trials:29 - Trial = 16648/30000 | Total reward = 45.28
2022-01-26 14:17:46.404 | DEBUG    | __main__:trials:24 - Trial = 16649/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.405 | DEBUG    | __main__:trials:29 - Trial = 16649/30000 | Total reward = 54.69
2022-01-26 14:17:46.409 | DEBUG    | __main__:trials:24 - Trial = 16650/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.410 | DEBUG    | __main__:trials:29 - Trial = 16650/30000 | Total reward = 40.45
2022-01-26 14:17:46.414 | DEBUG    | __main__:trials:24 - Trial = 16651/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.415 | DEBUG    | __main__:trials:29 - Trial = 16651/30000 | Total reward = 58.89
2022-01-26 14:17:46.419 | DEBUG    | __main__:trials:24 - Trial = 16652/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.420 | DEBUG    | __main__:trials:29 - Trial = 16652/30000 | Total reward = 33.85
2022-01-26 14:17:46.425 | DEBUG    | __main__:trials:24 - Trial = 16653/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.426 | DEBUG    | __main__:trials:29 - Trial = 16653/30000 | Total reward = 42.26
2022-01-26 14:17:46.430 | DEBUG    | __main__:trials:24 - Trial = 16654/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.431 | DEBUG    | __main__:trials:29 - Trial = 16654/30000 | Total reward = 37.66
2022-01-26 14:17:46.434 | DEBUG    | __main__:trials:24 - Trial = 16655/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.436 | DEBUG    | __main__:trials:29 - Trial = 16655/30000 | Total reward = 57.84
2022-01-26 14:17:46.440 | DEBUG    | __main__:trials:24 - Trial = 16656/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.442 | DEBUG    | __main__:trials:29 - Trial = 16656/30000 | Total reward = 49.71
2022-01-26 14:17:46.444 | DEBUG    | __main__:trials:24 - Trial = 16657/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.446 | DEBUG    | __main__:trials:29 - Trial = 16657/30000 | Total reward = 45.77
2022-01-26 14:17:46.449 | DEBUG    | __main__:trials:24 - Trial = 16658/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.451 | DEBUG    | __main__:trials:29 - Trial = 16658/30000 | Total reward = 38.56
2022-01-26 14:17:46.455 | DEBUG    | __main__:trials:24 - Trial = 16659/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.457 | DEBUG    | __main__:trials:29 - Trial = 16659/30000 | Total reward = 40.66
2022-01-26 14:17:46.460 | DEBUG    | __main__:trials:24 - Trial = 16660/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.462 | DEBUG    | __main__:trials:29 - Trial = 16660/30000 | Total reward = 50.92
2022-01-26 14:17:46.465 | DEBUG    | __main__:trials:24 - Trial = 16661/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.466 | DEBUG    | __main__:trials:29 - Trial = 16661/30000 | Total reward = 41.49
2022-01-26 14:17:46.470 | DEBUG    | __main__:trials:24 - Trial = 16662/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.472 | DEBUG    | __main__:trials:29 - Trial = 16662/30000 | Total reward = 51.57
2022-01-26 14:17:46.476 | DEBUG    | __main__:trials:24 - Trial = 16663/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.478 | DEBUG    | __main__:trials:29 - Trial = 16663/30000 | Total reward = 38.36
2022-01-26 14:17:46.482 | DEBUG    | __main__:trials:26 - Trial = 16664/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.484 | DEBUG    | __main__:trials:29 - Trial = 16664/30000 | Total reward = 39.78
2022-01-26 14:17:46.488 | DEBUG    | __main__:trials:24 - Trial = 16665/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.489 | DEBUG    | __main__:trials:29 - Trial = 16665/30000 | Total reward = 65.44
2022-01-26 14:17:46.492 | DEBUG    | __main__:trials:24 - Trial = 16666/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.494 | DEBUG    | __main__:trials:29 - Trial = 16666/30000 | Total reward = 38.91
2022-01-26 14:17:46.498 | DEBUG    | __main__:trials:24 - Trial = 16667/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.499 | DEBUG    | __main__:trials:29 - Trial = 16667/30000 | Total reward = 38.74
2022-01-26 14:17:46.503 | DEBUG    | __main__:trials:24 - Trial = 16668/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.504 | DEBUG    | __main__:trials:29 - Trial = 16668/30000 | Total reward = 43.25
2022-01-26 14:17:46.508 | DEBUG    | __main__:trials:24 - Trial = 16669/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.510 | DEBUG    | __main__:trials:29 - Trial = 16669/30000 | Total reward = 44.77
2022-01-26 14:17:46.513 | DEBUG    | __main__:trials:24 - Trial = 16670/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.514 | DEBUG    | __main__:trials:29 - Trial = 16670/30000 | Total reward = 40.38
2022-01-26 14:17:46.518 | DEBUG    | __main__:trials:24 - Trial = 16671/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.520 | DEBUG    | __main__:trials:29 - Trial = 16671/30000 | Total reward = 46.09
2022-01-26 14:17:46.523 | DEBUG    | __main__:trials:24 - Trial = 16672/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.525 | DEBUG    | __main__:trials:29 - Trial = 16672/30000 | Total reward = 46.00
2022-01-26 14:17:46.528 | DEBUG    | __main__:trials:24 - Trial = 16673/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.530 | DEBUG    | __main__:trials:29 - Trial = 16673/30000 | Total reward = 41.01
2022-01-26 14:17:46.533 | DEBUG    | __main__:trials:24 - Trial = 16674/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.535 | DEBUG    | __main__:trials:29 - Trial = 16674/30000 | Total reward = 36.43
2022-01-26 14:17:46.539 | DEBUG    | __main__:trials:24 - Trial = 16675/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.540 | DEBUG    | __main__:trials:29 - Trial = 16675/30000 | Total reward = 45.02
2022-01-26 14:17:46.544 | DEBUG    | __main__:trials:24 - Trial = 16676/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.546 | DEBUG    | __main__:trials:29 - Trial = 16676/30000 | Total reward = 38.95
2022-01-26 14:17:46.549 | DEBUG    | __main__:trials:24 - Trial = 16677/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.551 | DEBUG    | __main__:trials:29 - Trial = 16677/30000 | Total reward = 46.44
2022-01-26 14:17:46.555 | DEBUG    | __main__:trials:24 - Trial = 16678/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.556 | DEBUG    | __main__:trials:29 - Trial = 16678/30000 | Total reward = 34.21
2022-01-26 14:17:46.560 | DEBUG    | __main__:trials:24 - Trial = 16679/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.561 | DEBUG    | __main__:trials:29 - Trial = 16679/30000 | Total reward = 56.54
2022-01-26 14:17:46.565 | DEBUG    | __main__:trials:24 - Trial = 16680/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.565 | DEBUG    | __main__:trials:29 - Trial = 16680/30000 | Total reward = 39.01
2022-01-26 14:17:46.568 | DEBUG    | __main__:trials:24 - Trial = 16681/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.570 | DEBUG    | __main__:trials:29 - Trial = 16681/30000 | Total reward = 37.97
2022-01-26 14:17:46.574 | DEBUG    | __main__:trials:24 - Trial = 16682/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.575 | DEBUG    | __main__:trials:29 - Trial = 16682/30000 | Total reward = 37.72
2022-01-26 14:17:46.578 | DEBUG    | __main__:trials:24 - Trial = 16683/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.580 | DEBUG    | __main__:trials:29 - Trial = 16683/30000 | Total reward = 59.58
2022-01-26 14:17:46.584 | DEBUG    | __main__:trials:24 - Trial = 16684/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.585 | DEBUG    | __main__:trials:29 - Trial = 16684/30000 | Total reward = 40.23
2022-01-26 14:17:46.589 | DEBUG    | __main__:trials:24 - Trial = 16685/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.590 | DEBUG    | __main__:trials:29 - Trial = 16685/30000 | Total reward = 42.65
2022-01-26 14:17:46.592 | DEBUG    | __main__:trials:26 - Trial = 16686/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.594 | DEBUG    | __main__:trials:29 - Trial = 16686/30000 | Total reward = 21.62
2022-01-26 14:17:46.598 | DEBUG    | __main__:trials:24 - Trial = 16687/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.599 | DEBUG    | __main__:trials:29 - Trial = 16687/30000 | Total reward = 37.04
2022-01-26 14:17:46.603 | DEBUG    | __main__:trials:24 - Trial = 16688/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.605 | DEBUG    | __main__:trials:29 - Trial = 16688/30000 | Total reward = 37.80
2022-01-26 14:17:46.608 | DEBUG    | __main__:trials:24 - Trial = 16689/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.610 | DEBUG    | __main__:trials:29 - Trial = 16689/30000 | Total reward = 43.84
2022-01-26 14:17:46.613 | DEBUG    | __main__:trials:24 - Trial = 16690/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.615 | DEBUG    | __main__:trials:29 - Trial = 16690/30000 | Total reward = 37.61
2022-01-26 14:17:46.619 | DEBUG    | __main__:trials:24 - Trial = 16691/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.620 | DEBUG    | __main__:trials:29 - Trial = 16691/30000 | Total reward = 45.96
2022-01-26 14:17:46.624 | DEBUG    | __main__:trials:24 - Trial = 16692/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.625 | DEBUG    | __main__:trials:29 - Trial = 16692/30000 | Total reward = 53.50
2022-01-26 14:17:46.629 | DEBUG    | __main__:trials:24 - Trial = 16693/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.631 | DEBUG    | __main__:trials:29 - Trial = 16693/30000 | Total reward = 44.25
2022-01-26 14:17:46.634 | DEBUG    | __main__:trials:24 - Trial = 16694/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.636 | DEBUG    | __main__:trials:29 - Trial = 16694/30000 | Total reward = 45.31
2022-01-26 14:17:46.639 | DEBUG    | __main__:trials:24 - Trial = 16695/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.641 | DEBUG    | __main__:trials:29 - Trial = 16695/30000 | Total reward = 41.93
2022-01-26 14:17:46.644 | DEBUG    | __main__:trials:24 - Trial = 16696/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.646 | DEBUG    | __main__:trials:29 - Trial = 16696/30000 | Total reward = 40.12
2022-01-26 14:17:46.649 | DEBUG    | __main__:trials:24 - Trial = 16697/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.650 | DEBUG    | __main__:trials:29 - Trial = 16697/30000 | Total reward = 37.23
2022-01-26 14:17:46.654 | DEBUG    | __main__:trials:24 - Trial = 16698/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.656 | DEBUG    | __main__:trials:29 - Trial = 16698/30000 | Total reward = 42.60
2022-01-26 14:17:46.659 | DEBUG    | __main__:trials:24 - Trial = 16699/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.661 | DEBUG    | __main__:trials:29 - Trial = 16699/30000 | Total reward = 38.13
2022-01-26 14:17:46.665 | DEBUG    | __main__:trials:24 - Trial = 16700/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.666 | DEBUG    | __main__:trials:29 - Trial = 16700/30000 | Total reward = 51.33
2022-01-26 14:17:46.670 | DEBUG    | __main__:trials:24 - Trial = 16701/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.672 | DEBUG    | __main__:trials:29 - Trial = 16701/30000 | Total reward = 41.97
2022-01-26 14:17:46.675 | DEBUG    | __main__:trials:24 - Trial = 16702/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.677 | DEBUG    | __main__:trials:29 - Trial = 16702/30000 | Total reward = 59.20
2022-01-26 14:17:46.680 | DEBUG    | __main__:trials:24 - Trial = 16703/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.682 | DEBUG    | __main__:trials:29 - Trial = 16703/30000 | Total reward = 39.56
2022-01-26 14:17:46.686 | DEBUG    | __main__:trials:24 - Trial = 16704/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.687 | DEBUG    | __main__:trials:29 - Trial = 16704/30000 | Total reward = 42.47
2022-01-26 14:17:46.691 | DEBUG    | __main__:trials:24 - Trial = 16705/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.693 | DEBUG    | __main__:trials:29 - Trial = 16705/30000 | Total reward = 46.11
2022-01-26 14:17:46.696 | DEBUG    | __main__:trials:24 - Trial = 16706/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.697 | DEBUG    | __main__:trials:29 - Trial = 16706/30000 | Total reward = 35.78
2022-01-26 14:17:46.701 | DEBUG    | __main__:trials:26 - Trial = 16707/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.702 | DEBUG    | __main__:trials:29 - Trial = 16707/30000 | Total reward = 35.75
2022-01-26 14:17:46.706 | DEBUG    | __main__:trials:24 - Trial = 16708/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.707 | DEBUG    | __main__:trials:29 - Trial = 16708/30000 | Total reward = 42.53
2022-01-26 14:17:46.711 | DEBUG    | __main__:trials:24 - Trial = 16709/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.713 | DEBUG    | __main__:trials:29 - Trial = 16709/30000 | Total reward = 38.95
2022-01-26 14:17:46.716 | DEBUG    | __main__:trials:24 - Trial = 16710/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.717 | DEBUG    | __main__:trials:29 - Trial = 16710/30000 | Total reward = 40.69
2022-01-26 14:17:46.721 | DEBUG    | __main__:trials:24 - Trial = 16711/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.722 | DEBUG    | __main__:trials:29 - Trial = 16711/30000 | Total reward = 44.52
2022-01-26 14:17:46.726 | DEBUG    | __main__:trials:24 - Trial = 16712/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.726 | DEBUG    | __main__:trials:29 - Trial = 16712/30000 | Total reward = 25.88
2022-01-26 14:17:46.731 | DEBUG    | __main__:trials:24 - Trial = 16713/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.732 | DEBUG    | __main__:trials:29 - Trial = 16713/30000 | Total reward = 46.39
2022-01-26 14:17:46.736 | DEBUG    | __main__:trials:24 - Trial = 16714/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.738 | DEBUG    | __main__:trials:29 - Trial = 16714/30000 | Total reward = 37.29
2022-01-26 14:17:46.741 | DEBUG    | __main__:trials:24 - Trial = 16715/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.743 | DEBUG    | __main__:trials:29 - Trial = 16715/30000 | Total reward = 52.31
2022-01-26 14:17:46.747 | DEBUG    | __main__:trials:24 - Trial = 16716/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.748 | DEBUG    | __main__:trials:29 - Trial = 16716/30000 | Total reward = 40.47
2022-01-26 14:17:46.752 | DEBUG    | __main__:trials:24 - Trial = 16717/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.754 | DEBUG    | __main__:trials:29 - Trial = 16717/30000 | Total reward = 35.67
2022-01-26 14:17:46.757 | DEBUG    | __main__:trials:24 - Trial = 16718/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.759 | DEBUG    | __main__:trials:29 - Trial = 16718/30000 | Total reward = 38.32
2022-01-26 14:17:46.763 | DEBUG    | __main__:trials:24 - Trial = 16719/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.764 | DEBUG    | __main__:trials:29 - Trial = 16719/30000 | Total reward = 42.39
2022-01-26 14:17:46.768 | DEBUG    | __main__:trials:26 - Trial = 16720/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:46.769 | DEBUG    | __main__:trials:29 - Trial = 16720/30000 | Total reward = 20.28
2022-01-26 14:17:46.773 | DEBUG    | __main__:trials:24 - Trial = 16721/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.775 | DEBUG    | __main__:trials:29 - Trial = 16721/30000 | Total reward = 41.48
2022-01-26 14:17:46.779 | DEBUG    | __main__:trials:24 - Trial = 16722/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.780 | DEBUG    | __main__:trials:29 - Trial = 16722/30000 | Total reward = 38.77
2022-01-26 14:17:46.784 | DEBUG    | __main__:trials:24 - Trial = 16723/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.785 | DEBUG    | __main__:trials:29 - Trial = 16723/30000 | Total reward = 35.68
2022-01-26 14:17:46.789 | DEBUG    | __main__:trials:24 - Trial = 16724/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.790 | DEBUG    | __main__:trials:29 - Trial = 16724/30000 | Total reward = 48.44
2022-01-26 14:17:46.794 | DEBUG    | __main__:trials:24 - Trial = 16725/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.794 | DEBUG    | __main__:trials:29 - Trial = 16725/30000 | Total reward = 46.07
2022-01-26 14:17:46.798 | DEBUG    | __main__:trials:24 - Trial = 16726/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.800 | DEBUG    | __main__:trials:29 - Trial = 16726/30000 | Total reward = 45.85
2022-01-26 14:17:46.803 | DEBUG    | __main__:trials:24 - Trial = 16727/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.804 | DEBUG    | __main__:trials:29 - Trial = 16727/30000 | Total reward = 44.13
2022-01-26 14:17:46.808 | DEBUG    | __main__:trials:24 - Trial = 16728/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.809 | DEBUG    | __main__:trials:29 - Trial = 16728/30000 | Total reward = 50.56
2022-01-26 14:17:46.813 | DEBUG    | __main__:trials:24 - Trial = 16729/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.814 | DEBUG    | __main__:trials:29 - Trial = 16729/30000 | Total reward = 46.85
2022-01-26 14:17:46.818 | DEBUG    | __main__:trials:24 - Trial = 16730/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.819 | DEBUG    | __main__:trials:29 - Trial = 16730/30000 | Total reward = 40.25
2022-01-26 14:17:46.823 | DEBUG    | __main__:trials:24 - Trial = 16731/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.824 | DEBUG    | __main__:trials:29 - Trial = 16731/30000 | Total reward = 46.69
2022-01-26 14:17:46.828 | DEBUG    | __main__:trials:24 - Trial = 16732/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.829 | DEBUG    | __main__:trials:29 - Trial = 16732/30000 | Total reward = 44.80
2022-01-26 14:17:46.833 | DEBUG    | __main__:trials:24 - Trial = 16733/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.834 | DEBUG    | __main__:trials:29 - Trial = 16733/30000 | Total reward = 40.26
2022-01-26 14:17:46.838 | DEBUG    | __main__:trials:24 - Trial = 16734/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.840 | DEBUG    | __main__:trials:29 - Trial = 16734/30000 | Total reward = 43.46
2022-01-26 14:17:46.844 | DEBUG    | __main__:trials:24 - Trial = 16735/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.845 | DEBUG    | __main__:trials:29 - Trial = 16735/30000 | Total reward = 32.97
2022-01-26 14:17:46.848 | DEBUG    | __main__:trials:24 - Trial = 16736/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.849 | DEBUG    | __main__:trials:29 - Trial = 16736/30000 | Total reward = 36.85
2022-01-26 14:17:46.854 | DEBUG    | __main__:trials:24 - Trial = 16737/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.854 | DEBUG    | __main__:trials:29 - Trial = 16737/30000 | Total reward = 34.77
2022-01-26 14:17:46.858 | DEBUG    | __main__:trials:24 - Trial = 16738/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.860 | DEBUG    | __main__:trials:29 - Trial = 16738/30000 | Total reward = 37.44
2022-01-26 14:17:46.864 | DEBUG    | __main__:trials:24 - Trial = 16739/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.865 | DEBUG    | __main__:trials:29 - Trial = 16739/30000 | Total reward = 63.05
2022-01-26 14:17:46.869 | DEBUG    | __main__:trials:24 - Trial = 16740/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.870 | DEBUG    | __main__:trials:29 - Trial = 16740/30000 | Total reward = 32.67
2022-01-26 14:17:46.873 | DEBUG    | __main__:trials:24 - Trial = 16741/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.875 | DEBUG    | __main__:trials:29 - Trial = 16741/30000 | Total reward = 38.36
2022-01-26 14:17:46.879 | DEBUG    | __main__:trials:24 - Trial = 16742/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.881 | DEBUG    | __main__:trials:29 - Trial = 16742/30000 | Total reward = 54.79
2022-01-26 14:17:46.884 | DEBUG    | __main__:trials:24 - Trial = 16743/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.884 | DEBUG    | __main__:trials:29 - Trial = 16743/30000 | Total reward = 41.32
2022-01-26 14:17:46.888 | DEBUG    | __main__:trials:24 - Trial = 16744/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.889 | DEBUG    | __main__:trials:29 - Trial = 16744/30000 | Total reward = 50.51
2022-01-26 14:17:46.893 | DEBUG    | __main__:trials:24 - Trial = 16745/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.895 | DEBUG    | __main__:trials:29 - Trial = 16745/30000 | Total reward = 38.63
2022-01-26 14:17:46.898 | DEBUG    | __main__:trials:24 - Trial = 16746/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.899 | DEBUG    | __main__:trials:29 - Trial = 16746/30000 | Total reward = 63.96
2022-01-26 14:17:46.903 | DEBUG    | __main__:trials:24 - Trial = 16747/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.905 | DEBUG    | __main__:trials:29 - Trial = 16747/30000 | Total reward = 52.98
2022-01-26 14:17:46.908 | DEBUG    | __main__:trials:24 - Trial = 16748/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.909 | DEBUG    | __main__:trials:29 - Trial = 16748/30000 | Total reward = 36.53
2022-01-26 14:17:46.913 | DEBUG    | __main__:trials:24 - Trial = 16749/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.915 | DEBUG    | __main__:trials:29 - Trial = 16749/30000 | Total reward = 39.07
2022-01-26 14:17:46.918 | DEBUG    | __main__:trials:24 - Trial = 16750/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.920 | DEBUG    | __main__:trials:29 - Trial = 16750/30000 | Total reward = 38.37
2022-01-26 14:17:46.924 | DEBUG    | __main__:trials:24 - Trial = 16751/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.925 | DEBUG    | __main__:trials:29 - Trial = 16751/30000 | Total reward = 49.73
2022-01-26 14:17:46.928 | DEBUG    | __main__:trials:24 - Trial = 16752/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.930 | DEBUG    | __main__:trials:29 - Trial = 16752/30000 | Total reward = 45.87
2022-01-26 14:17:46.933 | DEBUG    | __main__:trials:24 - Trial = 16753/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.934 | DEBUG    | __main__:trials:29 - Trial = 16753/30000 | Total reward = 53.02
2022-01-26 14:17:46.937 | DEBUG    | __main__:trials:24 - Trial = 16754/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.938 | DEBUG    | __main__:trials:29 - Trial = 16754/30000 | Total reward = 59.56
2022-01-26 14:17:46.941 | DEBUG    | __main__:trials:24 - Trial = 16755/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.943 | DEBUG    | __main__:trials:29 - Trial = 16755/30000 | Total reward = 52.96
2022-01-26 14:17:46.947 | DEBUG    | __main__:trials:24 - Trial = 16756/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.948 | DEBUG    | __main__:trials:29 - Trial = 16756/30000 | Total reward = 55.74
2022-01-26 14:17:46.952 | DEBUG    | __main__:trials:24 - Trial = 16757/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.954 | DEBUG    | __main__:trials:29 - Trial = 16757/30000 | Total reward = 51.93
2022-01-26 14:17:46.958 | DEBUG    | __main__:trials:24 - Trial = 16758/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.959 | DEBUG    | __main__:trials:29 - Trial = 16758/30000 | Total reward = 39.46
2022-01-26 14:17:46.963 | DEBUG    | __main__:trials:24 - Trial = 16759/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.965 | DEBUG    | __main__:trials:29 - Trial = 16759/30000 | Total reward = 52.82
2022-01-26 14:17:46.968 | DEBUG    | __main__:trials:24 - Trial = 16760/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.970 | DEBUG    | __main__:trials:29 - Trial = 16760/30000 | Total reward = 55.96
2022-01-26 14:17:46.973 | DEBUG    | __main__:trials:24 - Trial = 16761/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.975 | DEBUG    | __main__:trials:29 - Trial = 16761/30000 | Total reward = 50.27
2022-01-26 14:17:46.979 | DEBUG    | __main__:trials:24 - Trial = 16762/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.980 | DEBUG    | __main__:trials:29 - Trial = 16762/30000 | Total reward = 61.29
2022-01-26 14:17:46.984 | DEBUG    | __main__:trials:24 - Trial = 16763/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.984 | DEBUG    | __main__:trials:29 - Trial = 16763/30000 | Total reward = 59.56
2022-01-26 14:17:46.989 | DEBUG    | __main__:trials:24 - Trial = 16764/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.990 | DEBUG    | __main__:trials:29 - Trial = 16764/30000 | Total reward = 55.47
2022-01-26 14:17:46.994 | DEBUG    | __main__:trials:24 - Trial = 16765/30000 | Max number of steps (20) reached
2022-01-26 14:17:46.995 | DEBUG    | __main__:trials:29 - Trial = 16765/30000 | Total reward = 37.73
2022-01-26 14:17:46.999 | DEBUG    | __main__:trials:24 - Trial = 16766/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.000 | DEBUG    | __main__:trials:29 - Trial = 16766/30000 | Total reward = 63.24
2022-01-26 14:17:47.003 | DEBUG    | __main__:trials:24 - Trial = 16767/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.004 | DEBUG    | __main__:trials:29 - Trial = 16767/30000 | Total reward = 49.18
2022-01-26 14:17:47.008 | DEBUG    | __main__:trials:24 - Trial = 16768/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.009 | DEBUG    | __main__:trials:29 - Trial = 16768/30000 | Total reward = 52.20
2022-01-26 14:17:47.013 | DEBUG    | __main__:trials:24 - Trial = 16769/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.015 | DEBUG    | __main__:trials:29 - Trial = 16769/30000 | Total reward = 52.22
2022-01-26 14:17:47.018 | DEBUG    | __main__:trials:24 - Trial = 16770/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.020 | DEBUG    | __main__:trials:29 - Trial = 16770/30000 | Total reward = 52.83
2022-01-26 14:17:47.023 | DEBUG    | __main__:trials:24 - Trial = 16771/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.025 | DEBUG    | __main__:trials:29 - Trial = 16771/30000 | Total reward = 38.41
2022-01-26 14:17:47.028 | DEBUG    | __main__:trials:24 - Trial = 16772/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.029 | DEBUG    | __main__:trials:29 - Trial = 16772/30000 | Total reward = 39.27
2022-01-26 14:17:47.034 | DEBUG    | __main__:trials:24 - Trial = 16773/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.034 | DEBUG    | __main__:trials:29 - Trial = 16773/30000 | Total reward = 39.33
2022-01-26 14:17:47.038 | DEBUG    | __main__:trials:24 - Trial = 16774/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.040 | DEBUG    | __main__:trials:29 - Trial = 16774/30000 | Total reward = 66.71
2022-01-26 14:17:47.044 | DEBUG    | __main__:trials:24 - Trial = 16775/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.045 | DEBUG    | __main__:trials:29 - Trial = 16775/30000 | Total reward = 53.35
2022-01-26 14:17:47.048 | DEBUG    | __main__:trials:24 - Trial = 16776/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.050 | DEBUG    | __main__:trials:29 - Trial = 16776/30000 | Total reward = 32.25
2022-01-26 14:17:47.054 | DEBUG    | __main__:trials:24 - Trial = 16777/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.055 | DEBUG    | __main__:trials:29 - Trial = 16777/30000 | Total reward = 40.56
2022-01-26 14:17:47.059 | DEBUG    | __main__:trials:24 - Trial = 16778/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.060 | DEBUG    | __main__:trials:29 - Trial = 16778/30000 | Total reward = 52.44
2022-01-26 14:17:47.064 | DEBUG    | __main__:trials:24 - Trial = 16779/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.065 | DEBUG    | __main__:trials:29 - Trial = 16779/30000 | Total reward = 52.47
2022-01-26 14:17:47.068 | DEBUG    | __main__:trials:24 - Trial = 16780/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.070 | DEBUG    | __main__:trials:29 - Trial = 16780/30000 | Total reward = 55.99
2022-01-26 14:17:47.074 | DEBUG    | __main__:trials:24 - Trial = 16781/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.075 | DEBUG    | __main__:trials:29 - Trial = 16781/30000 | Total reward = 34.44
2022-01-26 14:17:47.079 | DEBUG    | __main__:trials:24 - Trial = 16782/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.081 | DEBUG    | __main__:trials:29 - Trial = 16782/30000 | Total reward = 52.55
2022-01-26 14:17:47.084 | DEBUG    | __main__:trials:24 - Trial = 16783/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.085 | DEBUG    | __main__:trials:29 - Trial = 16783/30000 | Total reward = 47.99
2022-01-26 14:17:47.088 | DEBUG    | __main__:trials:24 - Trial = 16784/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.089 | DEBUG    | __main__:trials:29 - Trial = 16784/30000 | Total reward = 36.59
2022-01-26 14:17:47.092 | DEBUG    | __main__:trials:24 - Trial = 16785/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.094 | DEBUG    | __main__:trials:29 - Trial = 16785/30000 | Total reward = 42.78
2022-01-26 14:17:47.097 | DEBUG    | __main__:trials:24 - Trial = 16786/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.098 | DEBUG    | __main__:trials:29 - Trial = 16786/30000 | Total reward = 40.05
2022-01-26 14:17:47.101 | DEBUG    | __main__:trials:24 - Trial = 16787/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.103 | DEBUG    | __main__:trials:29 - Trial = 16787/30000 | Total reward = 37.13
2022-01-26 14:17:47.107 | DEBUG    | __main__:trials:24 - Trial = 16788/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.109 | DEBUG    | __main__:trials:29 - Trial = 16788/30000 | Total reward = 59.18
2022-01-26 14:17:47.112 | DEBUG    | __main__:trials:24 - Trial = 16789/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.114 | DEBUG    | __main__:trials:29 - Trial = 16789/30000 | Total reward = 37.39
2022-01-26 14:17:47.118 | DEBUG    | __main__:trials:24 - Trial = 16790/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.119 | DEBUG    | __main__:trials:29 - Trial = 16790/30000 | Total reward = 38.36
2022-01-26 14:17:47.123 | DEBUG    | __main__:trials:24 - Trial = 16791/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.124 | DEBUG    | __main__:trials:29 - Trial = 16791/30000 | Total reward = 38.36
2022-01-26 14:17:47.128 | DEBUG    | __main__:trials:24 - Trial = 16792/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.130 | DEBUG    | __main__:trials:29 - Trial = 16792/30000 | Total reward = 39.66
2022-01-26 14:17:47.133 | DEBUG    | __main__:trials:24 - Trial = 16793/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.135 | DEBUG    | __main__:trials:29 - Trial = 16793/30000 | Total reward = 42.74
2022-01-26 14:17:47.139 | DEBUG    | __main__:trials:24 - Trial = 16794/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.140 | DEBUG    | __main__:trials:29 - Trial = 16794/30000 | Total reward = 45.63
2022-01-26 14:17:47.143 | DEBUG    | __main__:trials:24 - Trial = 16795/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.145 | DEBUG    | __main__:trials:29 - Trial = 16795/30000 | Total reward = 42.24
2022-01-26 14:17:47.149 | DEBUG    | __main__:trials:24 - Trial = 16796/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.151 | DEBUG    | __main__:trials:29 - Trial = 16796/30000 | Total reward = 51.22
2022-01-26 14:17:47.155 | DEBUG    | __main__:trials:24 - Trial = 16797/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.156 | DEBUG    | __main__:trials:29 - Trial = 16797/30000 | Total reward = 39.67
2022-01-26 14:17:47.160 | DEBUG    | __main__:trials:24 - Trial = 16798/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.162 | DEBUG    | __main__:trials:29 - Trial = 16798/30000 | Total reward = 34.51
2022-01-26 14:17:47.166 | DEBUG    | __main__:trials:24 - Trial = 16799/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.167 | DEBUG    | __main__:trials:29 - Trial = 16799/30000 | Total reward = 46.27
2022-01-26 14:17:47.172 | DEBUG    | __main__:trials:24 - Trial = 16800/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.173 | DEBUG    | __main__:trials:29 - Trial = 16800/30000 | Total reward = 44.85
2022-01-26 14:17:47.177 | DEBUG    | __main__:trials:24 - Trial = 16801/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.178 | DEBUG    | __main__:trials:29 - Trial = 16801/30000 | Total reward = 46.25
2022-01-26 14:17:47.181 | DEBUG    | __main__:trials:24 - Trial = 16802/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.183 | DEBUG    | __main__:trials:29 - Trial = 16802/30000 | Total reward = 38.17
2022-01-26 14:17:47.186 | DEBUG    | __main__:trials:24 - Trial = 16803/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.188 | DEBUG    | __main__:trials:29 - Trial = 16803/30000 | Total reward = 40.61
2022-01-26 14:17:47.192 | DEBUG    | __main__:trials:26 - Trial = 16804/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:47.193 | DEBUG    | __main__:trials:29 - Trial = 16804/30000 | Total reward = 27.37
2022-01-26 14:17:47.197 | DEBUG    | __main__:trials:24 - Trial = 16805/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.199 | DEBUG    | __main__:trials:29 - Trial = 16805/30000 | Total reward = 35.76
2022-01-26 14:17:47.203 | DEBUG    | __main__:trials:24 - Trial = 16806/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.203 | DEBUG    | __main__:trials:29 - Trial = 16806/30000 | Total reward = 34.23
2022-01-26 14:17:47.207 | DEBUG    | __main__:trials:24 - Trial = 16807/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.209 | DEBUG    | __main__:trials:29 - Trial = 16807/30000 | Total reward = 44.11
2022-01-26 14:17:47.212 | DEBUG    | __main__:trials:24 - Trial = 16808/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.214 | DEBUG    | __main__:trials:29 - Trial = 16808/30000 | Total reward = 41.07
2022-01-26 14:17:47.217 | DEBUG    | __main__:trials:24 - Trial = 16809/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.218 | DEBUG    | __main__:trials:29 - Trial = 16809/30000 | Total reward = 54.86
2022-01-26 14:17:47.222 | DEBUG    | __main__:trials:24 - Trial = 16810/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.224 | DEBUG    | __main__:trials:29 - Trial = 16810/30000 | Total reward = 40.64
2022-01-26 14:17:47.228 | DEBUG    | __main__:trials:24 - Trial = 16811/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.229 | DEBUG    | __main__:trials:29 - Trial = 16811/30000 | Total reward = 42.58
2022-01-26 14:17:47.519 | DEBUG    | __main__:trials:24 - Trial = 16812/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.522 | DEBUG    | __main__:trials:29 - Trial = 16812/30000 | Total reward = 40.68
2022-01-26 14:17:47.526 | DEBUG    | __main__:trials:24 - Trial = 16813/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.528 | DEBUG    | __main__:trials:29 - Trial = 16813/30000 | Total reward = 49.30
2022-01-26 14:17:47.532 | DEBUG    | __main__:trials:24 - Trial = 16814/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.532 | DEBUG    | __main__:trials:29 - Trial = 16814/30000 | Total reward = 54.50
2022-01-26 14:17:47.536 | DEBUG    | __main__:trials:24 - Trial = 16815/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.537 | DEBUG    | __main__:trials:29 - Trial = 16815/30000 | Total reward = 52.01
2022-01-26 14:17:47.542 | DEBUG    | __main__:trials:24 - Trial = 16816/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.542 | DEBUG    | __main__:trials:29 - Trial = 16816/30000 | Total reward = 57.69
2022-01-26 14:17:47.547 | DEBUG    | __main__:trials:24 - Trial = 16817/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.549 | DEBUG    | __main__:trials:29 - Trial = 16817/30000 | Total reward = 51.68
2022-01-26 14:17:47.552 | DEBUG    | __main__:trials:24 - Trial = 16818/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.553 | DEBUG    | __main__:trials:29 - Trial = 16818/30000 | Total reward = 36.43
2022-01-26 14:17:47.557 | DEBUG    | __main__:trials:24 - Trial = 16819/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.559 | DEBUG    | __main__:trials:29 - Trial = 16819/30000 | Total reward = 51.78
2022-01-26 14:17:47.563 | DEBUG    | __main__:trials:24 - Trial = 16820/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.564 | DEBUG    | __main__:trials:29 - Trial = 16820/30000 | Total reward = 56.08
2022-01-26 14:17:47.568 | DEBUG    | __main__:trials:24 - Trial = 16821/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.569 | DEBUG    | __main__:trials:29 - Trial = 16821/30000 | Total reward = 50.70
2022-01-26 14:17:47.573 | DEBUG    | __main__:trials:24 - Trial = 16822/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.574 | DEBUG    | __main__:trials:29 - Trial = 16822/30000 | Total reward = 52.17
2022-01-26 14:17:47.578 | DEBUG    | __main__:trials:24 - Trial = 16823/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.579 | DEBUG    | __main__:trials:29 - Trial = 16823/30000 | Total reward = 56.31
2022-01-26 14:17:47.583 | DEBUG    | __main__:trials:24 - Trial = 16824/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.584 | DEBUG    | __main__:trials:29 - Trial = 16824/30000 | Total reward = 55.46
2022-01-26 14:17:47.588 | DEBUG    | __main__:trials:24 - Trial = 16825/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.590 | DEBUG    | __main__:trials:29 - Trial = 16825/30000 | Total reward = 63.24
2022-01-26 14:17:47.594 | DEBUG    | __main__:trials:24 - Trial = 16826/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.595 | DEBUG    | __main__:trials:29 - Trial = 16826/30000 | Total reward = 53.51
2022-01-26 14:17:47.599 | DEBUG    | __main__:trials:24 - Trial = 16827/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.600 | DEBUG    | __main__:trials:29 - Trial = 16827/30000 | Total reward = 54.42
2022-01-26 14:17:47.604 | DEBUG    | __main__:trials:24 - Trial = 16828/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.606 | DEBUG    | __main__:trials:29 - Trial = 16828/30000 | Total reward = 54.38
2022-01-26 14:17:47.610 | DEBUG    | __main__:trials:24 - Trial = 16829/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.610 | DEBUG    | __main__:trials:29 - Trial = 16829/30000 | Total reward = 52.82
2022-01-26 14:17:47.615 | DEBUG    | __main__:trials:24 - Trial = 16830/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.616 | DEBUG    | __main__:trials:29 - Trial = 16830/30000 | Total reward = 46.24
2022-01-26 14:17:47.620 | DEBUG    | __main__:trials:24 - Trial = 16831/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.622 | DEBUG    | __main__:trials:29 - Trial = 16831/30000 | Total reward = 56.64
2022-01-26 14:17:47.625 | DEBUG    | __main__:trials:24 - Trial = 16832/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.626 | DEBUG    | __main__:trials:29 - Trial = 16832/30000 | Total reward = 54.98
2022-01-26 14:17:47.630 | DEBUG    | __main__:trials:24 - Trial = 16833/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.631 | DEBUG    | __main__:trials:29 - Trial = 16833/30000 | Total reward = 53.51
2022-01-26 14:17:47.635 | DEBUG    | __main__:trials:24 - Trial = 16834/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.635 | DEBUG    | __main__:trials:29 - Trial = 16834/30000 | Total reward = 51.26
2022-01-26 14:17:47.639 | DEBUG    | __main__:trials:24 - Trial = 16835/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.641 | DEBUG    | __main__:trials:29 - Trial = 16835/30000 | Total reward = 43.29
2022-01-26 14:17:47.644 | DEBUG    | __main__:trials:26 - Trial = 16836/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:47.645 | DEBUG    | __main__:trials:29 - Trial = 16836/30000 | Total reward = 27.46
2022-01-26 14:17:47.648 | DEBUG    | __main__:trials:24 - Trial = 16837/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.649 | DEBUG    | __main__:trials:29 - Trial = 16837/30000 | Total reward = 48.43
2022-01-26 14:17:47.653 | DEBUG    | __main__:trials:24 - Trial = 16838/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.653 | DEBUG    | __main__:trials:29 - Trial = 16838/30000 | Total reward = 48.74
2022-01-26 14:17:47.657 | DEBUG    | __main__:trials:24 - Trial = 16839/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.659 | DEBUG    | __main__:trials:29 - Trial = 16839/30000 | Total reward = 46.45
2022-01-26 14:17:47.662 | DEBUG    | __main__:trials:24 - Trial = 16840/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.663 | DEBUG    | __main__:trials:29 - Trial = 16840/30000 | Total reward = 53.35
2022-01-26 14:17:47.667 | DEBUG    | __main__:trials:24 - Trial = 16841/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.668 | DEBUG    | __main__:trials:29 - Trial = 16841/30000 | Total reward = 48.31
2022-01-26 14:17:47.671 | DEBUG    | __main__:trials:24 - Trial = 16842/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.673 | DEBUG    | __main__:trials:29 - Trial = 16842/30000 | Total reward = 50.85
2022-01-26 14:17:47.676 | DEBUG    | __main__:trials:24 - Trial = 16843/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.678 | DEBUG    | __main__:trials:29 - Trial = 16843/30000 | Total reward = 52.59
2022-01-26 14:17:47.682 | DEBUG    | __main__:trials:24 - Trial = 16844/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.683 | DEBUG    | __main__:trials:29 - Trial = 16844/30000 | Total reward = 52.44
2022-01-26 14:17:47.686 | DEBUG    | __main__:trials:24 - Trial = 16845/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.688 | DEBUG    | __main__:trials:29 - Trial = 16845/30000 | Total reward = 61.51
2022-01-26 14:17:47.691 | DEBUG    | __main__:trials:24 - Trial = 16846/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.692 | DEBUG    | __main__:trials:29 - Trial = 16846/30000 | Total reward = 48.85
2022-01-26 14:17:47.696 | DEBUG    | __main__:trials:24 - Trial = 16847/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.697 | DEBUG    | __main__:trials:29 - Trial = 16847/30000 | Total reward = 52.98
2022-01-26 14:17:47.700 | DEBUG    | __main__:trials:24 - Trial = 16848/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.702 | DEBUG    | __main__:trials:29 - Trial = 16848/30000 | Total reward = 51.68
2022-01-26 14:17:47.706 | DEBUG    | __main__:trials:24 - Trial = 16849/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.707 | DEBUG    | __main__:trials:29 - Trial = 16849/30000 | Total reward = 52.26
2022-01-26 14:17:47.710 | DEBUG    | __main__:trials:24 - Trial = 16850/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.711 | DEBUG    | __main__:trials:29 - Trial = 16850/30000 | Total reward = 48.57
2022-01-26 14:17:47.715 | DEBUG    | __main__:trials:24 - Trial = 16851/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.717 | DEBUG    | __main__:trials:29 - Trial = 16851/30000 | Total reward = 54.69
2022-01-26 14:17:47.719 | DEBUG    | __main__:trials:24 - Trial = 16852/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.721 | DEBUG    | __main__:trials:29 - Trial = 16852/30000 | Total reward = 48.18
2022-01-26 14:17:47.724 | DEBUG    | __main__:trials:24 - Trial = 16853/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.726 | DEBUG    | __main__:trials:29 - Trial = 16853/30000 | Total reward = 48.19
2022-01-26 14:17:47.729 | DEBUG    | __main__:trials:24 - Trial = 16854/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.730 | DEBUG    | __main__:trials:29 - Trial = 16854/30000 | Total reward = 40.27
2022-01-26 14:17:47.733 | DEBUG    | __main__:trials:24 - Trial = 16855/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.735 | DEBUG    | __main__:trials:29 - Trial = 16855/30000 | Total reward = 43.69
2022-01-26 14:17:47.738 | DEBUG    | __main__:trials:24 - Trial = 16856/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.739 | DEBUG    | __main__:trials:29 - Trial = 16856/30000 | Total reward = 42.03
2022-01-26 14:17:47.743 | DEBUG    | __main__:trials:24 - Trial = 16857/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.744 | DEBUG    | __main__:trials:29 - Trial = 16857/30000 | Total reward = 59.11
2022-01-26 14:17:47.747 | DEBUG    | __main__:trials:24 - Trial = 16858/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.749 | DEBUG    | __main__:trials:29 - Trial = 16858/30000 | Total reward = 50.27
2022-01-26 14:17:47.753 | DEBUG    | __main__:trials:24 - Trial = 16859/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.754 | DEBUG    | __main__:trials:29 - Trial = 16859/30000 | Total reward = 46.39
2022-01-26 14:17:47.757 | DEBUG    | __main__:trials:24 - Trial = 16860/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.759 | DEBUG    | __main__:trials:29 - Trial = 16860/30000 | Total reward = 41.84
2022-01-26 14:17:47.762 | DEBUG    | __main__:trials:24 - Trial = 16861/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.763 | DEBUG    | __main__:trials:29 - Trial = 16861/30000 | Total reward = 44.30
2022-01-26 14:17:47.766 | DEBUG    | __main__:trials:24 - Trial = 16862/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.767 | DEBUG    | __main__:trials:29 - Trial = 16862/30000 | Total reward = 46.00
2022-01-26 14:17:47.769 | DEBUG    | __main__:trials:24 - Trial = 16863/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.771 | DEBUG    | __main__:trials:29 - Trial = 16863/30000 | Total reward = 41.01
2022-01-26 14:17:47.774 | DEBUG    | __main__:trials:24 - Trial = 16864/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.775 | DEBUG    | __main__:trials:29 - Trial = 16864/30000 | Total reward = 58.69
2022-01-26 14:17:47.779 | DEBUG    | __main__:trials:24 - Trial = 16865/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.779 | DEBUG    | __main__:trials:29 - Trial = 16865/30000 | Total reward = 51.79
2022-01-26 14:17:47.784 | DEBUG    | __main__:trials:24 - Trial = 16866/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.787 | DEBUG    | __main__:trials:29 - Trial = 16866/30000 | Total reward = 59.14
2022-01-26 14:17:47.790 | DEBUG    | __main__:trials:24 - Trial = 16867/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.792 | DEBUG    | __main__:trials:29 - Trial = 16867/30000 | Total reward = 50.43
2022-01-26 14:17:47.796 | DEBUG    | __main__:trials:24 - Trial = 16868/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.797 | DEBUG    | __main__:trials:29 - Trial = 16868/30000 | Total reward = 51.28
2022-01-26 14:17:47.801 | DEBUG    | __main__:trials:24 - Trial = 16869/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.802 | DEBUG    | __main__:trials:29 - Trial = 16869/30000 | Total reward = 31.67
2022-01-26 14:17:47.806 | DEBUG    | __main__:trials:24 - Trial = 16870/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.808 | DEBUG    | __main__:trials:29 - Trial = 16870/30000 | Total reward = 47.79
2022-01-26 14:17:47.812 | DEBUG    | __main__:trials:26 - Trial = 16871/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:47.813 | DEBUG    | __main__:trials:29 - Trial = 16871/30000 | Total reward = 27.21
2022-01-26 14:17:47.817 | DEBUG    | __main__:trials:24 - Trial = 16872/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.819 | DEBUG    | __main__:trials:29 - Trial = 16872/30000 | Total reward = 54.84
2022-01-26 14:17:47.822 | DEBUG    | __main__:trials:24 - Trial = 16873/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.824 | DEBUG    | __main__:trials:29 - Trial = 16873/30000 | Total reward = 46.36
2022-01-26 14:17:47.827 | DEBUG    | __main__:trials:24 - Trial = 16874/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.829 | DEBUG    | __main__:trials:29 - Trial = 16874/30000 | Total reward = 37.64
2022-01-26 14:17:47.832 | DEBUG    | __main__:trials:24 - Trial = 16875/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.833 | DEBUG    | __main__:trials:29 - Trial = 16875/30000 | Total reward = 53.40
2022-01-26 14:17:47.836 | DEBUG    | __main__:trials:24 - Trial = 16876/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.838 | DEBUG    | __main__:trials:29 - Trial = 16876/30000 | Total reward = 41.98
2022-01-26 14:17:47.842 | DEBUG    | __main__:trials:24 - Trial = 16877/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.842 | DEBUG    | __main__:trials:29 - Trial = 16877/30000 | Total reward = 47.42
2022-01-26 14:17:47.847 | DEBUG    | __main__:trials:24 - Trial = 16878/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.848 | DEBUG    | __main__:trials:29 - Trial = 16878/30000 | Total reward = 41.39
2022-01-26 14:17:47.852 | DEBUG    | __main__:trials:24 - Trial = 16879/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.853 | DEBUG    | __main__:trials:29 - Trial = 16879/30000 | Total reward = 59.53
2022-01-26 14:17:47.857 | DEBUG    | __main__:trials:24 - Trial = 16880/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.859 | DEBUG    | __main__:trials:29 - Trial = 16880/30000 | Total reward = 44.74
2022-01-26 14:17:47.862 | DEBUG    | __main__:trials:24 - Trial = 16881/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.863 | DEBUG    | __main__:trials:29 - Trial = 16881/30000 | Total reward = 59.93
2022-01-26 14:17:47.867 | DEBUG    | __main__:trials:24 - Trial = 16882/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.869 | DEBUG    | __main__:trials:29 - Trial = 16882/30000 | Total reward = 51.84
2022-01-26 14:17:47.873 | DEBUG    | __main__:trials:24 - Trial = 16883/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.874 | DEBUG    | __main__:trials:29 - Trial = 16883/30000 | Total reward = 35.58
2022-01-26 14:17:47.877 | DEBUG    | __main__:trials:24 - Trial = 16884/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.878 | DEBUG    | __main__:trials:29 - Trial = 16884/30000 | Total reward = 39.81
2022-01-26 14:17:47.881 | DEBUG    | __main__:trials:24 - Trial = 16885/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.882 | DEBUG    | __main__:trials:29 - Trial = 16885/30000 | Total reward = 43.91
2022-01-26 14:17:47.885 | DEBUG    | __main__:trials:24 - Trial = 16886/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.887 | DEBUG    | __main__:trials:29 - Trial = 16886/30000 | Total reward = 44.11
2022-01-26 14:17:47.891 | DEBUG    | __main__:trials:24 - Trial = 16887/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.891 | DEBUG    | __main__:trials:29 - Trial = 16887/30000 | Total reward = 53.76
2022-01-26 14:17:47.896 | DEBUG    | __main__:trials:24 - Trial = 16888/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.897 | DEBUG    | __main__:trials:29 - Trial = 16888/30000 | Total reward = 40.98
2022-01-26 14:17:47.901 | DEBUG    | __main__:trials:24 - Trial = 16889/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.902 | DEBUG    | __main__:trials:29 - Trial = 16889/30000 | Total reward = 51.35
2022-01-26 14:17:47.906 | DEBUG    | __main__:trials:24 - Trial = 16890/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.906 | DEBUG    | __main__:trials:29 - Trial = 16890/30000 | Total reward = 42.60
2022-01-26 14:17:47.911 | DEBUG    | __main__:trials:24 - Trial = 16891/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.913 | DEBUG    | __main__:trials:29 - Trial = 16891/30000 | Total reward = 60.50
2022-01-26 14:17:47.916 | DEBUG    | __main__:trials:24 - Trial = 16892/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.918 | DEBUG    | __main__:trials:29 - Trial = 16892/30000 | Total reward = 67.84
2022-01-26 14:17:47.921 | DEBUG    | __main__:trials:24 - Trial = 16893/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.923 | DEBUG    | __main__:trials:29 - Trial = 16893/30000 | Total reward = 54.47
2022-01-26 14:17:47.927 | DEBUG    | __main__:trials:24 - Trial = 16894/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.928 | DEBUG    | __main__:trials:29 - Trial = 16894/30000 | Total reward = 56.49
2022-01-26 14:17:47.932 | DEBUG    | __main__:trials:24 - Trial = 16895/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.933 | DEBUG    | __main__:trials:29 - Trial = 16895/30000 | Total reward = 47.90
2022-01-26 14:17:47.936 | DEBUG    | __main__:trials:24 - Trial = 16896/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.938 | DEBUG    | __main__:trials:29 - Trial = 16896/30000 | Total reward = 38.31
2022-01-26 14:17:47.942 | DEBUG    | __main__:trials:24 - Trial = 16897/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.943 | DEBUG    | __main__:trials:29 - Trial = 16897/30000 | Total reward = 52.32
2022-01-26 14:17:47.947 | DEBUG    | __main__:trials:24 - Trial = 16898/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.949 | DEBUG    | __main__:trials:29 - Trial = 16898/30000 | Total reward = 44.37
2022-01-26 14:17:47.952 | DEBUG    | __main__:trials:24 - Trial = 16899/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.953 | DEBUG    | __main__:trials:29 - Trial = 16899/30000 | Total reward = 52.44
2022-01-26 14:17:47.956 | DEBUG    | __main__:trials:24 - Trial = 16900/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.957 | DEBUG    | __main__:trials:29 - Trial = 16900/30000 | Total reward = 62.74
2022-01-26 14:17:47.961 | DEBUG    | __main__:trials:24 - Trial = 16901/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.962 | DEBUG    | __main__:trials:29 - Trial = 16901/30000 | Total reward = 59.21
2022-01-26 14:17:47.966 | DEBUG    | __main__:trials:24 - Trial = 16902/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.967 | DEBUG    | __main__:trials:29 - Trial = 16902/30000 | Total reward = 51.22
2022-01-26 14:17:47.970 | DEBUG    | __main__:trials:24 - Trial = 16903/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.971 | DEBUG    | __main__:trials:29 - Trial = 16903/30000 | Total reward = 51.80
2022-01-26 14:17:47.973 | DEBUG    | __main__:trials:26 - Trial = 16904/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:47.975 | DEBUG    | __main__:trials:29 - Trial = 16904/30000 | Total reward = 29.16
2022-01-26 14:17:47.979 | DEBUG    | __main__:trials:24 - Trial = 16905/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.980 | DEBUG    | __main__:trials:29 - Trial = 16905/30000 | Total reward = 60.47
2022-01-26 14:17:47.983 | DEBUG    | __main__:trials:24 - Trial = 16906/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.984 | DEBUG    | __main__:trials:29 - Trial = 16906/30000 | Total reward = 52.49
2022-01-26 14:17:47.988 | DEBUG    | __main__:trials:24 - Trial = 16907/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.990 | DEBUG    | __main__:trials:29 - Trial = 16907/30000 | Total reward = 39.96
2022-01-26 14:17:47.993 | DEBUG    | __main__:trials:24 - Trial = 16908/30000 | Max number of steps (20) reached
2022-01-26 14:17:47.995 | DEBUG    | __main__:trials:29 - Trial = 16908/30000 | Total reward = 55.12
2022-01-26 14:17:47.999 | DEBUG    | __main__:trials:24 - Trial = 16909/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.000 | DEBUG    | __main__:trials:29 - Trial = 16909/30000 | Total reward = 47.99
2022-01-26 14:17:48.003 | DEBUG    | __main__:trials:26 - Trial = 16910/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.004 | DEBUG    | __main__:trials:29 - Trial = 16910/30000 | Total reward = 13.86
2022-01-26 14:17:48.007 | DEBUG    | __main__:trials:24 - Trial = 16911/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.009 | DEBUG    | __main__:trials:29 - Trial = 16911/30000 | Total reward = 41.97
2022-01-26 14:17:48.012 | DEBUG    | __main__:trials:24 - Trial = 16912/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.014 | DEBUG    | __main__:trials:29 - Trial = 16912/30000 | Total reward = 46.43
2022-01-26 14:17:48.017 | DEBUG    | __main__:trials:24 - Trial = 16913/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.018 | DEBUG    | __main__:trials:29 - Trial = 16913/30000 | Total reward = 44.24
2022-01-26 14:17:48.022 | DEBUG    | __main__:trials:24 - Trial = 16914/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.023 | DEBUG    | __main__:trials:29 - Trial = 16914/30000 | Total reward = 40.39
2022-01-26 14:17:48.026 | DEBUG    | __main__:trials:24 - Trial = 16915/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.028 | DEBUG    | __main__:trials:29 - Trial = 16915/30000 | Total reward = 33.22
2022-01-26 14:17:48.032 | DEBUG    | __main__:trials:24 - Trial = 16916/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.033 | DEBUG    | __main__:trials:29 - Trial = 16916/30000 | Total reward = 50.17
2022-01-26 14:17:48.036 | DEBUG    | __main__:trials:24 - Trial = 16917/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.038 | DEBUG    | __main__:trials:29 - Trial = 16917/30000 | Total reward = 51.12
2022-01-26 14:17:48.042 | DEBUG    | __main__:trials:24 - Trial = 16918/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.042 | DEBUG    | __main__:trials:29 - Trial = 16918/30000 | Total reward = 33.61
2022-01-26 14:17:48.046 | DEBUG    | __main__:trials:24 - Trial = 16919/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.048 | DEBUG    | __main__:trials:29 - Trial = 16919/30000 | Total reward = 41.86
2022-01-26 14:17:48.050 | DEBUG    | __main__:trials:26 - Trial = 16920/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.051 | DEBUG    | __main__:trials:29 - Trial = 16920/30000 | Total reward = 11.31
2022-01-26 14:17:48.055 | DEBUG    | __main__:trials:24 - Trial = 16921/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.057 | DEBUG    | __main__:trials:29 - Trial = 16921/30000 | Total reward = 51.59
2022-01-26 14:17:48.060 | DEBUG    | __main__:trials:24 - Trial = 16922/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.061 | DEBUG    | __main__:trials:29 - Trial = 16922/30000 | Total reward = 43.26
2022-01-26 14:17:48.065 | DEBUG    | __main__:trials:24 - Trial = 16923/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.065 | DEBUG    | __main__:trials:29 - Trial = 16923/30000 | Total reward = 52.66
2022-01-26 14:17:48.069 | DEBUG    | __main__:trials:24 - Trial = 16924/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.069 | DEBUG    | __main__:trials:29 - Trial = 16924/30000 | Total reward = 66.15
2022-01-26 14:17:48.073 | DEBUG    | __main__:trials:24 - Trial = 16925/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.075 | DEBUG    | __main__:trials:29 - Trial = 16925/30000 | Total reward = 35.62
2022-01-26 14:17:48.079 | DEBUG    | __main__:trials:24 - Trial = 16926/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.080 | DEBUG    | __main__:trials:29 - Trial = 16926/30000 | Total reward = 52.59
2022-01-26 14:17:48.084 | DEBUG    | __main__:trials:24 - Trial = 16927/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.085 | DEBUG    | __main__:trials:29 - Trial = 16927/30000 | Total reward = 51.60
2022-01-26 14:17:48.088 | DEBUG    | __main__:trials:24 - Trial = 16928/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.090 | DEBUG    | __main__:trials:29 - Trial = 16928/30000 | Total reward = 49.68
2022-01-26 14:17:48.094 | DEBUG    | __main__:trials:24 - Trial = 16929/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.095 | DEBUG    | __main__:trials:29 - Trial = 16929/30000 | Total reward = 51.32
2022-01-26 14:17:48.099 | DEBUG    | __main__:trials:24 - Trial = 16930/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.100 | DEBUG    | __main__:trials:29 - Trial = 16930/30000 | Total reward = 39.97
2022-01-26 14:17:48.104 | DEBUG    | __main__:trials:24 - Trial = 16931/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.106 | DEBUG    | __main__:trials:29 - Trial = 16931/30000 | Total reward = 39.67
2022-01-26 14:17:48.110 | DEBUG    | __main__:trials:24 - Trial = 16932/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.111 | DEBUG    | __main__:trials:29 - Trial = 16932/30000 | Total reward = 43.08
2022-01-26 14:17:48.115 | DEBUG    | __main__:trials:24 - Trial = 16933/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.117 | DEBUG    | __main__:trials:29 - Trial = 16933/30000 | Total reward = 46.41
2022-01-26 14:17:48.120 | DEBUG    | __main__:trials:24 - Trial = 16934/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.121 | DEBUG    | __main__:trials:29 - Trial = 16934/30000 | Total reward = 43.12
2022-01-26 14:17:48.125 | DEBUG    | __main__:trials:24 - Trial = 16935/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.127 | DEBUG    | __main__:trials:29 - Trial = 16935/30000 | Total reward = 52.01
2022-01-26 14:17:48.130 | DEBUG    | __main__:trials:24 - Trial = 16936/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.132 | DEBUG    | __main__:trials:29 - Trial = 16936/30000 | Total reward = 58.38
2022-01-26 14:17:48.135 | DEBUG    | __main__:trials:26 - Trial = 16937/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.137 | DEBUG    | __main__:trials:29 - Trial = 16937/30000 | Total reward = 30.41
2022-01-26 14:17:48.140 | DEBUG    | __main__:trials:24 - Trial = 16938/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.142 | DEBUG    | __main__:trials:29 - Trial = 16938/30000 | Total reward = 38.67
2022-01-26 14:17:48.145 | DEBUG    | __main__:trials:24 - Trial = 16939/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.147 | DEBUG    | __main__:trials:29 - Trial = 16939/30000 | Total reward = 43.08
2022-01-26 14:17:48.151 | DEBUG    | __main__:trials:24 - Trial = 16940/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.152 | DEBUG    | __main__:trials:29 - Trial = 16940/30000 | Total reward = 52.01
2022-01-26 14:17:48.156 | DEBUG    | __main__:trials:24 - Trial = 16941/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.157 | DEBUG    | __main__:trials:29 - Trial = 16941/30000 | Total reward = 44.72
2022-01-26 14:17:48.161 | DEBUG    | __main__:trials:24 - Trial = 16942/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.162 | DEBUG    | __main__:trials:29 - Trial = 16942/30000 | Total reward = 62.12
2022-01-26 14:17:48.165 | DEBUG    | __main__:trials:24 - Trial = 16943/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.167 | DEBUG    | __main__:trials:29 - Trial = 16943/30000 | Total reward = 42.14
2022-01-26 14:17:48.172 | DEBUG    | __main__:trials:24 - Trial = 16944/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.173 | DEBUG    | __main__:trials:29 - Trial = 16944/30000 | Total reward = 45.31
2022-01-26 14:17:48.177 | DEBUG    | __main__:trials:24 - Trial = 16945/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.178 | DEBUG    | __main__:trials:29 - Trial = 16945/30000 | Total reward = 50.76
2022-01-26 14:17:48.181 | DEBUG    | __main__:trials:24 - Trial = 16946/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.182 | DEBUG    | __main__:trials:29 - Trial = 16946/30000 | Total reward = 63.47
2022-01-26 14:17:48.185 | DEBUG    | __main__:trials:24 - Trial = 16947/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.187 | DEBUG    | __main__:trials:29 - Trial = 16947/30000 | Total reward = 46.71
2022-01-26 14:17:48.190 | DEBUG    | __main__:trials:24 - Trial = 16948/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.191 | DEBUG    | __main__:trials:29 - Trial = 16948/30000 | Total reward = 43.08
2022-01-26 14:17:48.194 | DEBUG    | __main__:trials:24 - Trial = 16949/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.196 | DEBUG    | __main__:trials:29 - Trial = 16949/30000 | Total reward = 44.31
2022-01-26 14:17:48.200 | DEBUG    | __main__:trials:24 - Trial = 16950/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.201 | DEBUG    | __main__:trials:29 - Trial = 16950/30000 | Total reward = 45.86
2022-01-26 14:17:48.205 | DEBUG    | __main__:trials:24 - Trial = 16951/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.206 | DEBUG    | __main__:trials:29 - Trial = 16951/30000 | Total reward = 28.36
2022-01-26 14:17:48.210 | DEBUG    | __main__:trials:24 - Trial = 16952/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.211 | DEBUG    | __main__:trials:29 - Trial = 16952/30000 | Total reward = 28.44
2022-01-26 14:17:48.215 | DEBUG    | __main__:trials:24 - Trial = 16953/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.217 | DEBUG    | __main__:trials:29 - Trial = 16953/30000 | Total reward = 39.30
2022-01-26 14:17:48.220 | DEBUG    | __main__:trials:24 - Trial = 16954/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.221 | DEBUG    | __main__:trials:29 - Trial = 16954/30000 | Total reward = 57.58
2022-01-26 14:17:48.224 | DEBUG    | __main__:trials:24 - Trial = 16955/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.226 | DEBUG    | __main__:trials:29 - Trial = 16955/30000 | Total reward = 51.86
2022-01-26 14:17:48.229 | DEBUG    | __main__:trials:24 - Trial = 16956/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.230 | DEBUG    | __main__:trials:29 - Trial = 16956/30000 | Total reward = 43.08
2022-01-26 14:17:48.233 | DEBUG    | __main__:trials:24 - Trial = 16957/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.235 | DEBUG    | __main__:trials:29 - Trial = 16957/30000 | Total reward = 33.76
2022-01-26 14:17:48.237 | DEBUG    | __main__:trials:24 - Trial = 16958/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.239 | DEBUG    | __main__:trials:29 - Trial = 16958/30000 | Total reward = 54.89
2022-01-26 14:17:48.242 | DEBUG    | __main__:trials:24 - Trial = 16959/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.243 | DEBUG    | __main__:trials:29 - Trial = 16959/30000 | Total reward = 47.24
2022-01-26 14:17:48.247 | DEBUG    | __main__:trials:24 - Trial = 16960/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.248 | DEBUG    | __main__:trials:29 - Trial = 16960/30000 | Total reward = 41.62
2022-01-26 14:17:48.252 | DEBUG    | __main__:trials:24 - Trial = 16961/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.253 | DEBUG    | __main__:trials:29 - Trial = 16961/30000 | Total reward = 47.36
2022-01-26 14:17:48.257 | DEBUG    | __main__:trials:24 - Trial = 16962/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.258 | DEBUG    | __main__:trials:29 - Trial = 16962/30000 | Total reward = 40.10
2022-01-26 14:17:48.263 | DEBUG    | __main__:trials:24 - Trial = 16963/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.263 | DEBUG    | __main__:trials:29 - Trial = 16963/30000 | Total reward = 52.20
2022-01-26 14:17:48.268 | DEBUG    | __main__:trials:24 - Trial = 16964/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.268 | DEBUG    | __main__:trials:29 - Trial = 16964/30000 | Total reward = 37.19
2022-01-26 14:17:48.273 | DEBUG    | __main__:trials:24 - Trial = 16965/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.274 | DEBUG    | __main__:trials:29 - Trial = 16965/30000 | Total reward = 51.92
2022-01-26 14:17:48.278 | DEBUG    | __main__:trials:24 - Trial = 16966/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.279 | DEBUG    | __main__:trials:29 - Trial = 16966/30000 | Total reward = 52.20
2022-01-26 14:17:48.283 | DEBUG    | __main__:trials:24 - Trial = 16967/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.285 | DEBUG    | __main__:trials:29 - Trial = 16967/30000 | Total reward = 39.71
2022-01-26 14:17:48.288 | DEBUG    | __main__:trials:24 - Trial = 16968/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.290 | DEBUG    | __main__:trials:29 - Trial = 16968/30000 | Total reward = 52.50
2022-01-26 14:17:48.293 | DEBUG    | __main__:trials:24 - Trial = 16969/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.295 | DEBUG    | __main__:trials:29 - Trial = 16969/30000 | Total reward = 56.53
2022-01-26 14:17:48.298 | DEBUG    | __main__:trials:24 - Trial = 16970/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.300 | DEBUG    | __main__:trials:29 - Trial = 16970/30000 | Total reward = 52.50
2022-01-26 14:17:48.304 | DEBUG    | __main__:trials:24 - Trial = 16971/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.304 | DEBUG    | __main__:trials:29 - Trial = 16971/30000 | Total reward = 39.78
2022-01-26 14:17:48.309 | DEBUG    | __main__:trials:24 - Trial = 16972/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.310 | DEBUG    | __main__:trials:29 - Trial = 16972/30000 | Total reward = 46.19
2022-01-26 14:17:48.314 | DEBUG    | __main__:trials:24 - Trial = 16973/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.315 | DEBUG    | __main__:trials:29 - Trial = 16973/30000 | Total reward = 36.81
2022-01-26 14:17:48.319 | DEBUG    | __main__:trials:24 - Trial = 16974/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.319 | DEBUG    | __main__:trials:29 - Trial = 16974/30000 | Total reward = 50.75
2022-01-26 14:17:48.324 | DEBUG    | __main__:trials:24 - Trial = 16975/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.324 | DEBUG    | __main__:trials:29 - Trial = 16975/30000 | Total reward = 54.75
2022-01-26 14:17:48.329 | DEBUG    | __main__:trials:24 - Trial = 16976/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.329 | DEBUG    | __main__:trials:29 - Trial = 16976/30000 | Total reward = 54.95
2022-01-26 14:17:48.334 | DEBUG    | __main__:trials:24 - Trial = 16977/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.335 | DEBUG    | __main__:trials:29 - Trial = 16977/30000 | Total reward = 50.66
2022-01-26 14:17:48.339 | DEBUG    | __main__:trials:24 - Trial = 16978/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.340 | DEBUG    | __main__:trials:29 - Trial = 16978/30000 | Total reward = 40.93
2022-01-26 14:17:48.343 | DEBUG    | __main__:trials:24 - Trial = 16979/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.345 | DEBUG    | __main__:trials:29 - Trial = 16979/30000 | Total reward = 52.82
2022-01-26 14:17:48.349 | DEBUG    | __main__:trials:24 - Trial = 16980/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.350 | DEBUG    | __main__:trials:29 - Trial = 16980/30000 | Total reward = 52.67
2022-01-26 14:17:48.353 | DEBUG    | __main__:trials:24 - Trial = 16981/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.354 | DEBUG    | __main__:trials:29 - Trial = 16981/30000 | Total reward = 56.74
2022-01-26 14:17:48.357 | DEBUG    | __main__:trials:24 - Trial = 16982/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.359 | DEBUG    | __main__:trials:29 - Trial = 16982/30000 | Total reward = 38.55
2022-01-26 14:17:48.362 | DEBUG    | __main__:trials:24 - Trial = 16983/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.364 | DEBUG    | __main__:trials:29 - Trial = 16983/30000 | Total reward = 49.00
2022-01-26 14:17:48.367 | DEBUG    | __main__:trials:24 - Trial = 16984/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.368 | DEBUG    | __main__:trials:29 - Trial = 16984/30000 | Total reward = 49.03
2022-01-26 14:17:48.372 | DEBUG    | __main__:trials:24 - Trial = 16985/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.373 | DEBUG    | __main__:trials:29 - Trial = 16985/30000 | Total reward = 53.37
2022-01-26 14:17:48.377 | DEBUG    | __main__:trials:24 - Trial = 16986/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.378 | DEBUG    | __main__:trials:29 - Trial = 16986/30000 | Total reward = 39.58
2022-01-26 14:17:48.382 | DEBUG    | __main__:trials:24 - Trial = 16987/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.383 | DEBUG    | __main__:trials:29 - Trial = 16987/30000 | Total reward = 56.29
2022-01-26 14:17:48.386 | DEBUG    | __main__:trials:24 - Trial = 16988/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.388 | DEBUG    | __main__:trials:29 - Trial = 16988/30000 | Total reward = 47.11
2022-01-26 14:17:48.392 | DEBUG    | __main__:trials:24 - Trial = 16989/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.393 | DEBUG    | __main__:trials:29 - Trial = 16989/30000 | Total reward = 49.75
2022-01-26 14:17:48.396 | DEBUG    | __main__:trials:24 - Trial = 16990/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.397 | DEBUG    | __main__:trials:29 - Trial = 16990/30000 | Total reward = 41.75
2022-01-26 14:17:48.400 | DEBUG    | __main__:trials:24 - Trial = 16991/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.402 | DEBUG    | __main__:trials:29 - Trial = 16991/30000 | Total reward = 56.43
2022-01-26 14:17:48.405 | DEBUG    | __main__:trials:24 - Trial = 16992/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.406 | DEBUG    | __main__:trials:29 - Trial = 16992/30000 | Total reward = 47.68
2022-01-26 14:17:48.410 | DEBUG    | __main__:trials:24 - Trial = 16993/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.410 | DEBUG    | __main__:trials:29 - Trial = 16993/30000 | Total reward = 45.90
2022-01-26 14:17:48.414 | DEBUG    | __main__:trials:24 - Trial = 16994/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.414 | DEBUG    | __main__:trials:29 - Trial = 16994/30000 | Total reward = 31.86
2022-01-26 14:17:48.418 | DEBUG    | __main__:trials:24 - Trial = 16995/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.420 | DEBUG    | __main__:trials:29 - Trial = 16995/30000 | Total reward = 51.16
2022-01-26 14:17:48.423 | DEBUG    | __main__:trials:24 - Trial = 16996/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.424 | DEBUG    | __main__:trials:29 - Trial = 16996/30000 | Total reward = 58.92
2022-01-26 14:17:48.428 | DEBUG    | __main__:trials:24 - Trial = 16997/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.430 | DEBUG    | __main__:trials:29 - Trial = 16997/30000 | Total reward = 54.06
2022-01-26 14:17:48.433 | DEBUG    | __main__:trials:24 - Trial = 16998/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.435 | DEBUG    | __main__:trials:29 - Trial = 16998/30000 | Total reward = 54.63
2022-01-26 14:17:48.439 | DEBUG    | __main__:trials:24 - Trial = 16999/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.439 | DEBUG    | __main__:trials:29 - Trial = 16999/30000 | Total reward = 43.49
2022-01-26 14:17:48.443 | DEBUG    | __main__:trials:26 - Trial = 17000/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.445 | DEBUG    | __main__:trials:29 - Trial = 17000/30000 | Total reward = 35.54
2022-01-26 14:17:48.448 | DEBUG    | __main__:trials:24 - Trial = 17001/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.450 | DEBUG    | __main__:trials:29 - Trial = 17001/30000 | Total reward = 53.39
2022-01-26 14:17:48.453 | DEBUG    | __main__:trials:24 - Trial = 17002/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.455 | DEBUG    | __main__:trials:29 - Trial = 17002/30000 | Total reward = 48.93
2022-01-26 14:17:48.458 | DEBUG    | __main__:trials:24 - Trial = 17003/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.459 | DEBUG    | __main__:trials:29 - Trial = 17003/30000 | Total reward = 59.52
2022-01-26 14:17:48.463 | DEBUG    | __main__:trials:24 - Trial = 17004/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.465 | DEBUG    | __main__:trials:29 - Trial = 17004/30000 | Total reward = 56.27
2022-01-26 14:17:48.467 | DEBUG    | __main__:trials:24 - Trial = 17005/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.469 | DEBUG    | __main__:trials:29 - Trial = 17005/30000 | Total reward = 54.84
2022-01-26 14:17:48.473 | DEBUG    | __main__:trials:24 - Trial = 17006/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.473 | DEBUG    | __main__:trials:29 - Trial = 17006/30000 | Total reward = 39.98
2022-01-26 14:17:48.478 | DEBUG    | __main__:trials:24 - Trial = 17007/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.480 | DEBUG    | __main__:trials:29 - Trial = 17007/30000 | Total reward = 49.75
2022-01-26 14:17:48.483 | DEBUG    | __main__:trials:24 - Trial = 17008/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.485 | DEBUG    | __main__:trials:29 - Trial = 17008/30000 | Total reward = 54.29
2022-01-26 14:17:48.488 | DEBUG    | __main__:trials:24 - Trial = 17009/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.489 | DEBUG    | __main__:trials:29 - Trial = 17009/30000 | Total reward = 42.08
2022-01-26 14:17:48.492 | DEBUG    | __main__:trials:24 - Trial = 17010/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.493 | DEBUG    | __main__:trials:29 - Trial = 17010/30000 | Total reward = 46.78
2022-01-26 14:17:48.496 | DEBUG    | __main__:trials:24 - Trial = 17011/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.497 | DEBUG    | __main__:trials:29 - Trial = 17011/30000 | Total reward = 43.08
2022-01-26 14:17:48.500 | DEBUG    | __main__:trials:24 - Trial = 17012/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.501 | DEBUG    | __main__:trials:29 - Trial = 17012/30000 | Total reward = 36.59
2022-01-26 14:17:48.504 | DEBUG    | __main__:trials:24 - Trial = 17013/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.505 | DEBUG    | __main__:trials:29 - Trial = 17013/30000 | Total reward = 37.19
2022-01-26 14:17:48.508 | DEBUG    | __main__:trials:24 - Trial = 17014/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.510 | DEBUG    | __main__:trials:29 - Trial = 17014/30000 | Total reward = 57.70
2022-01-26 14:17:48.514 | DEBUG    | __main__:trials:24 - Trial = 17015/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.515 | DEBUG    | __main__:trials:29 - Trial = 17015/30000 | Total reward = 51.52
2022-01-26 14:17:48.519 | DEBUG    | __main__:trials:24 - Trial = 17016/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.520 | DEBUG    | __main__:trials:29 - Trial = 17016/30000 | Total reward = 60.79
2022-01-26 14:17:48.524 | DEBUG    | __main__:trials:24 - Trial = 17017/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.525 | DEBUG    | __main__:trials:29 - Trial = 17017/30000 | Total reward = 39.39
2022-01-26 14:17:48.528 | DEBUG    | __main__:trials:24 - Trial = 17018/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.529 | DEBUG    | __main__:trials:29 - Trial = 17018/30000 | Total reward = 52.86
2022-01-26 14:17:48.534 | DEBUG    | __main__:trials:24 - Trial = 17019/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.535 | DEBUG    | __main__:trials:29 - Trial = 17019/30000 | Total reward = 43.84
2022-01-26 14:17:48.538 | DEBUG    | __main__:trials:24 - Trial = 17020/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.540 | DEBUG    | __main__:trials:29 - Trial = 17020/30000 | Total reward = 44.27
2022-01-26 14:17:48.544 | DEBUG    | __main__:trials:24 - Trial = 17021/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.545 | DEBUG    | __main__:trials:29 - Trial = 17021/30000 | Total reward = 42.08
2022-01-26 14:17:48.549 | DEBUG    | __main__:trials:24 - Trial = 17022/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.549 | DEBUG    | __main__:trials:29 - Trial = 17022/30000 | Total reward = 30.11
2022-01-26 14:17:48.554 | DEBUG    | __main__:trials:24 - Trial = 17023/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.555 | DEBUG    | __main__:trials:29 - Trial = 17023/30000 | Total reward = 42.83
2022-01-26 14:17:48.559 | DEBUG    | __main__:trials:24 - Trial = 17024/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.560 | DEBUG    | __main__:trials:29 - Trial = 17024/30000 | Total reward = 46.01
2022-01-26 14:17:48.564 | DEBUG    | __main__:trials:26 - Trial = 17025/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.565 | DEBUG    | __main__:trials:29 - Trial = 17025/30000 | Total reward = 21.50
2022-01-26 14:17:48.569 | DEBUG    | __main__:trials:24 - Trial = 17026/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.570 | DEBUG    | __main__:trials:29 - Trial = 17026/30000 | Total reward = 49.11
2022-01-26 14:17:48.574 | DEBUG    | __main__:trials:24 - Trial = 17027/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.575 | DEBUG    | __main__:trials:29 - Trial = 17027/30000 | Total reward = 35.73
2022-01-26 14:17:48.579 | DEBUG    | __main__:trials:24 - Trial = 17028/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.581 | DEBUG    | __main__:trials:29 - Trial = 17028/30000 | Total reward = 37.91
2022-01-26 14:17:48.583 | DEBUG    | __main__:trials:24 - Trial = 17029/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.585 | DEBUG    | __main__:trials:29 - Trial = 17029/30000 | Total reward = 38.75
2022-01-26 14:17:48.588 | DEBUG    | __main__:trials:24 - Trial = 17030/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.590 | DEBUG    | __main__:trials:29 - Trial = 17030/30000 | Total reward = 45.99
2022-01-26 14:17:48.593 | DEBUG    | __main__:trials:24 - Trial = 17031/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.594 | DEBUG    | __main__:trials:29 - Trial = 17031/30000 | Total reward = 46.92
2022-01-26 14:17:48.598 | DEBUG    | __main__:trials:24 - Trial = 17032/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.599 | DEBUG    | __main__:trials:29 - Trial = 17032/30000 | Total reward = 38.38
2022-01-26 14:17:48.603 | DEBUG    | __main__:trials:24 - Trial = 17033/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.605 | DEBUG    | __main__:trials:29 - Trial = 17033/30000 | Total reward = 34.62
2022-01-26 14:17:48.608 | DEBUG    | __main__:trials:24 - Trial = 17034/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.610 | DEBUG    | __main__:trials:29 - Trial = 17034/30000 | Total reward = 50.61
2022-01-26 14:17:48.614 | DEBUG    | __main__:trials:24 - Trial = 17035/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.615 | DEBUG    | __main__:trials:29 - Trial = 17035/30000 | Total reward = 42.88
2022-01-26 14:17:48.619 | DEBUG    | __main__:trials:24 - Trial = 17036/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.620 | DEBUG    | __main__:trials:29 - Trial = 17036/30000 | Total reward = 51.16
2022-01-26 14:17:48.623 | DEBUG    | __main__:trials:24 - Trial = 17037/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.625 | DEBUG    | __main__:trials:29 - Trial = 17037/30000 | Total reward = 48.67
2022-01-26 14:17:48.628 | DEBUG    | __main__:trials:24 - Trial = 17038/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.629 | DEBUG    | __main__:trials:29 - Trial = 17038/30000 | Total reward = 46.39
2022-01-26 14:17:48.632 | DEBUG    | __main__:trials:24 - Trial = 17039/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.634 | DEBUG    | __main__:trials:29 - Trial = 17039/30000 | Total reward = 48.20
2022-01-26 14:17:48.637 | DEBUG    | __main__:trials:24 - Trial = 17040/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.638 | DEBUG    | __main__:trials:29 - Trial = 17040/30000 | Total reward = 44.54
2022-01-26 14:17:48.641 | DEBUG    | __main__:trials:26 - Trial = 17041/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.641 | DEBUG    | __main__:trials:29 - Trial = 17041/30000 | Total reward = 23.72
2022-01-26 14:17:48.645 | DEBUG    | __main__:trials:24 - Trial = 17042/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.645 | DEBUG    | __main__:trials:29 - Trial = 17042/30000 | Total reward = 42.22
2022-01-26 14:17:48.650 | DEBUG    | __main__:trials:24 - Trial = 17043/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.651 | DEBUG    | __main__:trials:29 - Trial = 17043/30000 | Total reward = 42.99
2022-01-26 14:17:48.655 | DEBUG    | __main__:trials:24 - Trial = 17044/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.657 | DEBUG    | __main__:trials:29 - Trial = 17044/30000 | Total reward = 43.04
2022-01-26 14:17:48.660 | DEBUG    | __main__:trials:24 - Trial = 17045/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.662 | DEBUG    | __main__:trials:29 - Trial = 17045/30000 | Total reward = 46.82
2022-01-26 14:17:48.666 | DEBUG    | __main__:trials:24 - Trial = 17046/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.667 | DEBUG    | __main__:trials:29 - Trial = 17046/30000 | Total reward = 42.17
2022-01-26 14:17:48.671 | DEBUG    | __main__:trials:24 - Trial = 17047/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.672 | DEBUG    | __main__:trials:29 - Trial = 17047/30000 | Total reward = 42.77
2022-01-26 14:17:48.676 | DEBUG    | __main__:trials:24 - Trial = 17048/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.676 | DEBUG    | __main__:trials:29 - Trial = 17048/30000 | Total reward = 39.57
2022-01-26 14:17:48.681 | DEBUG    | __main__:trials:24 - Trial = 17049/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.682 | DEBUG    | __main__:trials:29 - Trial = 17049/30000 | Total reward = 39.65
2022-01-26 14:17:48.686 | DEBUG    | __main__:trials:26 - Trial = 17050/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.686 | DEBUG    | __main__:trials:29 - Trial = 17050/30000 | Total reward = 34.50
2022-01-26 14:17:48.691 | DEBUG    | __main__:trials:24 - Trial = 17051/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.693 | DEBUG    | __main__:trials:29 - Trial = 17051/30000 | Total reward = 41.89
2022-01-26 14:17:48.696 | DEBUG    | __main__:trials:24 - Trial = 17052/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.697 | DEBUG    | __main__:trials:29 - Trial = 17052/30000 | Total reward = 42.60
2022-01-26 14:17:48.700 | DEBUG    | __main__:trials:24 - Trial = 17053/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.702 | DEBUG    | __main__:trials:29 - Trial = 17053/30000 | Total reward = 43.19
2022-01-26 14:17:48.705 | DEBUG    | __main__:trials:24 - Trial = 17054/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.706 | DEBUG    | __main__:trials:29 - Trial = 17054/30000 | Total reward = 43.19
2022-01-26 14:17:48.709 | DEBUG    | __main__:trials:24 - Trial = 17055/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.711 | DEBUG    | __main__:trials:29 - Trial = 17055/30000 | Total reward = 40.84
2022-01-26 14:17:48.714 | DEBUG    | __main__:trials:24 - Trial = 17056/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.715 | DEBUG    | __main__:trials:29 - Trial = 17056/30000 | Total reward = 43.19
2022-01-26 14:17:48.718 | DEBUG    | __main__:trials:24 - Trial = 17057/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.719 | DEBUG    | __main__:trials:29 - Trial = 17057/30000 | Total reward = 50.44
2022-01-26 14:17:48.722 | DEBUG    | __main__:trials:24 - Trial = 17058/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.723 | DEBUG    | __main__:trials:29 - Trial = 17058/30000 | Total reward = 44.17
2022-01-26 14:17:48.727 | DEBUG    | __main__:trials:24 - Trial = 17059/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.728 | DEBUG    | __main__:trials:29 - Trial = 17059/30000 | Total reward = 56.43
2022-01-26 14:17:48.732 | DEBUG    | __main__:trials:24 - Trial = 17060/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.732 | DEBUG    | __main__:trials:29 - Trial = 17060/30000 | Total reward = 48.94
2022-01-26 14:17:48.736 | DEBUG    | __main__:trials:24 - Trial = 17061/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.738 | DEBUG    | __main__:trials:29 - Trial = 17061/30000 | Total reward = 50.86
2022-01-26 14:17:48.742 | DEBUG    | __main__:trials:24 - Trial = 17062/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.743 | DEBUG    | __main__:trials:29 - Trial = 17062/30000 | Total reward = 37.26
2022-01-26 14:17:48.746 | DEBUG    | __main__:trials:24 - Trial = 17063/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.748 | DEBUG    | __main__:trials:29 - Trial = 17063/30000 | Total reward = 37.70
2022-01-26 14:17:48.750 | DEBUG    | __main__:trials:24 - Trial = 17064/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.752 | DEBUG    | __main__:trials:29 - Trial = 17064/30000 | Total reward = 42.23
2022-01-26 14:17:48.755 | DEBUG    | __main__:trials:24 - Trial = 17065/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.757 | DEBUG    | __main__:trials:29 - Trial = 17065/30000 | Total reward = 42.70
2022-01-26 14:17:48.760 | DEBUG    | __main__:trials:24 - Trial = 17066/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.761 | DEBUG    | __main__:trials:29 - Trial = 17066/30000 | Total reward = 42.26
2022-01-26 14:17:48.765 | DEBUG    | __main__:trials:24 - Trial = 17067/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.766 | DEBUG    | __main__:trials:29 - Trial = 17067/30000 | Total reward = 31.09
2022-01-26 14:17:48.770 | DEBUG    | __main__:trials:24 - Trial = 17068/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.771 | DEBUG    | __main__:trials:29 - Trial = 17068/30000 | Total reward = 48.02
2022-01-26 14:17:48.774 | DEBUG    | __main__:trials:24 - Trial = 17069/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.776 | DEBUG    | __main__:trials:29 - Trial = 17069/30000 | Total reward = 49.28
2022-01-26 14:17:48.780 | DEBUG    | __main__:trials:24 - Trial = 17070/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.780 | DEBUG    | __main__:trials:29 - Trial = 17070/30000 | Total reward = 48.31
2022-01-26 14:17:48.784 | DEBUG    | __main__:trials:24 - Trial = 17071/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.785 | DEBUG    | __main__:trials:29 - Trial = 17071/30000 | Total reward = 48.08
2022-01-26 14:17:48.790 | DEBUG    | __main__:trials:24 - Trial = 17072/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.790 | DEBUG    | __main__:trials:29 - Trial = 17072/30000 | Total reward = 52.82
2022-01-26 14:17:48.795 | DEBUG    | __main__:trials:24 - Trial = 17073/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.797 | DEBUG    | __main__:trials:29 - Trial = 17073/30000 | Total reward = 42.21
2022-01-26 14:17:48.799 | DEBUG    | __main__:trials:24 - Trial = 17074/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.801 | DEBUG    | __main__:trials:29 - Trial = 17074/30000 | Total reward = 41.51
2022-01-26 14:17:48.804 | DEBUG    | __main__:trials:24 - Trial = 17075/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.806 | DEBUG    | __main__:trials:29 - Trial = 17075/30000 | Total reward = 47.69
2022-01-26 14:17:48.809 | DEBUG    | __main__:trials:24 - Trial = 17076/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.810 | DEBUG    | __main__:trials:29 - Trial = 17076/30000 | Total reward = 47.19
2022-01-26 14:17:48.814 | DEBUG    | __main__:trials:24 - Trial = 17077/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.815 | DEBUG    | __main__:trials:29 - Trial = 17077/30000 | Total reward = 48.26
2022-01-26 14:17:48.819 | DEBUG    | __main__:trials:24 - Trial = 17078/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.821 | DEBUG    | __main__:trials:29 - Trial = 17078/30000 | Total reward = 39.80
2022-01-26 14:17:48.824 | DEBUG    | __main__:trials:24 - Trial = 17079/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.826 | DEBUG    | __main__:trials:29 - Trial = 17079/30000 | Total reward = 32.23
2022-01-26 14:17:48.829 | DEBUG    | __main__:trials:24 - Trial = 17080/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.832 | DEBUG    | __main__:trials:29 - Trial = 17080/30000 | Total reward = 40.71
2022-01-26 14:17:48.835 | DEBUG    | __main__:trials:24 - Trial = 17081/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.837 | DEBUG    | __main__:trials:29 - Trial = 17081/30000 | Total reward = 44.69
2022-01-26 14:17:48.840 | DEBUG    | __main__:trials:24 - Trial = 17082/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.841 | DEBUG    | __main__:trials:29 - Trial = 17082/30000 | Total reward = 49.79
2022-01-26 14:17:48.845 | DEBUG    | __main__:trials:24 - Trial = 17083/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.846 | DEBUG    | __main__:trials:29 - Trial = 17083/30000 | Total reward = 47.63
2022-01-26 14:17:48.850 | DEBUG    | __main__:trials:24 - Trial = 17084/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.852 | DEBUG    | __main__:trials:29 - Trial = 17084/30000 | Total reward = 51.04
2022-01-26 14:17:48.856 | DEBUG    | __main__:trials:24 - Trial = 17085/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.856 | DEBUG    | __main__:trials:29 - Trial = 17085/30000 | Total reward = 64.76
2022-01-26 14:17:48.861 | DEBUG    | __main__:trials:24 - Trial = 17086/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.861 | DEBUG    | __main__:trials:29 - Trial = 17086/30000 | Total reward = 51.76
2022-01-26 14:17:48.865 | DEBUG    | __main__:trials:26 - Trial = 17087/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.866 | DEBUG    | __main__:trials:29 - Trial = 17087/30000 | Total reward = 26.83
2022-01-26 14:17:48.869 | DEBUG    | __main__:trials:24 - Trial = 17088/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.870 | DEBUG    | __main__:trials:29 - Trial = 17088/30000 | Total reward = 51.16
2022-01-26 14:17:48.873 | DEBUG    | __main__:trials:24 - Trial = 17089/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.874 | DEBUG    | __main__:trials:29 - Trial = 17089/30000 | Total reward = 31.58
2022-01-26 14:17:48.877 | DEBUG    | __main__:trials:26 - Trial = 17090/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:48.878 | DEBUG    | __main__:trials:29 - Trial = 17090/30000 | Total reward = 27.43
2022-01-26 14:17:48.881 | DEBUG    | __main__:trials:24 - Trial = 17091/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.883 | DEBUG    | __main__:trials:29 - Trial = 17091/30000 | Total reward = 44.18
2022-01-26 14:17:48.887 | DEBUG    | __main__:trials:24 - Trial = 17092/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.888 | DEBUG    | __main__:trials:29 - Trial = 17092/30000 | Total reward = 51.62
2022-01-26 14:17:48.892 | DEBUG    | __main__:trials:24 - Trial = 17093/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.892 | DEBUG    | __main__:trials:29 - Trial = 17093/30000 | Total reward = 53.35
2022-01-26 14:17:48.897 | DEBUG    | __main__:trials:24 - Trial = 17094/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.898 | DEBUG    | __main__:trials:29 - Trial = 17094/30000 | Total reward = 49.09
2022-01-26 14:17:48.901 | DEBUG    | __main__:trials:24 - Trial = 17095/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.902 | DEBUG    | __main__:trials:29 - Trial = 17095/30000 | Total reward = 49.65
2022-01-26 14:17:48.905 | DEBUG    | __main__:trials:24 - Trial = 17096/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.906 | DEBUG    | __main__:trials:29 - Trial = 17096/30000 | Total reward = 48.22
2022-01-26 14:17:48.909 | DEBUG    | __main__:trials:24 - Trial = 17097/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.910 | DEBUG    | __main__:trials:29 - Trial = 17097/30000 | Total reward = 46.01
2022-01-26 14:17:48.913 | DEBUG    | __main__:trials:24 - Trial = 17098/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.914 | DEBUG    | __main__:trials:29 - Trial = 17098/30000 | Total reward = 46.53
2022-01-26 14:17:48.917 | DEBUG    | __main__:trials:24 - Trial = 17099/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.919 | DEBUG    | __main__:trials:29 - Trial = 17099/30000 | Total reward = 42.23
2022-01-26 14:17:48.922 | DEBUG    | __main__:trials:24 - Trial = 17100/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.924 | DEBUG    | __main__:trials:29 - Trial = 17100/30000 | Total reward = 58.75
2022-01-26 14:17:48.927 | DEBUG    | __main__:trials:24 - Trial = 17101/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.928 | DEBUG    | __main__:trials:29 - Trial = 17101/30000 | Total reward = 57.91
2022-01-26 14:17:48.932 | DEBUG    | __main__:trials:24 - Trial = 17102/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.934 | DEBUG    | __main__:trials:29 - Trial = 17102/30000 | Total reward = 37.66
2022-01-26 14:17:48.938 | DEBUG    | __main__:trials:24 - Trial = 17103/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.938 | DEBUG    | __main__:trials:29 - Trial = 17103/30000 | Total reward = 43.04
2022-01-26 14:17:48.942 | DEBUG    | __main__:trials:24 - Trial = 17104/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.944 | DEBUG    | __main__:trials:29 - Trial = 17104/30000 | Total reward = 51.53
2022-01-26 14:17:48.947 | DEBUG    | __main__:trials:24 - Trial = 17105/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.948 | DEBUG    | __main__:trials:29 - Trial = 17105/30000 | Total reward = 51.71
2022-01-26 14:17:48.952 | DEBUG    | __main__:trials:24 - Trial = 17106/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.953 | DEBUG    | __main__:trials:29 - Trial = 17106/30000 | Total reward = 47.46
2022-01-26 14:17:48.957 | DEBUG    | __main__:trials:24 - Trial = 17107/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.958 | DEBUG    | __main__:trials:29 - Trial = 17107/30000 | Total reward = 52.47
2022-01-26 14:17:48.962 | DEBUG    | __main__:trials:24 - Trial = 17108/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.963 | DEBUG    | __main__:trials:29 - Trial = 17108/30000 | Total reward = 39.54
2022-01-26 14:17:48.967 | DEBUG    | __main__:trials:24 - Trial = 17109/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.969 | DEBUG    | __main__:trials:29 - Trial = 17109/30000 | Total reward = 64.98
2022-01-26 14:17:48.972 | DEBUG    | __main__:trials:24 - Trial = 17110/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.974 | DEBUG    | __main__:trials:29 - Trial = 17110/30000 | Total reward = 43.41
2022-01-26 14:17:48.978 | DEBUG    | __main__:trials:24 - Trial = 17111/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.978 | DEBUG    | __main__:trials:29 - Trial = 17111/30000 | Total reward = 50.18
2022-01-26 14:17:48.983 | DEBUG    | __main__:trials:24 - Trial = 17112/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.983 | DEBUG    | __main__:trials:29 - Trial = 17112/30000 | Total reward = 43.94
2022-01-26 14:17:48.987 | DEBUG    | __main__:trials:24 - Trial = 17113/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.989 | DEBUG    | __main__:trials:29 - Trial = 17113/30000 | Total reward = 41.61
2022-01-26 14:17:48.993 | DEBUG    | __main__:trials:24 - Trial = 17114/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.993 | DEBUG    | __main__:trials:29 - Trial = 17114/30000 | Total reward = 44.97
2022-01-26 14:17:48.998 | DEBUG    | __main__:trials:24 - Trial = 17115/30000 | Max number of steps (20) reached
2022-01-26 14:17:48.999 | DEBUG    | __main__:trials:29 - Trial = 17115/30000 | Total reward = 46.55
2022-01-26 14:17:49.003 | DEBUG    | __main__:trials:24 - Trial = 17116/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.004 | DEBUG    | __main__:trials:29 - Trial = 17116/30000 | Total reward = 42.94
2022-01-26 14:17:49.008 | DEBUG    | __main__:trials:24 - Trial = 17117/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.009 | DEBUG    | __main__:trials:29 - Trial = 17117/30000 | Total reward = 50.07
2022-01-26 14:17:49.013 | DEBUG    | __main__:trials:24 - Trial = 17118/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.014 | DEBUG    | __main__:trials:29 - Trial = 17118/30000 | Total reward = 46.02
2022-01-26 14:17:49.018 | DEBUG    | __main__:trials:24 - Trial = 17119/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.020 | DEBUG    | __main__:trials:29 - Trial = 17119/30000 | Total reward = 41.46
2022-01-26 14:17:49.024 | DEBUG    | __main__:trials:24 - Trial = 17120/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.024 | DEBUG    | __main__:trials:29 - Trial = 17120/30000 | Total reward = 45.43
2022-01-26 14:17:49.028 | DEBUG    | __main__:trials:24 - Trial = 17121/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.029 | DEBUG    | __main__:trials:29 - Trial = 17121/30000 | Total reward = 36.61
2022-01-26 14:17:49.034 | DEBUG    | __main__:trials:24 - Trial = 17122/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.035 | DEBUG    | __main__:trials:29 - Trial = 17122/30000 | Total reward = 49.18
2022-01-26 14:17:49.039 | DEBUG    | __main__:trials:24 - Trial = 17123/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.040 | DEBUG    | __main__:trials:29 - Trial = 17123/30000 | Total reward = 61.39
2022-01-26 14:17:49.043 | DEBUG    | __main__:trials:24 - Trial = 17124/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.045 | DEBUG    | __main__:trials:29 - Trial = 17124/30000 | Total reward = 48.59
2022-01-26 14:17:49.048 | DEBUG    | __main__:trials:24 - Trial = 17125/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.050 | DEBUG    | __main__:trials:29 - Trial = 17125/30000 | Total reward = 52.17
2022-01-26 14:17:49.054 | DEBUG    | __main__:trials:24 - Trial = 17126/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.055 | DEBUG    | __main__:trials:29 - Trial = 17126/30000 | Total reward = 46.65
2022-01-26 14:17:49.059 | DEBUG    | __main__:trials:24 - Trial = 17127/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.061 | DEBUG    | __main__:trials:29 - Trial = 17127/30000 | Total reward = 52.03
2022-01-26 14:17:49.064 | DEBUG    | __main__:trials:24 - Trial = 17128/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.065 | DEBUG    | __main__:trials:29 - Trial = 17128/30000 | Total reward = 51.37
2022-01-26 14:17:49.068 | DEBUG    | __main__:trials:24 - Trial = 17129/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.070 | DEBUG    | __main__:trials:29 - Trial = 17129/30000 | Total reward = 43.37
2022-01-26 14:17:49.074 | DEBUG    | __main__:trials:24 - Trial = 17130/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.075 | DEBUG    | __main__:trials:29 - Trial = 17130/30000 | Total reward = 47.23
2022-01-26 14:17:49.078 | DEBUG    | __main__:trials:24 - Trial = 17131/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.079 | DEBUG    | __main__:trials:29 - Trial = 17131/30000 | Total reward = 59.56
2022-01-26 14:17:49.083 | DEBUG    | __main__:trials:24 - Trial = 17132/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.083 | DEBUG    | __main__:trials:29 - Trial = 17132/30000 | Total reward = 34.00
2022-01-26 14:17:49.087 | DEBUG    | __main__:trials:24 - Trial = 17133/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.087 | DEBUG    | __main__:trials:29 - Trial = 17133/30000 | Total reward = 50.78
2022-01-26 14:17:49.091 | DEBUG    | __main__:trials:24 - Trial = 17134/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.093 | DEBUG    | __main__:trials:29 - Trial = 17134/30000 | Total reward = 53.13
2022-01-26 14:17:49.096 | DEBUG    | __main__:trials:24 - Trial = 17135/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.098 | DEBUG    | __main__:trials:29 - Trial = 17135/30000 | Total reward = 52.16
2022-01-26 14:17:49.101 | DEBUG    | __main__:trials:24 - Trial = 17136/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.103 | DEBUG    | __main__:trials:29 - Trial = 17136/30000 | Total reward = 47.24
2022-01-26 14:17:49.107 | DEBUG    | __main__:trials:24 - Trial = 17137/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.107 | DEBUG    | __main__:trials:29 - Trial = 17137/30000 | Total reward = 52.77
2022-01-26 14:17:49.112 | DEBUG    | __main__:trials:24 - Trial = 17138/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.113 | DEBUG    | __main__:trials:29 - Trial = 17138/30000 | Total reward = 33.66
2022-01-26 14:17:49.117 | DEBUG    | __main__:trials:24 - Trial = 17139/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.118 | DEBUG    | __main__:trials:29 - Trial = 17139/30000 | Total reward = 41.42
2022-01-26 14:17:49.123 | DEBUG    | __main__:trials:24 - Trial = 17140/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.124 | DEBUG    | __main__:trials:29 - Trial = 17140/30000 | Total reward = 50.66
2022-01-26 14:17:49.128 | DEBUG    | __main__:trials:24 - Trial = 17141/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.129 | DEBUG    | __main__:trials:29 - Trial = 17141/30000 | Total reward = 54.20
2022-01-26 14:17:49.132 | DEBUG    | __main__:trials:24 - Trial = 17142/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.133 | DEBUG    | __main__:trials:29 - Trial = 17142/30000 | Total reward = 52.14
2022-01-26 14:17:49.138 | DEBUG    | __main__:trials:24 - Trial = 17143/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.138 | DEBUG    | __main__:trials:29 - Trial = 17143/30000 | Total reward = 46.14
2022-01-26 14:17:49.142 | DEBUG    | __main__:trials:24 - Trial = 17144/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.144 | DEBUG    | __main__:trials:29 - Trial = 17144/30000 | Total reward = 52.77
2022-01-26 14:17:49.147 | DEBUG    | __main__:trials:24 - Trial = 17145/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.149 | DEBUG    | __main__:trials:29 - Trial = 17145/30000 | Total reward = 39.25
2022-01-26 14:17:49.152 | DEBUG    | __main__:trials:24 - Trial = 17146/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.153 | DEBUG    | __main__:trials:29 - Trial = 17146/30000 | Total reward = 50.39
2022-01-26 14:17:49.156 | DEBUG    | __main__:trials:24 - Trial = 17147/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.158 | DEBUG    | __main__:trials:29 - Trial = 17147/30000 | Total reward = 59.42
2022-01-26 14:17:49.161 | DEBUG    | __main__:trials:24 - Trial = 17148/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.163 | DEBUG    | __main__:trials:29 - Trial = 17148/30000 | Total reward = 42.58
2022-01-26 14:17:49.166 | DEBUG    | __main__:trials:24 - Trial = 17149/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.168 | DEBUG    | __main__:trials:29 - Trial = 17149/30000 | Total reward = 56.18
2022-01-26 14:17:49.171 | DEBUG    | __main__:trials:24 - Trial = 17150/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.173 | DEBUG    | __main__:trials:29 - Trial = 17150/30000 | Total reward = 43.93
2022-01-26 14:17:49.176 | DEBUG    | __main__:trials:24 - Trial = 17151/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.177 | DEBUG    | __main__:trials:29 - Trial = 17151/30000 | Total reward = 47.38
2022-01-26 14:17:49.181 | DEBUG    | __main__:trials:24 - Trial = 17152/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.182 | DEBUG    | __main__:trials:29 - Trial = 17152/30000 | Total reward = 51.42
2022-01-26 14:17:49.186 | DEBUG    | __main__:trials:24 - Trial = 17153/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.186 | DEBUG    | __main__:trials:29 - Trial = 17153/30000 | Total reward = 46.82
2022-01-26 14:17:49.191 | DEBUG    | __main__:trials:24 - Trial = 17154/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.192 | DEBUG    | __main__:trials:29 - Trial = 17154/30000 | Total reward = 52.80
2022-01-26 14:17:49.196 | DEBUG    | __main__:trials:24 - Trial = 17155/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.198 | DEBUG    | __main__:trials:29 - Trial = 17155/30000 | Total reward = 53.93
2022-01-26 14:17:49.202 | DEBUG    | __main__:trials:24 - Trial = 17156/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.203 | DEBUG    | __main__:trials:29 - Trial = 17156/30000 | Total reward = 49.15
2022-01-26 14:17:49.207 | DEBUG    | __main__:trials:24 - Trial = 17157/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.209 | DEBUG    | __main__:trials:29 - Trial = 17157/30000 | Total reward = 42.68
2022-01-26 14:17:49.212 | DEBUG    | __main__:trials:24 - Trial = 17158/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.214 | DEBUG    | __main__:trials:29 - Trial = 17158/30000 | Total reward = 49.47
2022-01-26 14:17:49.218 | DEBUG    | __main__:trials:24 - Trial = 17159/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.218 | DEBUG    | __main__:trials:29 - Trial = 17159/30000 | Total reward = 47.78
2022-01-26 14:17:49.222 | DEBUG    | __main__:trials:24 - Trial = 17160/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.224 | DEBUG    | __main__:trials:29 - Trial = 17160/30000 | Total reward = 54.59
2022-01-26 14:17:49.228 | DEBUG    | __main__:trials:24 - Trial = 17161/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.229 | DEBUG    | __main__:trials:29 - Trial = 17161/30000 | Total reward = 42.23
2022-01-26 14:17:49.232 | DEBUG    | __main__:trials:24 - Trial = 17162/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.233 | DEBUG    | __main__:trials:29 - Trial = 17162/30000 | Total reward = 47.60
2022-01-26 14:17:49.236 | DEBUG    | __main__:trials:24 - Trial = 17163/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.238 | DEBUG    | __main__:trials:29 - Trial = 17163/30000 | Total reward = 43.80
2022-01-26 14:17:49.241 | DEBUG    | __main__:trials:24 - Trial = 17164/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.242 | DEBUG    | __main__:trials:29 - Trial = 17164/30000 | Total reward = 48.01
2022-01-26 14:17:49.245 | DEBUG    | __main__:trials:24 - Trial = 17165/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.246 | DEBUG    | __main__:trials:29 - Trial = 17165/30000 | Total reward = 51.07
2022-01-26 14:17:49.249 | DEBUG    | __main__:trials:24 - Trial = 17166/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.251 | DEBUG    | __main__:trials:29 - Trial = 17166/30000 | Total reward = 40.59
2022-01-26 14:17:49.255 | DEBUG    | __main__:trials:24 - Trial = 17167/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.256 | DEBUG    | __main__:trials:29 - Trial = 17167/30000 | Total reward = 46.55
2022-01-26 14:17:49.260 | DEBUG    | __main__:trials:24 - Trial = 17168/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.261 | DEBUG    | __main__:trials:29 - Trial = 17168/30000 | Total reward = 51.89
2022-01-26 14:17:49.265 | DEBUG    | __main__:trials:24 - Trial = 17169/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.266 | DEBUG    | __main__:trials:29 - Trial = 17169/30000 | Total reward = 44.98
2022-01-26 14:17:49.269 | DEBUG    | __main__:trials:24 - Trial = 17170/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.270 | DEBUG    | __main__:trials:29 - Trial = 17170/30000 | Total reward = 50.60
2022-01-26 14:17:49.274 | DEBUG    | __main__:trials:24 - Trial = 17171/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.274 | DEBUG    | __main__:trials:29 - Trial = 17171/30000 | Total reward = 37.31
2022-01-26 14:17:49.278 | DEBUG    | __main__:trials:24 - Trial = 17172/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.278 | DEBUG    | __main__:trials:29 - Trial = 17172/30000 | Total reward = 36.28
2022-01-26 14:17:49.282 | DEBUG    | __main__:trials:24 - Trial = 17173/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.284 | DEBUG    | __main__:trials:29 - Trial = 17173/30000 | Total reward = 51.89
2022-01-26 14:17:49.287 | DEBUG    | __main__:trials:24 - Trial = 17174/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.289 | DEBUG    | __main__:trials:29 - Trial = 17174/30000 | Total reward = 52.76
2022-01-26 14:17:49.292 | DEBUG    | __main__:trials:24 - Trial = 17175/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.293 | DEBUG    | __main__:trials:29 - Trial = 17175/30000 | Total reward = 49.09
2022-01-26 14:17:49.296 | DEBUG    | __main__:trials:24 - Trial = 17176/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.298 | DEBUG    | __main__:trials:29 - Trial = 17176/30000 | Total reward = 51.00
2022-01-26 14:17:49.301 | DEBUG    | __main__:trials:24 - Trial = 17177/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.302 | DEBUG    | __main__:trials:29 - Trial = 17177/30000 | Total reward = 41.23
2022-01-26 14:17:49.305 | DEBUG    | __main__:trials:24 - Trial = 17178/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.307 | DEBUG    | __main__:trials:29 - Trial = 17178/30000 | Total reward = 46.53
2022-01-26 14:17:49.311 | DEBUG    | __main__:trials:24 - Trial = 17179/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.312 | DEBUG    | __main__:trials:29 - Trial = 17179/30000 | Total reward = 38.72
2022-01-26 14:17:49.316 | DEBUG    | __main__:trials:24 - Trial = 17180/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.316 | DEBUG    | __main__:trials:29 - Trial = 17180/30000 | Total reward = 58.38
2022-01-26 14:17:49.320 | DEBUG    | __main__:trials:24 - Trial = 17181/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.322 | DEBUG    | __main__:trials:29 - Trial = 17181/30000 | Total reward = 55.25
2022-01-26 14:17:49.325 | DEBUG    | __main__:trials:24 - Trial = 17182/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.326 | DEBUG    | __main__:trials:29 - Trial = 17182/30000 | Total reward = 58.88
2022-01-26 14:17:49.329 | DEBUG    | __main__:trials:24 - Trial = 17183/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.329 | DEBUG    | __main__:trials:29 - Trial = 17183/30000 | Total reward = 43.60
2022-01-26 14:17:49.333 | DEBUG    | __main__:trials:24 - Trial = 17184/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.335 | DEBUG    | __main__:trials:29 - Trial = 17184/30000 | Total reward = 43.18
2022-01-26 14:17:49.338 | DEBUG    | __main__:trials:24 - Trial = 17185/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.339 | DEBUG    | __main__:trials:29 - Trial = 17185/30000 | Total reward = 58.76
2022-01-26 14:17:49.343 | DEBUG    | __main__:trials:24 - Trial = 17186/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.344 | DEBUG    | __main__:trials:29 - Trial = 17186/30000 | Total reward = 40.20
2022-01-26 14:17:49.348 | DEBUG    | __main__:trials:24 - Trial = 17187/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.349 | DEBUG    | __main__:trials:29 - Trial = 17187/30000 | Total reward = 45.85
2022-01-26 14:17:49.353 | DEBUG    | __main__:trials:24 - Trial = 17188/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.353 | DEBUG    | __main__:trials:29 - Trial = 17188/30000 | Total reward = 45.19
2022-01-26 14:17:49.357 | DEBUG    | __main__:trials:24 - Trial = 17189/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.358 | DEBUG    | __main__:trials:29 - Trial = 17189/30000 | Total reward = 44.47
2022-01-26 14:17:49.361 | DEBUG    | __main__:trials:24 - Trial = 17190/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.363 | DEBUG    | __main__:trials:29 - Trial = 17190/30000 | Total reward = 42.90
2022-01-26 14:17:49.366 | DEBUG    | __main__:trials:24 - Trial = 17191/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.367 | DEBUG    | __main__:trials:29 - Trial = 17191/30000 | Total reward = 36.81
2022-01-26 14:17:49.371 | DEBUG    | __main__:trials:24 - Trial = 17192/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.372 | DEBUG    | __main__:trials:29 - Trial = 17192/30000 | Total reward = 35.30
2022-01-26 14:17:49.376 | DEBUG    | __main__:trials:24 - Trial = 17193/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.377 | DEBUG    | __main__:trials:29 - Trial = 17193/30000 | Total reward = 45.19
2022-01-26 14:17:49.380 | DEBUG    | __main__:trials:24 - Trial = 17194/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.382 | DEBUG    | __main__:trials:29 - Trial = 17194/30000 | Total reward = 43.16
2022-01-26 14:17:49.385 | DEBUG    | __main__:trials:24 - Trial = 17195/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.386 | DEBUG    | __main__:trials:29 - Trial = 17195/30000 | Total reward = 35.08
2022-01-26 14:17:49.390 | DEBUG    | __main__:trials:24 - Trial = 17196/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.391 | DEBUG    | __main__:trials:29 - Trial = 17196/30000 | Total reward = 37.30
2022-01-26 14:17:49.395 | DEBUG    | __main__:trials:24 - Trial = 17197/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.396 | DEBUG    | __main__:trials:29 - Trial = 17197/30000 | Total reward = 48.44
2022-01-26 14:17:49.399 | DEBUG    | __main__:trials:24 - Trial = 17198/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.401 | DEBUG    | __main__:trials:29 - Trial = 17198/30000 | Total reward = 33.97
2022-01-26 14:17:49.404 | DEBUG    | __main__:trials:24 - Trial = 17199/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.406 | DEBUG    | __main__:trials:29 - Trial = 17199/30000 | Total reward = 46.66
2022-01-26 14:17:49.409 | DEBUG    | __main__:trials:24 - Trial = 17200/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.410 | DEBUG    | __main__:trials:29 - Trial = 17200/30000 | Total reward = 49.39
2022-01-26 14:17:49.413 | DEBUG    | __main__:trials:24 - Trial = 17201/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.415 | DEBUG    | __main__:trials:29 - Trial = 17201/30000 | Total reward = 31.97
2022-01-26 14:17:49.418 | DEBUG    | __main__:trials:24 - Trial = 17202/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.420 | DEBUG    | __main__:trials:29 - Trial = 17202/30000 | Total reward = 40.81
2022-01-26 14:17:49.423 | DEBUG    | __main__:trials:24 - Trial = 17203/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.425 | DEBUG    | __main__:trials:29 - Trial = 17203/30000 | Total reward = 38.74
2022-01-26 14:17:49.428 | DEBUG    | __main__:trials:24 - Trial = 17204/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.429 | DEBUG    | __main__:trials:29 - Trial = 17204/30000 | Total reward = 54.82
2022-01-26 14:17:49.433 | DEBUG    | __main__:trials:24 - Trial = 17205/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.434 | DEBUG    | __main__:trials:29 - Trial = 17205/30000 | Total reward = 56.04
2022-01-26 14:17:49.437 | DEBUG    | __main__:trials:24 - Trial = 17206/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.438 | DEBUG    | __main__:trials:29 - Trial = 17206/30000 | Total reward = 44.22
2022-01-26 14:17:49.441 | DEBUG    | __main__:trials:24 - Trial = 17207/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.443 | DEBUG    | __main__:trials:29 - Trial = 17207/30000 | Total reward = 27.77
2022-01-26 14:17:49.447 | DEBUG    | __main__:trials:24 - Trial = 17208/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.447 | DEBUG    | __main__:trials:29 - Trial = 17208/30000 | Total reward = 34.16
2022-01-26 14:17:49.451 | DEBUG    | __main__:trials:24 - Trial = 17209/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.453 | DEBUG    | __main__:trials:29 - Trial = 17209/30000 | Total reward = 47.62
2022-01-26 14:17:49.456 | DEBUG    | __main__:trials:24 - Trial = 17210/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.457 | DEBUG    | __main__:trials:29 - Trial = 17210/30000 | Total reward = 34.34
2022-01-26 14:17:49.460 | DEBUG    | __main__:trials:24 - Trial = 17211/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.462 | DEBUG    | __main__:trials:29 - Trial = 17211/30000 | Total reward = 32.06
2022-01-26 14:17:49.465 | DEBUG    | __main__:trials:24 - Trial = 17212/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.466 | DEBUG    | __main__:trials:29 - Trial = 17212/30000 | Total reward = 46.32
2022-01-26 14:17:49.469 | DEBUG    | __main__:trials:26 - Trial = 17213/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:49.470 | DEBUG    | __main__:trials:29 - Trial = 17213/30000 | Total reward = 19.28
2022-01-26 14:17:49.473 | DEBUG    | __main__:trials:24 - Trial = 17214/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.474 | DEBUG    | __main__:trials:29 - Trial = 17214/30000 | Total reward = 43.47
2022-01-26 14:17:49.478 | DEBUG    | __main__:trials:24 - Trial = 17215/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.479 | DEBUG    | __main__:trials:29 - Trial = 17215/30000 | Total reward = 64.27
2022-01-26 14:17:49.483 | DEBUG    | __main__:trials:24 - Trial = 17216/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.484 | DEBUG    | __main__:trials:29 - Trial = 17216/30000 | Total reward = 49.85
2022-01-26 14:17:49.488 | DEBUG    | __main__:trials:24 - Trial = 17217/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.489 | DEBUG    | __main__:trials:29 - Trial = 17217/30000 | Total reward = 43.82
2022-01-26 14:17:49.492 | DEBUG    | __main__:trials:24 - Trial = 17218/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.493 | DEBUG    | __main__:trials:29 - Trial = 17218/30000 | Total reward = 66.21
2022-01-26 14:17:49.496 | DEBUG    | __main__:trials:24 - Trial = 17219/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.498 | DEBUG    | __main__:trials:29 - Trial = 17219/30000 | Total reward = 49.11
2022-01-26 14:17:49.501 | DEBUG    | __main__:trials:24 - Trial = 17220/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.503 | DEBUG    | __main__:trials:29 - Trial = 17220/30000 | Total reward = 44.62
2022-01-26 14:17:49.506 | DEBUG    | __main__:trials:24 - Trial = 17221/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.507 | DEBUG    | __main__:trials:29 - Trial = 17221/30000 | Total reward = 40.53
2022-01-26 14:17:49.511 | DEBUG    | __main__:trials:24 - Trial = 17222/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.512 | DEBUG    | __main__:trials:29 - Trial = 17222/30000 | Total reward = 38.38
2022-01-26 14:17:49.515 | DEBUG    | __main__:trials:24 - Trial = 17223/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.517 | DEBUG    | __main__:trials:29 - Trial = 17223/30000 | Total reward = 43.19
2022-01-26 14:17:49.520 | DEBUG    | __main__:trials:24 - Trial = 17224/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.521 | DEBUG    | __main__:trials:29 - Trial = 17224/30000 | Total reward = 40.20
2022-01-26 14:17:49.525 | DEBUG    | __main__:trials:24 - Trial = 17225/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.526 | DEBUG    | __main__:trials:29 - Trial = 17225/30000 | Total reward = 53.87
2022-01-26 14:17:49.529 | DEBUG    | __main__:trials:24 - Trial = 17226/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.530 | DEBUG    | __main__:trials:29 - Trial = 17226/30000 | Total reward = 45.67
2022-01-26 14:17:49.533 | DEBUG    | __main__:trials:24 - Trial = 17227/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.534 | DEBUG    | __main__:trials:29 - Trial = 17227/30000 | Total reward = 47.02
2022-01-26 14:17:49.537 | DEBUG    | __main__:trials:24 - Trial = 17228/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.538 | DEBUG    | __main__:trials:29 - Trial = 17228/30000 | Total reward = 42.09
2022-01-26 14:17:49.542 | DEBUG    | __main__:trials:24 - Trial = 17229/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.543 | DEBUG    | __main__:trials:29 - Trial = 17229/30000 | Total reward = 40.97
2022-01-26 14:17:49.547 | DEBUG    | __main__:trials:24 - Trial = 17230/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.547 | DEBUG    | __main__:trials:29 - Trial = 17230/30000 | Total reward = 55.91
2022-01-26 14:17:49.551 | DEBUG    | __main__:trials:24 - Trial = 17231/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.551 | DEBUG    | __main__:trials:29 - Trial = 17231/30000 | Total reward = 42.67
2022-01-26 14:17:49.555 | DEBUG    | __main__:trials:24 - Trial = 17232/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.557 | DEBUG    | __main__:trials:29 - Trial = 17232/30000 | Total reward = 51.75
2022-01-26 14:17:49.560 | DEBUG    | __main__:trials:24 - Trial = 17233/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.561 | DEBUG    | __main__:trials:29 - Trial = 17233/30000 | Total reward = 44.09
2022-01-26 14:17:49.565 | DEBUG    | __main__:trials:24 - Trial = 17234/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.565 | DEBUG    | __main__:trials:29 - Trial = 17234/30000 | Total reward = 22.40
2022-01-26 14:17:49.569 | DEBUG    | __main__:trials:24 - Trial = 17235/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.570 | DEBUG    | __main__:trials:29 - Trial = 17235/30000 | Total reward = 36.46
2022-01-26 14:17:49.573 | DEBUG    | __main__:trials:24 - Trial = 17236/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.574 | DEBUG    | __main__:trials:29 - Trial = 17236/30000 | Total reward = 47.26
2022-01-26 14:17:49.577 | DEBUG    | __main__:trials:24 - Trial = 17237/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.578 | DEBUG    | __main__:trials:29 - Trial = 17237/30000 | Total reward = 33.53
2022-01-26 14:17:49.581 | DEBUG    | __main__:trials:24 - Trial = 17238/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.583 | DEBUG    | __main__:trials:29 - Trial = 17238/30000 | Total reward = 46.43
2022-01-26 14:17:49.587 | DEBUG    | __main__:trials:24 - Trial = 17239/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.588 | DEBUG    | __main__:trials:29 - Trial = 17239/30000 | Total reward = 59.46
2022-01-26 14:17:49.592 | DEBUG    | __main__:trials:24 - Trial = 17240/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.593 | DEBUG    | __main__:trials:29 - Trial = 17240/30000 | Total reward = 48.28
2022-01-26 14:17:49.596 | DEBUG    | __main__:trials:24 - Trial = 17241/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.598 | DEBUG    | __main__:trials:29 - Trial = 17241/30000 | Total reward = 48.60
2022-01-26 14:17:49.602 | DEBUG    | __main__:trials:24 - Trial = 17242/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.604 | DEBUG    | __main__:trials:29 - Trial = 17242/30000 | Total reward = 40.63
2022-01-26 14:17:49.608 | DEBUG    | __main__:trials:24 - Trial = 17243/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.609 | DEBUG    | __main__:trials:29 - Trial = 17243/30000 | Total reward = 36.92
2022-01-26 14:17:49.613 | DEBUG    | __main__:trials:24 - Trial = 17244/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.615 | DEBUG    | __main__:trials:29 - Trial = 17244/30000 | Total reward = 49.81
2022-01-26 14:17:49.618 | DEBUG    | __main__:trials:24 - Trial = 17245/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.619 | DEBUG    | __main__:trials:29 - Trial = 17245/30000 | Total reward = 49.15
2022-01-26 14:17:49.623 | DEBUG    | __main__:trials:24 - Trial = 17246/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.625 | DEBUG    | __main__:trials:29 - Trial = 17246/30000 | Total reward = 40.35
2022-01-26 14:17:49.628 | DEBUG    | __main__:trials:24 - Trial = 17247/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.630 | DEBUG    | __main__:trials:29 - Trial = 17247/30000 | Total reward = 60.82
2022-01-26 14:17:49.633 | DEBUG    | __main__:trials:24 - Trial = 17248/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.635 | DEBUG    | __main__:trials:29 - Trial = 17248/30000 | Total reward = 46.44
2022-01-26 14:17:49.638 | DEBUG    | __main__:trials:24 - Trial = 17249/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.640 | DEBUG    | __main__:trials:29 - Trial = 17249/30000 | Total reward = 50.13
2022-01-26 14:17:49.643 | DEBUG    | __main__:trials:24 - Trial = 17250/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.644 | DEBUG    | __main__:trials:29 - Trial = 17250/30000 | Total reward = 36.78
2022-01-26 14:17:49.647 | DEBUG    | __main__:trials:24 - Trial = 17251/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.649 | DEBUG    | __main__:trials:29 - Trial = 17251/30000 | Total reward = 44.39
2022-01-26 14:17:49.653 | DEBUG    | __main__:trials:24 - Trial = 17252/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.655 | DEBUG    | __main__:trials:29 - Trial = 17252/30000 | Total reward = 37.05
2022-01-26 14:17:49.658 | DEBUG    | __main__:trials:24 - Trial = 17253/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.660 | DEBUG    | __main__:trials:29 - Trial = 17253/30000 | Total reward = 43.96
2022-01-26 14:17:49.663 | DEBUG    | __main__:trials:24 - Trial = 17254/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.665 | DEBUG    | __main__:trials:29 - Trial = 17254/30000 | Total reward = 46.17
2022-01-26 14:17:49.669 | DEBUG    | __main__:trials:24 - Trial = 17255/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.669 | DEBUG    | __main__:trials:29 - Trial = 17255/30000 | Total reward = 55.52
2022-01-26 14:17:49.674 | DEBUG    | __main__:trials:24 - Trial = 17256/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.675 | DEBUG    | __main__:trials:29 - Trial = 17256/30000 | Total reward = 47.11
2022-01-26 14:17:49.678 | DEBUG    | __main__:trials:24 - Trial = 17257/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.680 | DEBUG    | __main__:trials:29 - Trial = 17257/30000 | Total reward = 44.22
2022-01-26 14:17:49.684 | DEBUG    | __main__:trials:24 - Trial = 17258/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.686 | DEBUG    | __main__:trials:29 - Trial = 17258/30000 | Total reward = 42.25
2022-01-26 14:17:49.689 | DEBUG    | __main__:trials:24 - Trial = 17259/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.691 | DEBUG    | __main__:trials:29 - Trial = 17259/30000 | Total reward = 43.19
2022-01-26 14:17:49.694 | DEBUG    | __main__:trials:24 - Trial = 17260/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.696 | DEBUG    | __main__:trials:29 - Trial = 17260/30000 | Total reward = 34.94
2022-01-26 14:17:49.700 | DEBUG    | __main__:trials:24 - Trial = 17261/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.702 | DEBUG    | __main__:trials:29 - Trial = 17261/30000 | Total reward = 55.25
2022-01-26 14:17:49.705 | DEBUG    | __main__:trials:24 - Trial = 17262/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.707 | DEBUG    | __main__:trials:29 - Trial = 17262/30000 | Total reward = 45.88
2022-01-26 14:17:49.710 | DEBUG    | __main__:trials:24 - Trial = 17263/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.712 | DEBUG    | __main__:trials:29 - Trial = 17263/30000 | Total reward = 44.92
2022-01-26 14:17:49.715 | DEBUG    | __main__:trials:24 - Trial = 17264/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.717 | DEBUG    | __main__:trials:29 - Trial = 17264/30000 | Total reward = 50.31
2022-01-26 14:17:49.720 | DEBUG    | __main__:trials:24 - Trial = 17265/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.722 | DEBUG    | __main__:trials:29 - Trial = 17265/30000 | Total reward = 50.89
2022-01-26 14:17:49.726 | DEBUG    | __main__:trials:24 - Trial = 17266/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.726 | DEBUG    | __main__:trials:29 - Trial = 17266/30000 | Total reward = 40.52
2022-01-26 14:17:49.730 | DEBUG    | __main__:trials:24 - Trial = 17267/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.732 | DEBUG    | __main__:trials:29 - Trial = 17267/30000 | Total reward = 43.34
2022-01-26 14:17:49.735 | DEBUG    | __main__:trials:24 - Trial = 17268/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.737 | DEBUG    | __main__:trials:29 - Trial = 17268/30000 | Total reward = 57.04
2022-01-26 14:17:49.740 | DEBUG    | __main__:trials:24 - Trial = 17269/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.742 | DEBUG    | __main__:trials:29 - Trial = 17269/30000 | Total reward = 46.95
2022-01-26 14:17:49.745 | DEBUG    | __main__:trials:24 - Trial = 17270/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.747 | DEBUG    | __main__:trials:29 - Trial = 17270/30000 | Total reward = 45.11
2022-01-26 14:17:49.751 | DEBUG    | __main__:trials:24 - Trial = 17271/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.752 | DEBUG    | __main__:trials:29 - Trial = 17271/30000 | Total reward = 12.47
2022-01-26 14:17:49.756 | DEBUG    | __main__:trials:24 - Trial = 17272/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.757 | DEBUG    | __main__:trials:29 - Trial = 17272/30000 | Total reward = 44.22
2022-01-26 14:17:49.761 | DEBUG    | __main__:trials:24 - Trial = 17273/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.762 | DEBUG    | __main__:trials:29 - Trial = 17273/30000 | Total reward = 44.22
2022-01-26 14:17:49.766 | DEBUG    | __main__:trials:24 - Trial = 17274/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.767 | DEBUG    | __main__:trials:29 - Trial = 17274/30000 | Total reward = 55.55
2022-01-26 14:17:49.771 | DEBUG    | __main__:trials:24 - Trial = 17275/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.773 | DEBUG    | __main__:trials:29 - Trial = 17275/30000 | Total reward = 32.15
2022-01-26 14:17:49.776 | DEBUG    | __main__:trials:24 - Trial = 17276/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.778 | DEBUG    | __main__:trials:29 - Trial = 17276/30000 | Total reward = 37.03
2022-01-26 14:17:49.782 | DEBUG    | __main__:trials:24 - Trial = 17277/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.783 | DEBUG    | __main__:trials:29 - Trial = 17277/30000 | Total reward = 45.28
2022-01-26 14:17:49.787 | DEBUG    | __main__:trials:24 - Trial = 17278/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.787 | DEBUG    | __main__:trials:29 - Trial = 17278/30000 | Total reward = 52.49
2022-01-26 14:17:49.792 | DEBUG    | __main__:trials:24 - Trial = 17279/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.792 | DEBUG    | __main__:trials:29 - Trial = 17279/30000 | Total reward = 47.78
2022-01-26 14:17:49.797 | DEBUG    | __main__:trials:24 - Trial = 17280/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.798 | DEBUG    | __main__:trials:29 - Trial = 17280/30000 | Total reward = 51.83
2022-01-26 14:17:49.802 | DEBUG    | __main__:trials:24 - Trial = 17281/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.803 | DEBUG    | __main__:trials:29 - Trial = 17281/30000 | Total reward = 27.38
2022-01-26 14:17:49.807 | DEBUG    | __main__:trials:24 - Trial = 17282/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.808 | DEBUG    | __main__:trials:29 - Trial = 17282/30000 | Total reward = 45.75
2022-01-26 14:17:49.812 | DEBUG    | __main__:trials:24 - Trial = 17283/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.813 | DEBUG    | __main__:trials:29 - Trial = 17283/30000 | Total reward = 45.73
2022-01-26 14:17:49.817 | DEBUG    | __main__:trials:24 - Trial = 17284/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.819 | DEBUG    | __main__:trials:29 - Trial = 17284/30000 | Total reward = 44.80
2022-01-26 14:17:49.822 | DEBUG    | __main__:trials:26 - Trial = 17285/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:49.823 | DEBUG    | __main__:trials:29 - Trial = 17285/30000 | Total reward = 25.17
2022-01-26 14:17:49.827 | DEBUG    | __main__:trials:24 - Trial = 17286/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.828 | DEBUG    | __main__:trials:29 - Trial = 17286/30000 | Total reward = 43.86
2022-01-26 14:17:49.832 | DEBUG    | __main__:trials:24 - Trial = 17287/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.833 | DEBUG    | __main__:trials:29 - Trial = 17287/30000 | Total reward = 39.01
2022-01-26 14:17:49.837 | DEBUG    | __main__:trials:24 - Trial = 17288/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.838 | DEBUG    | __main__:trials:29 - Trial = 17288/30000 | Total reward = 58.06
2022-01-26 14:17:49.842 | DEBUG    | __main__:trials:24 - Trial = 17289/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.844 | DEBUG    | __main__:trials:29 - Trial = 17289/30000 | Total reward = 43.89
2022-01-26 14:17:49.847 | DEBUG    | __main__:trials:24 - Trial = 17290/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.849 | DEBUG    | __main__:trials:29 - Trial = 17290/30000 | Total reward = 50.24
2022-01-26 14:17:49.852 | DEBUG    | __main__:trials:24 - Trial = 17291/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.853 | DEBUG    | __main__:trials:29 - Trial = 17291/30000 | Total reward = 27.92
2022-01-26 14:17:49.857 | DEBUG    | __main__:trials:24 - Trial = 17292/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.859 | DEBUG    | __main__:trials:29 - Trial = 17292/30000 | Total reward = 52.64
2022-01-26 14:17:49.862 | DEBUG    | __main__:trials:26 - Trial = 17293/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:49.863 | DEBUG    | __main__:trials:29 - Trial = 17293/30000 | Total reward = 27.86
2022-01-26 14:17:49.867 | DEBUG    | __main__:trials:24 - Trial = 17294/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.868 | DEBUG    | __main__:trials:29 - Trial = 17294/30000 | Total reward = 48.49
2022-01-26 14:17:49.871 | DEBUG    | __main__:trials:24 - Trial = 17295/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.873 | DEBUG    | __main__:trials:29 - Trial = 17295/30000 | Total reward = 37.58
2022-01-26 14:17:49.876 | DEBUG    | __main__:trials:24 - Trial = 17296/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.878 | DEBUG    | __main__:trials:29 - Trial = 17296/30000 | Total reward = 48.88
2022-01-26 14:17:49.881 | DEBUG    | __main__:trials:24 - Trial = 17297/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.882 | DEBUG    | __main__:trials:29 - Trial = 17297/30000 | Total reward = 51.83
2022-01-26 14:17:49.886 | DEBUG    | __main__:trials:24 - Trial = 17298/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.888 | DEBUG    | __main__:trials:29 - Trial = 17298/30000 | Total reward = 57.89
2022-01-26 14:17:49.890 | DEBUG    | __main__:trials:24 - Trial = 17299/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.892 | DEBUG    | __main__:trials:29 - Trial = 17299/30000 | Total reward = 55.65
2022-01-26 14:17:49.896 | DEBUG    | __main__:trials:24 - Trial = 17300/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.897 | DEBUG    | __main__:trials:29 - Trial = 17300/30000 | Total reward = 46.69
2022-01-26 14:17:49.900 | DEBUG    | __main__:trials:24 - Trial = 17301/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.902 | DEBUG    | __main__:trials:29 - Trial = 17301/30000 | Total reward = 44.78
2022-01-26 14:17:49.905 | DEBUG    | __main__:trials:24 - Trial = 17302/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.907 | DEBUG    | __main__:trials:29 - Trial = 17302/30000 | Total reward = 51.37
2022-01-26 14:17:49.910 | DEBUG    | __main__:trials:24 - Trial = 17303/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.911 | DEBUG    | __main__:trials:29 - Trial = 17303/30000 | Total reward = 40.50
2022-01-26 14:17:49.916 | DEBUG    | __main__:trials:24 - Trial = 17304/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.917 | DEBUG    | __main__:trials:29 - Trial = 17304/30000 | Total reward = 47.57
2022-01-26 14:17:49.921 | DEBUG    | __main__:trials:24 - Trial = 17305/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.921 | DEBUG    | __main__:trials:29 - Trial = 17305/30000 | Total reward = 51.62
2022-01-26 14:17:49.926 | DEBUG    | __main__:trials:24 - Trial = 17306/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.927 | DEBUG    | __main__:trials:29 - Trial = 17306/30000 | Total reward = 49.94
2022-01-26 14:17:49.930 | DEBUG    | __main__:trials:24 - Trial = 17307/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.932 | DEBUG    | __main__:trials:29 - Trial = 17307/30000 | Total reward = 51.17
2022-01-26 14:17:49.935 | DEBUG    | __main__:trials:26 - Trial = 17308/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:49.937 | DEBUG    | __main__:trials:29 - Trial = 17308/30000 | Total reward = 29.72
2022-01-26 14:17:49.940 | DEBUG    | __main__:trials:26 - Trial = 17309/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:49.940 | DEBUG    | __main__:trials:29 - Trial = 17309/30000 | Total reward = 21.53
2022-01-26 14:17:49.944 | DEBUG    | __main__:trials:24 - Trial = 17310/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.945 | DEBUG    | __main__:trials:29 - Trial = 17310/30000 | Total reward = 49.42
2022-01-26 14:17:49.949 | DEBUG    | __main__:trials:24 - Trial = 17311/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.950 | DEBUG    | __main__:trials:29 - Trial = 17311/30000 | Total reward = 50.06
2022-01-26 14:17:49.953 | DEBUG    | __main__:trials:24 - Trial = 17312/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.954 | DEBUG    | __main__:trials:29 - Trial = 17312/30000 | Total reward = 42.50
2022-01-26 14:17:49.957 | DEBUG    | __main__:trials:24 - Trial = 17313/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.958 | DEBUG    | __main__:trials:29 - Trial = 17313/30000 | Total reward = 30.93
2022-01-26 14:17:49.961 | DEBUG    | __main__:trials:24 - Trial = 17314/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.964 | DEBUG    | __main__:trials:29 - Trial = 17314/30000 | Total reward = 61.62
2022-01-26 14:17:49.967 | DEBUG    | __main__:trials:24 - Trial = 17315/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.968 | DEBUG    | __main__:trials:29 - Trial = 17315/30000 | Total reward = 50.84
2022-01-26 14:17:49.971 | DEBUG    | __main__:trials:24 - Trial = 17316/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.973 | DEBUG    | __main__:trials:29 - Trial = 17316/30000 | Total reward = 46.70
2022-01-26 14:17:49.976 | DEBUG    | __main__:trials:24 - Trial = 17317/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.978 | DEBUG    | __main__:trials:29 - Trial = 17317/30000 | Total reward = 38.99
2022-01-26 14:17:49.982 | DEBUG    | __main__:trials:24 - Trial = 17318/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.983 | DEBUG    | __main__:trials:29 - Trial = 17318/30000 | Total reward = 49.43
2022-01-26 14:17:49.987 | DEBUG    | __main__:trials:24 - Trial = 17319/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.988 | DEBUG    | __main__:trials:29 - Trial = 17319/30000 | Total reward = 49.50
2022-01-26 14:17:49.992 | DEBUG    | __main__:trials:24 - Trial = 17320/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.993 | DEBUG    | __main__:trials:29 - Trial = 17320/30000 | Total reward = 48.62
2022-01-26 14:17:49.997 | DEBUG    | __main__:trials:24 - Trial = 17321/30000 | Max number of steps (20) reached
2022-01-26 14:17:49.998 | DEBUG    | __main__:trials:29 - Trial = 17321/30000 | Total reward = 47.32
2022-01-26 14:17:50.002 | DEBUG    | __main__:trials:24 - Trial = 17322/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.002 | DEBUG    | __main__:trials:29 - Trial = 17322/30000 | Total reward = 44.02
2022-01-26 14:17:50.007 | DEBUG    | __main__:trials:24 - Trial = 17323/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.008 | DEBUG    | __main__:trials:29 - Trial = 17323/30000 | Total reward = 43.93
2022-01-26 14:17:50.012 | DEBUG    | __main__:trials:24 - Trial = 17324/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.013 | DEBUG    | __main__:trials:29 - Trial = 17324/30000 | Total reward = 45.70
2022-01-26 14:17:50.017 | DEBUG    | __main__:trials:24 - Trial = 17325/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.018 | DEBUG    | __main__:trials:29 - Trial = 17325/30000 | Total reward = 49.13
2022-01-26 14:17:50.021 | DEBUG    | __main__:trials:24 - Trial = 17326/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.022 | DEBUG    | __main__:trials:29 - Trial = 17326/30000 | Total reward = 46.08
2022-01-26 14:17:50.025 | DEBUG    | __main__:trials:24 - Trial = 17327/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.026 | DEBUG    | __main__:trials:29 - Trial = 17327/30000 | Total reward = 34.08
2022-01-26 14:17:50.029 | DEBUG    | __main__:trials:24 - Trial = 17328/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.030 | DEBUG    | __main__:trials:29 - Trial = 17328/30000 | Total reward = 46.41
2022-01-26 14:17:50.033 | DEBUG    | __main__:trials:24 - Trial = 17329/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.035 | DEBUG    | __main__:trials:29 - Trial = 17329/30000 | Total reward = 41.35
2022-01-26 14:17:50.038 | DEBUG    | __main__:trials:24 - Trial = 17330/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.039 | DEBUG    | __main__:trials:29 - Trial = 17330/30000 | Total reward = 46.57
2022-01-26 14:17:50.043 | DEBUG    | __main__:trials:24 - Trial = 17331/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.043 | DEBUG    | __main__:trials:29 - Trial = 17331/30000 | Total reward = 45.96
2022-01-26 14:17:50.047 | DEBUG    | __main__:trials:24 - Trial = 17332/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.048 | DEBUG    | __main__:trials:29 - Trial = 17332/30000 | Total reward = 54.67
2022-01-26 14:17:50.052 | DEBUG    | __main__:trials:24 - Trial = 17333/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.054 | DEBUG    | __main__:trials:29 - Trial = 17333/30000 | Total reward = 44.02
2022-01-26 14:17:50.057 | DEBUG    | __main__:trials:24 - Trial = 17334/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.058 | DEBUG    | __main__:trials:29 - Trial = 17334/30000 | Total reward = 42.93
2022-01-26 14:17:50.062 | DEBUG    | __main__:trials:24 - Trial = 17335/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.063 | DEBUG    | __main__:trials:29 - Trial = 17335/30000 | Total reward = 49.56
2022-01-26 14:17:50.067 | DEBUG    | __main__:trials:24 - Trial = 17336/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.067 | DEBUG    | __main__:trials:29 - Trial = 17336/30000 | Total reward = 59.24
2022-01-26 14:17:50.072 | DEBUG    | __main__:trials:24 - Trial = 17337/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.074 | DEBUG    | __main__:trials:29 - Trial = 17337/30000 | Total reward = 53.35
2022-01-26 14:17:50.077 | DEBUG    | __main__:trials:24 - Trial = 17338/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.079 | DEBUG    | __main__:trials:29 - Trial = 17338/30000 | Total reward = 49.50
2022-01-26 14:17:50.082 | DEBUG    | __main__:trials:24 - Trial = 17339/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.084 | DEBUG    | __main__:trials:29 - Trial = 17339/30000 | Total reward = 50.77
2022-01-26 14:17:50.087 | DEBUG    | __main__:trials:24 - Trial = 17340/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.088 | DEBUG    | __main__:trials:29 - Trial = 17340/30000 | Total reward = 49.14
2022-01-26 14:17:50.092 | DEBUG    | __main__:trials:24 - Trial = 17341/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.093 | DEBUG    | __main__:trials:29 - Trial = 17341/30000 | Total reward = 57.28
2022-01-26 14:17:50.097 | DEBUG    | __main__:trials:24 - Trial = 17342/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.098 | DEBUG    | __main__:trials:29 - Trial = 17342/30000 | Total reward = 47.66
2022-01-26 14:17:50.102 | DEBUG    | __main__:trials:24 - Trial = 17343/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.104 | DEBUG    | __main__:trials:29 - Trial = 17343/30000 | Total reward = 59.15
2022-01-26 14:17:50.108 | DEBUG    | __main__:trials:24 - Trial = 17344/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.109 | DEBUG    | __main__:trials:29 - Trial = 17344/30000 | Total reward = 49.99
2022-01-26 14:17:50.112 | DEBUG    | __main__:trials:24 - Trial = 17345/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.114 | DEBUG    | __main__:trials:29 - Trial = 17345/30000 | Total reward = 42.54
2022-01-26 14:17:50.117 | DEBUG    | __main__:trials:24 - Trial = 17346/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.118 | DEBUG    | __main__:trials:29 - Trial = 17346/30000 | Total reward = 50.73
2022-01-26 14:17:50.121 | DEBUG    | __main__:trials:24 - Trial = 17347/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.122 | DEBUG    | __main__:trials:29 - Trial = 17347/30000 | Total reward = 50.06
2022-01-26 14:17:50.126 | DEBUG    | __main__:trials:24 - Trial = 17348/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.127 | DEBUG    | __main__:trials:29 - Trial = 17348/30000 | Total reward = 52.58
2022-01-26 14:17:50.131 | DEBUG    | __main__:trials:24 - Trial = 17349/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.131 | DEBUG    | __main__:trials:29 - Trial = 17349/30000 | Total reward = 40.58
2022-01-26 14:17:50.135 | DEBUG    | __main__:trials:26 - Trial = 17350/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:50.136 | DEBUG    | __main__:trials:29 - Trial = 17350/30000 | Total reward = 27.16
2022-01-26 14:17:50.139 | DEBUG    | __main__:trials:24 - Trial = 17351/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.141 | DEBUG    | __main__:trials:29 - Trial = 17351/30000 | Total reward = 51.83
2022-01-26 14:17:50.144 | DEBUG    | __main__:trials:24 - Trial = 17352/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.146 | DEBUG    | __main__:trials:29 - Trial = 17352/30000 | Total reward = 51.72
2022-01-26 14:17:50.149 | DEBUG    | __main__:trials:24 - Trial = 17353/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.150 | DEBUG    | __main__:trials:29 - Trial = 17353/30000 | Total reward = 50.08
2022-01-26 14:17:50.153 | DEBUG    | __main__:trials:24 - Trial = 17354/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.154 | DEBUG    | __main__:trials:29 - Trial = 17354/30000 | Total reward = 43.67
2022-01-26 14:17:50.157 | DEBUG    | __main__:trials:24 - Trial = 17355/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.158 | DEBUG    | __main__:trials:29 - Trial = 17355/30000 | Total reward = 35.26
2022-01-26 14:17:50.161 | DEBUG    | __main__:trials:24 - Trial = 17356/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.163 | DEBUG    | __main__:trials:29 - Trial = 17356/30000 | Total reward = 52.06
2022-01-26 14:17:50.167 | DEBUG    | __main__:trials:24 - Trial = 17357/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.168 | DEBUG    | __main__:trials:29 - Trial = 17357/30000 | Total reward = 51.72
2022-01-26 14:17:50.171 | DEBUG    | __main__:trials:26 - Trial = 17358/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:50.173 | DEBUG    | __main__:trials:29 - Trial = 17358/30000 | Total reward = 30.67
2022-01-26 14:17:50.176 | DEBUG    | __main__:trials:24 - Trial = 17359/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.178 | DEBUG    | __main__:trials:29 - Trial = 17359/30000 | Total reward = 51.41
2022-01-26 14:17:50.181 | DEBUG    | __main__:trials:24 - Trial = 17360/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.182 | DEBUG    | __main__:trials:29 - Trial = 17360/30000 | Total reward = 56.81
2022-01-26 14:17:50.186 | DEBUG    | __main__:trials:24 - Trial = 17361/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.187 | DEBUG    | __main__:trials:29 - Trial = 17361/30000 | Total reward = 50.24
2022-01-26 14:17:50.190 | DEBUG    | __main__:trials:24 - Trial = 17362/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.191 | DEBUG    | __main__:trials:29 - Trial = 17362/30000 | Total reward = 52.84
2022-01-26 14:17:50.195 | DEBUG    | __main__:trials:24 - Trial = 17363/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.197 | DEBUG    | __main__:trials:29 - Trial = 17363/30000 | Total reward = 51.85
2022-01-26 14:17:50.199 | DEBUG    | __main__:trials:24 - Trial = 17364/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.201 | DEBUG    | __main__:trials:29 - Trial = 17364/30000 | Total reward = 51.72
2022-01-26 14:17:50.204 | DEBUG    | __main__:trials:24 - Trial = 17365/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.206 | DEBUG    | __main__:trials:29 - Trial = 17365/30000 | Total reward = 49.31
2022-01-26 14:17:50.209 | DEBUG    | __main__:trials:24 - Trial = 17366/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.209 | DEBUG    | __main__:trials:29 - Trial = 17366/30000 | Total reward = 52.62
2022-01-26 14:17:50.213 | DEBUG    | __main__:trials:24 - Trial = 17367/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.214 | DEBUG    | __main__:trials:29 - Trial = 17367/30000 | Total reward = 49.68
2022-01-26 14:17:50.217 | DEBUG    | __main__:trials:26 - Trial = 17368/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:50.217 | DEBUG    | __main__:trials:29 - Trial = 17368/30000 | Total reward = 26.82
2022-01-26 14:17:50.221 | DEBUG    | __main__:trials:24 - Trial = 17369/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.221 | DEBUG    | __main__:trials:29 - Trial = 17369/30000 | Total reward = 50.67
2022-01-26 14:17:50.225 | DEBUG    | __main__:trials:24 - Trial = 17370/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.226 | DEBUG    | __main__:trials:29 - Trial = 17370/30000 | Total reward = 49.26
2022-01-26 14:17:50.229 | DEBUG    | __main__:trials:24 - Trial = 17371/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.230 | DEBUG    | __main__:trials:29 - Trial = 17371/30000 | Total reward = 54.08
2022-01-26 14:17:50.234 | DEBUG    | __main__:trials:24 - Trial = 17372/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.236 | DEBUG    | __main__:trials:29 - Trial = 17372/30000 | Total reward = 50.29
2022-01-26 14:17:50.238 | DEBUG    | __main__:trials:24 - Trial = 17373/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.240 | DEBUG    | __main__:trials:29 - Trial = 17373/30000 | Total reward = 48.17
2022-01-26 14:17:50.243 | DEBUG    | __main__:trials:24 - Trial = 17374/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.244 | DEBUG    | __main__:trials:29 - Trial = 17374/30000 | Total reward = 61.91
2022-01-26 14:17:50.248 | DEBUG    | __main__:trials:24 - Trial = 17375/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.249 | DEBUG    | __main__:trials:29 - Trial = 17375/30000 | Total reward = 47.11
2022-01-26 14:17:50.252 | DEBUG    | __main__:trials:24 - Trial = 17376/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.254 | DEBUG    | __main__:trials:29 - Trial = 17376/30000 | Total reward = 53.70
2022-01-26 14:17:50.257 | DEBUG    | __main__:trials:24 - Trial = 17377/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.257 | DEBUG    | __main__:trials:29 - Trial = 17377/30000 | Total reward = 38.16
2022-01-26 14:17:50.261 | DEBUG    | __main__:trials:24 - Trial = 17378/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.262 | DEBUG    | __main__:trials:29 - Trial = 17378/30000 | Total reward = 60.15
2022-01-26 14:17:50.265 | DEBUG    | __main__:trials:24 - Trial = 17379/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.266 | DEBUG    | __main__:trials:29 - Trial = 17379/30000 | Total reward = 48.20
2022-01-26 14:17:50.269 | DEBUG    | __main__:trials:24 - Trial = 17380/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.270 | DEBUG    | __main__:trials:29 - Trial = 17380/30000 | Total reward = 50.38
2022-01-26 14:17:50.273 | DEBUG    | __main__:trials:24 - Trial = 17381/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.274 | DEBUG    | __main__:trials:29 - Trial = 17381/30000 | Total reward = 50.52
2022-01-26 14:17:50.277 | DEBUG    | __main__:trials:24 - Trial = 17382/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.278 | DEBUG    | __main__:trials:29 - Trial = 17382/30000 | Total reward = 43.59
2022-01-26 14:17:50.281 | DEBUG    | __main__:trials:24 - Trial = 17383/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.282 | DEBUG    | __main__:trials:29 - Trial = 17383/30000 | Total reward = 47.85
2022-01-26 14:17:50.286 | DEBUG    | __main__:trials:24 - Trial = 17384/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.288 | DEBUG    | __main__:trials:29 - Trial = 17384/30000 | Total reward = 43.31
2022-01-26 14:17:50.291 | DEBUG    | __main__:trials:24 - Trial = 17385/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.292 | DEBUG    | __main__:trials:29 - Trial = 17385/30000 | Total reward = 47.11
2022-01-26 14:17:50.295 | DEBUG    | __main__:trials:24 - Trial = 17386/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.297 | DEBUG    | __main__:trials:29 - Trial = 17386/30000 | Total reward = 41.12
2022-01-26 14:17:50.300 | DEBUG    | __main__:trials:24 - Trial = 17387/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.301 | DEBUG    | __main__:trials:29 - Trial = 17387/30000 | Total reward = 43.28
2022-01-26 14:17:50.304 | DEBUG    | __main__:trials:24 - Trial = 17388/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.305 | DEBUG    | __main__:trials:29 - Trial = 17388/30000 | Total reward = 47.68
2022-01-26 14:17:50.308 | DEBUG    | __main__:trials:24 - Trial = 17389/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.309 | DEBUG    | __main__:trials:29 - Trial = 17389/30000 | Total reward = 44.32
2022-01-26 14:17:50.313 | DEBUG    | __main__:trials:24 - Trial = 17390/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.313 | DEBUG    | __main__:trials:29 - Trial = 17390/30000 | Total reward = 46.10
2022-01-26 14:17:50.317 | DEBUG    | __main__:trials:24 - Trial = 17391/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.319 | DEBUG    | __main__:trials:29 - Trial = 17391/30000 | Total reward = 42.27
2022-01-26 14:17:50.322 | DEBUG    | __main__:trials:24 - Trial = 17392/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.322 | DEBUG    | __main__:trials:29 - Trial = 17392/30000 | Total reward = 46.16
2022-01-26 14:17:50.326 | DEBUG    | __main__:trials:24 - Trial = 17393/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.326 | DEBUG    | __main__:trials:29 - Trial = 17393/30000 | Total reward = 48.94
2022-01-26 14:17:50.330 | DEBUG    | __main__:trials:24 - Trial = 17394/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.330 | DEBUG    | __main__:trials:29 - Trial = 17394/30000 | Total reward = 48.25
2022-01-26 14:17:50.334 | DEBUG    | __main__:trials:24 - Trial = 17395/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.335 | DEBUG    | __main__:trials:29 - Trial = 17395/30000 | Total reward = 52.69
2022-01-26 14:17:50.339 | DEBUG    | __main__:trials:24 - Trial = 17396/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.340 | DEBUG    | __main__:trials:29 - Trial = 17396/30000 | Total reward = 39.63
2022-01-26 14:17:50.344 | DEBUG    | __main__:trials:24 - Trial = 17397/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.345 | DEBUG    | __main__:trials:29 - Trial = 17397/30000 | Total reward = 41.11
2022-01-26 14:17:50.348 | DEBUG    | __main__:trials:24 - Trial = 17398/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.350 | DEBUG    | __main__:trials:29 - Trial = 17398/30000 | Total reward = 46.89
2022-01-26 14:17:50.353 | DEBUG    | __main__:trials:24 - Trial = 17399/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.353 | DEBUG    | __main__:trials:29 - Trial = 17399/30000 | Total reward = 48.62
2022-01-26 14:17:50.357 | DEBUG    | __main__:trials:24 - Trial = 17400/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.358 | DEBUG    | __main__:trials:29 - Trial = 17400/30000 | Total reward = 36.00
2022-01-26 14:17:50.361 | DEBUG    | __main__:trials:24 - Trial = 17401/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.362 | DEBUG    | __main__:trials:29 - Trial = 17401/30000 | Total reward = 46.83
2022-01-26 14:17:50.365 | DEBUG    | __main__:trials:24 - Trial = 17402/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.367 | DEBUG    | __main__:trials:29 - Trial = 17402/30000 | Total reward = 42.12
2022-01-26 14:17:50.371 | DEBUG    | __main__:trials:24 - Trial = 17403/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.371 | DEBUG    | __main__:trials:29 - Trial = 17403/30000 | Total reward = 49.16
2022-01-26 14:17:50.375 | DEBUG    | __main__:trials:24 - Trial = 17404/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.377 | DEBUG    | __main__:trials:29 - Trial = 17404/30000 | Total reward = 53.32
2022-01-26 14:17:50.380 | DEBUG    | __main__:trials:24 - Trial = 17405/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.381 | DEBUG    | __main__:trials:29 - Trial = 17405/30000 | Total reward = 49.98
2022-01-26 14:17:50.384 | DEBUG    | __main__:trials:26 - Trial = 17406/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:50.385 | DEBUG    | __main__:trials:29 - Trial = 17406/30000 | Total reward = 23.65
2022-01-26 14:17:50.389 | DEBUG    | __main__:trials:24 - Trial = 17407/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.391 | DEBUG    | __main__:trials:29 - Trial = 17407/30000 | Total reward = 45.90
2022-01-26 14:17:50.394 | DEBUG    | __main__:trials:24 - Trial = 17408/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.396 | DEBUG    | __main__:trials:29 - Trial = 17408/30000 | Total reward = 53.76
2022-01-26 14:17:50.399 | DEBUG    | __main__:trials:24 - Trial = 17409/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.401 | DEBUG    | __main__:trials:29 - Trial = 17409/30000 | Total reward = 49.79
2022-01-26 14:17:50.404 | DEBUG    | __main__:trials:24 - Trial = 17410/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.406 | DEBUG    | __main__:trials:29 - Trial = 17410/30000 | Total reward = 47.95
2022-01-26 14:17:50.409 | DEBUG    | __main__:trials:24 - Trial = 17411/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.411 | DEBUG    | __main__:trials:29 - Trial = 17411/30000 | Total reward = 44.61
2022-01-26 14:17:50.415 | DEBUG    | __main__:trials:24 - Trial = 17412/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.416 | DEBUG    | __main__:trials:29 - Trial = 17412/30000 | Total reward = 47.11
2022-01-26 14:17:50.420 | DEBUG    | __main__:trials:24 - Trial = 17413/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.420 | DEBUG    | __main__:trials:29 - Trial = 17413/30000 | Total reward = 37.53
2022-01-26 14:17:50.425 | DEBUG    | __main__:trials:24 - Trial = 17414/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.426 | DEBUG    | __main__:trials:29 - Trial = 17414/30000 | Total reward = 42.03
2022-01-26 14:17:50.430 | DEBUG    | __main__:trials:24 - Trial = 17415/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.431 | DEBUG    | __main__:trials:29 - Trial = 17415/30000 | Total reward = 45.10
2022-01-26 14:17:50.435 | DEBUG    | __main__:trials:24 - Trial = 17416/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.436 | DEBUG    | __main__:trials:29 - Trial = 17416/30000 | Total reward = 47.52
2022-01-26 14:17:50.440 | DEBUG    | __main__:trials:24 - Trial = 17417/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.441 | DEBUG    | __main__:trials:29 - Trial = 17417/30000 | Total reward = 49.06
2022-01-26 14:17:50.445 | DEBUG    | __main__:trials:24 - Trial = 17418/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.446 | DEBUG    | __main__:trials:29 - Trial = 17418/30000 | Total reward = 53.45
2022-01-26 14:17:50.449 | DEBUG    | __main__:trials:24 - Trial = 17419/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.451 | DEBUG    | __main__:trials:29 - Trial = 17419/30000 | Total reward = 44.01
2022-01-26 14:17:50.454 | DEBUG    | __main__:trials:24 - Trial = 17420/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.456 | DEBUG    | __main__:trials:29 - Trial = 17420/30000 | Total reward = 42.72
2022-01-26 14:17:50.460 | DEBUG    | __main__:trials:24 - Trial = 17421/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.461 | DEBUG    | __main__:trials:29 - Trial = 17421/30000 | Total reward = 50.74
2022-01-26 14:17:50.464 | DEBUG    | __main__:trials:24 - Trial = 17422/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.466 | DEBUG    | __main__:trials:29 - Trial = 17422/30000 | Total reward = 42.12
2022-01-26 14:17:50.469 | DEBUG    | __main__:trials:24 - Trial = 17423/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.470 | DEBUG    | __main__:trials:29 - Trial = 17423/30000 | Total reward = 45.56
2022-01-26 14:17:50.474 | DEBUG    | __main__:trials:24 - Trial = 17424/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.474 | DEBUG    | __main__:trials:29 - Trial = 17424/30000 | Total reward = 52.33
2022-01-26 14:17:50.478 | DEBUG    | __main__:trials:24 - Trial = 17425/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.479 | DEBUG    | __main__:trials:29 - Trial = 17425/30000 | Total reward = 53.65
2022-01-26 14:17:50.482 | DEBUG    | __main__:trials:24 - Trial = 17426/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.484 | DEBUG    | __main__:trials:29 - Trial = 17426/30000 | Total reward = 42.59
2022-01-26 14:17:50.488 | DEBUG    | __main__:trials:24 - Trial = 17427/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.489 | DEBUG    | __main__:trials:29 - Trial = 17427/30000 | Total reward = 50.18
2022-01-26 14:17:50.493 | DEBUG    | __main__:trials:24 - Trial = 17428/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.495 | DEBUG    | __main__:trials:29 - Trial = 17428/30000 | Total reward = 44.83
2022-01-26 14:17:50.499 | DEBUG    | __main__:trials:24 - Trial = 17429/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.500 | DEBUG    | __main__:trials:29 - Trial = 17429/30000 | Total reward = 50.41
2022-01-26 14:17:50.504 | DEBUG    | __main__:trials:24 - Trial = 17430/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.505 | DEBUG    | __main__:trials:29 - Trial = 17430/30000 | Total reward = 56.18
2022-01-26 14:17:50.508 | DEBUG    | __main__:trials:24 - Trial = 17431/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.510 | DEBUG    | __main__:trials:29 - Trial = 17431/30000 | Total reward = 47.33
2022-01-26 14:17:50.514 | DEBUG    | __main__:trials:24 - Trial = 17432/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.515 | DEBUG    | __main__:trials:29 - Trial = 17432/30000 | Total reward = 45.56
2022-01-26 14:17:50.518 | DEBUG    | __main__:trials:24 - Trial = 17433/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.520 | DEBUG    | __main__:trials:29 - Trial = 17433/30000 | Total reward = 47.42
2022-01-26 14:17:50.523 | DEBUG    | __main__:trials:24 - Trial = 17434/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.524 | DEBUG    | __main__:trials:29 - Trial = 17434/30000 | Total reward = 46.67
2022-01-26 14:17:50.528 | DEBUG    | __main__:trials:24 - Trial = 17435/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.530 | DEBUG    | __main__:trials:29 - Trial = 17435/30000 | Total reward = 50.24
2022-01-26 14:17:50.534 | DEBUG    | __main__:trials:24 - Trial = 17436/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.535 | DEBUG    | __main__:trials:29 - Trial = 17436/30000 | Total reward = 47.35
2022-01-26 14:17:50.539 | DEBUG    | __main__:trials:24 - Trial = 17437/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.540 | DEBUG    | __main__:trials:29 - Trial = 17437/30000 | Total reward = 59.10
2022-01-26 14:17:50.544 | DEBUG    | __main__:trials:24 - Trial = 17438/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.544 | DEBUG    | __main__:trials:29 - Trial = 17438/30000 | Total reward = 39.67
2022-01-26 14:17:50.549 | DEBUG    | __main__:trials:24 - Trial = 17439/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.549 | DEBUG    | __main__:trials:29 - Trial = 17439/30000 | Total reward = 55.46
2022-01-26 14:17:50.552 | DEBUG    | __main__:trials:24 - Trial = 17440/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.554 | DEBUG    | __main__:trials:29 - Trial = 17440/30000 | Total reward = 40.70
2022-01-26 14:17:50.557 | DEBUG    | __main__:trials:24 - Trial = 17441/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.558 | DEBUG    | __main__:trials:29 - Trial = 17441/30000 | Total reward = 46.20
2022-01-26 14:17:50.562 | DEBUG    | __main__:trials:24 - Trial = 17442/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.562 | DEBUG    | __main__:trials:29 - Trial = 17442/30000 | Total reward = 48.54
2022-01-26 14:17:50.566 | DEBUG    | __main__:trials:24 - Trial = 17443/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.568 | DEBUG    | __main__:trials:29 - Trial = 17443/30000 | Total reward = 47.66
2022-01-26 14:17:50.571 | DEBUG    | __main__:trials:24 - Trial = 17444/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.572 | DEBUG    | __main__:trials:29 - Trial = 17444/30000 | Total reward = 32.05
2022-01-26 14:17:50.575 | DEBUG    | __main__:trials:24 - Trial = 17445/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.577 | DEBUG    | __main__:trials:29 - Trial = 17445/30000 | Total reward = 44.79
2022-01-26 14:17:50.581 | DEBUG    | __main__:trials:24 - Trial = 17446/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.582 | DEBUG    | __main__:trials:29 - Trial = 17446/30000 | Total reward = 45.72
2022-01-26 14:17:50.586 | DEBUG    | __main__:trials:24 - Trial = 17447/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.586 | DEBUG    | __main__:trials:29 - Trial = 17447/30000 | Total reward = 42.59
2022-01-26 14:17:50.591 | DEBUG    | __main__:trials:24 - Trial = 17448/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.592 | DEBUG    | __main__:trials:29 - Trial = 17448/30000 | Total reward = 50.60
2022-01-26 14:17:50.596 | DEBUG    | __main__:trials:24 - Trial = 17449/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.597 | DEBUG    | __main__:trials:29 - Trial = 17449/30000 | Total reward = 42.23
2022-01-26 14:17:50.600 | DEBUG    | __main__:trials:24 - Trial = 17450/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.602 | DEBUG    | __main__:trials:29 - Trial = 17450/30000 | Total reward = 43.23
2022-01-26 14:17:50.605 | DEBUG    | __main__:trials:24 - Trial = 17451/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.606 | DEBUG    | __main__:trials:29 - Trial = 17451/30000 | Total reward = 34.58
2022-01-26 14:17:50.610 | DEBUG    | __main__:trials:24 - Trial = 17452/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.611 | DEBUG    | __main__:trials:29 - Trial = 17452/30000 | Total reward = 36.35
2022-01-26 14:17:50.614 | DEBUG    | __main__:trials:24 - Trial = 17453/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.616 | DEBUG    | __main__:trials:29 - Trial = 17453/30000 | Total reward = 52.82
2022-01-26 14:17:50.619 | DEBUG    | __main__:trials:24 - Trial = 17454/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.621 | DEBUG    | __main__:trials:29 - Trial = 17454/30000 | Total reward = 49.84
2022-01-26 14:17:50.624 | DEBUG    | __main__:trials:24 - Trial = 17455/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.626 | DEBUG    | __main__:trials:29 - Trial = 17455/30000 | Total reward = 49.91
2022-01-26 14:17:50.629 | DEBUG    | __main__:trials:24 - Trial = 17456/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.630 | DEBUG    | __main__:trials:29 - Trial = 17456/30000 | Total reward = 47.91
2022-01-26 14:17:50.634 | DEBUG    | __main__:trials:24 - Trial = 17457/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.635 | DEBUG    | __main__:trials:29 - Trial = 17457/30000 | Total reward = 41.30
2022-01-26 14:17:50.639 | DEBUG    | __main__:trials:24 - Trial = 17458/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.640 | DEBUG    | __main__:trials:29 - Trial = 17458/30000 | Total reward = 46.67
2022-01-26 14:17:50.644 | DEBUG    | __main__:trials:24 - Trial = 17459/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.646 | DEBUG    | __main__:trials:29 - Trial = 17459/30000 | Total reward = 49.85
2022-01-26 14:17:50.650 | DEBUG    | __main__:trials:24 - Trial = 17460/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.651 | DEBUG    | __main__:trials:29 - Trial = 17460/30000 | Total reward = 38.34
2022-01-26 14:17:50.655 | DEBUG    | __main__:trials:24 - Trial = 17461/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.656 | DEBUG    | __main__:trials:29 - Trial = 17461/30000 | Total reward = 51.72
2022-01-26 14:17:50.660 | DEBUG    | __main__:trials:24 - Trial = 17462/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.662 | DEBUG    | __main__:trials:29 - Trial = 17462/30000 | Total reward = 36.40
2022-01-26 14:17:50.665 | DEBUG    | __main__:trials:24 - Trial = 17463/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.667 | DEBUG    | __main__:trials:29 - Trial = 17463/30000 | Total reward = 43.64
2022-01-26 14:17:50.671 | DEBUG    | __main__:trials:24 - Trial = 17464/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.672 | DEBUG    | __main__:trials:29 - Trial = 17464/30000 | Total reward = 49.71
2022-01-26 14:17:50.676 | DEBUG    | __main__:trials:24 - Trial = 17465/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.678 | DEBUG    | __main__:trials:29 - Trial = 17465/30000 | Total reward = 46.22
2022-01-26 14:17:50.682 | DEBUG    | __main__:trials:24 - Trial = 17466/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.683 | DEBUG    | __main__:trials:29 - Trial = 17466/30000 | Total reward = 46.13
2022-01-26 14:17:50.687 | DEBUG    | __main__:trials:24 - Trial = 17467/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.688 | DEBUG    | __main__:trials:29 - Trial = 17467/30000 | Total reward = 42.17
2022-01-26 14:17:50.692 | DEBUG    | __main__:trials:24 - Trial = 17468/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.694 | DEBUG    | __main__:trials:29 - Trial = 17468/30000 | Total reward = 33.82
2022-01-26 14:17:50.697 | DEBUG    | __main__:trials:24 - Trial = 17469/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.698 | DEBUG    | __main__:trials:29 - Trial = 17469/30000 | Total reward = 52.11
2022-01-26 14:17:50.703 | DEBUG    | __main__:trials:24 - Trial = 17470/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.704 | DEBUG    | __main__:trials:29 - Trial = 17470/30000 | Total reward = 49.02
2022-01-26 14:17:50.708 | DEBUG    | __main__:trials:24 - Trial = 17471/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.709 | DEBUG    | __main__:trials:29 - Trial = 17471/30000 | Total reward = 43.69
2022-01-26 14:17:50.713 | DEBUG    | __main__:trials:24 - Trial = 17472/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.715 | DEBUG    | __main__:trials:29 - Trial = 17472/30000 | Total reward = 36.86
2022-01-26 14:17:50.719 | DEBUG    | __main__:trials:24 - Trial = 17473/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.720 | DEBUG    | __main__:trials:29 - Trial = 17473/30000 | Total reward = 49.84
2022-01-26 14:17:50.723 | DEBUG    | __main__:trials:24 - Trial = 17474/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.725 | DEBUG    | __main__:trials:29 - Trial = 17474/30000 | Total reward = 40.35
2022-01-26 14:17:50.728 | DEBUG    | __main__:trials:24 - Trial = 17475/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.730 | DEBUG    | __main__:trials:29 - Trial = 17475/30000 | Total reward = 28.49
2022-01-26 14:17:50.733 | DEBUG    | __main__:trials:24 - Trial = 17476/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.734 | DEBUG    | __main__:trials:29 - Trial = 17476/30000 | Total reward = 63.76
2022-01-26 14:17:50.738 | DEBUG    | __main__:trials:24 - Trial = 17477/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.740 | DEBUG    | __main__:trials:29 - Trial = 17477/30000 | Total reward = 59.17
2022-01-26 14:17:50.743 | DEBUG    | __main__:trials:24 - Trial = 17478/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.745 | DEBUG    | __main__:trials:29 - Trial = 17478/30000 | Total reward = 54.00
2022-01-26 14:17:50.749 | DEBUG    | __main__:trials:24 - Trial = 17479/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.750 | DEBUG    | __main__:trials:29 - Trial = 17479/30000 | Total reward = 35.54
2022-01-26 14:17:50.754 | DEBUG    | __main__:trials:24 - Trial = 17480/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.756 | DEBUG    | __main__:trials:29 - Trial = 17480/30000 | Total reward = 46.78
2022-01-26 14:17:50.759 | DEBUG    | __main__:trials:24 - Trial = 17481/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.761 | DEBUG    | __main__:trials:29 - Trial = 17481/30000 | Total reward = 43.81
2022-01-26 14:17:50.764 | DEBUG    | __main__:trials:24 - Trial = 17482/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.766 | DEBUG    | __main__:trials:29 - Trial = 17482/30000 | Total reward = 41.88
2022-01-26 14:17:50.769 | DEBUG    | __main__:trials:24 - Trial = 17483/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.770 | DEBUG    | __main__:trials:29 - Trial = 17483/30000 | Total reward = 45.82
2022-01-26 14:17:50.773 | DEBUG    | __main__:trials:24 - Trial = 17484/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.774 | DEBUG    | __main__:trials:29 - Trial = 17484/30000 | Total reward = 50.50
2022-01-26 14:17:50.777 | DEBUG    | __main__:trials:24 - Trial = 17485/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.778 | DEBUG    | __main__:trials:29 - Trial = 17485/30000 | Total reward = 51.73
2022-01-26 14:17:50.781 | DEBUG    | __main__:trials:24 - Trial = 17486/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.782 | DEBUG    | __main__:trials:29 - Trial = 17486/30000 | Total reward = 36.14
2022-01-26 14:17:50.786 | DEBUG    | __main__:trials:24 - Trial = 17487/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.786 | DEBUG    | __main__:trials:29 - Trial = 17487/30000 | Total reward = 47.77
2022-01-26 14:17:50.791 | DEBUG    | __main__:trials:24 - Trial = 17488/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.793 | DEBUG    | __main__:trials:29 - Trial = 17488/30000 | Total reward = 38.12
2022-01-26 14:17:50.796 | DEBUG    | __main__:trials:24 - Trial = 17489/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.797 | DEBUG    | __main__:trials:29 - Trial = 17489/30000 | Total reward = 49.34
2022-01-26 14:17:50.801 | DEBUG    | __main__:trials:24 - Trial = 17490/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.803 | DEBUG    | __main__:trials:29 - Trial = 17490/30000 | Total reward = 46.16
2022-01-26 14:17:50.806 | DEBUG    | __main__:trials:24 - Trial = 17491/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.808 | DEBUG    | __main__:trials:29 - Trial = 17491/30000 | Total reward = 47.30
2022-01-26 14:17:50.811 | DEBUG    | __main__:trials:24 - Trial = 17492/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.813 | DEBUG    | __main__:trials:29 - Trial = 17492/30000 | Total reward = 45.51
2022-01-26 14:17:50.817 | DEBUG    | __main__:trials:24 - Trial = 17493/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.818 | DEBUG    | __main__:trials:29 - Trial = 17493/30000 | Total reward = 50.09
2022-01-26 14:17:50.822 | DEBUG    | __main__:trials:24 - Trial = 17494/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.823 | DEBUG    | __main__:trials:29 - Trial = 17494/30000 | Total reward = 47.18
2022-01-26 14:17:50.826 | DEBUG    | __main__:trials:24 - Trial = 17495/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.828 | DEBUG    | __main__:trials:29 - Trial = 17495/30000 | Total reward = 49.93
2022-01-26 14:17:50.831 | DEBUG    | __main__:trials:24 - Trial = 17496/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.833 | DEBUG    | __main__:trials:29 - Trial = 17496/30000 | Total reward = 38.35
2022-01-26 14:17:50.836 | DEBUG    | __main__:trials:24 - Trial = 17497/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.838 | DEBUG    | __main__:trials:29 - Trial = 17497/30000 | Total reward = 38.94
2022-01-26 14:17:50.841 | DEBUG    | __main__:trials:24 - Trial = 17498/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.843 | DEBUG    | __main__:trials:29 - Trial = 17498/30000 | Total reward = 49.89
2022-01-26 14:17:50.847 | DEBUG    | __main__:trials:24 - Trial = 17499/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.847 | DEBUG    | __main__:trials:29 - Trial = 17499/30000 | Total reward = 47.01
2022-01-26 14:17:50.851 | DEBUG    | __main__:trials:24 - Trial = 17500/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.853 | DEBUG    | __main__:trials:29 - Trial = 17500/30000 | Total reward = 46.94
2022-01-26 14:17:50.856 | DEBUG    | __main__:trials:24 - Trial = 17501/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.857 | DEBUG    | __main__:trials:29 - Trial = 17501/30000 | Total reward = 56.75
2022-01-26 14:17:50.861 | DEBUG    | __main__:trials:24 - Trial = 17502/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.862 | DEBUG    | __main__:trials:29 - Trial = 17502/30000 | Total reward = 44.51
2022-01-26 14:17:50.866 | DEBUG    | __main__:trials:24 - Trial = 17503/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.867 | DEBUG    | __main__:trials:29 - Trial = 17503/30000 | Total reward = 49.79
2022-01-26 14:17:50.870 | DEBUG    | __main__:trials:24 - Trial = 17504/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.872 | DEBUG    | __main__:trials:29 - Trial = 17504/30000 | Total reward = 45.99
2022-01-26 14:17:50.876 | DEBUG    | __main__:trials:24 - Trial = 17505/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.876 | DEBUG    | __main__:trials:29 - Trial = 17505/30000 | Total reward = 47.75
2022-01-26 14:17:50.880 | DEBUG    | __main__:trials:24 - Trial = 17506/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.882 | DEBUG    | __main__:trials:29 - Trial = 17506/30000 | Total reward = 51.88
2022-01-26 14:17:50.886 | DEBUG    | __main__:trials:24 - Trial = 17507/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.887 | DEBUG    | __main__:trials:29 - Trial = 17507/30000 | Total reward = 49.00
2022-01-26 14:17:50.891 | DEBUG    | __main__:trials:24 - Trial = 17508/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.893 | DEBUG    | __main__:trials:29 - Trial = 17508/30000 | Total reward = 50.15
2022-01-26 14:17:50.896 | DEBUG    | __main__:trials:24 - Trial = 17509/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.897 | DEBUG    | __main__:trials:29 - Trial = 17509/30000 | Total reward = 49.09
2022-01-26 14:17:50.902 | DEBUG    | __main__:trials:24 - Trial = 17510/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.903 | DEBUG    | __main__:trials:29 - Trial = 17510/30000 | Total reward = 45.52
2022-01-26 14:17:50.907 | DEBUG    | __main__:trials:24 - Trial = 17511/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.909 | DEBUG    | __main__:trials:29 - Trial = 17511/30000 | Total reward = 58.10
2022-01-26 14:17:50.913 | DEBUG    | __main__:trials:24 - Trial = 17512/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.914 | DEBUG    | __main__:trials:29 - Trial = 17512/30000 | Total reward = 47.34
2022-01-26 14:17:50.918 | DEBUG    | __main__:trials:24 - Trial = 17513/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.918 | DEBUG    | __main__:trials:29 - Trial = 17513/30000 | Total reward = 50.57
2022-01-26 14:17:50.923 | DEBUG    | __main__:trials:24 - Trial = 17514/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.924 | DEBUG    | __main__:trials:29 - Trial = 17514/30000 | Total reward = 49.74
2022-01-26 14:17:50.928 | DEBUG    | __main__:trials:24 - Trial = 17515/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.929 | DEBUG    | __main__:trials:29 - Trial = 17515/30000 | Total reward = 51.15
2022-01-26 14:17:50.933 | DEBUG    | __main__:trials:24 - Trial = 17516/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.934 | DEBUG    | __main__:trials:29 - Trial = 17516/30000 | Total reward = 34.43
2022-01-26 14:17:50.938 | DEBUG    | __main__:trials:24 - Trial = 17517/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.939 | DEBUG    | __main__:trials:29 - Trial = 17517/30000 | Total reward = 61.39
2022-01-26 14:17:50.943 | DEBUG    | __main__:trials:24 - Trial = 17518/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.944 | DEBUG    | __main__:trials:29 - Trial = 17518/30000 | Total reward = 45.52
2022-01-26 14:17:50.948 | DEBUG    | __main__:trials:24 - Trial = 17519/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.950 | DEBUG    | __main__:trials:29 - Trial = 17519/30000 | Total reward = 55.02
2022-01-26 14:17:50.954 | DEBUG    | __main__:trials:24 - Trial = 17520/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.954 | DEBUG    | __main__:trials:29 - Trial = 17520/30000 | Total reward = 43.00
2022-01-26 14:17:50.959 | DEBUG    | __main__:trials:24 - Trial = 17521/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.959 | DEBUG    | __main__:trials:29 - Trial = 17521/30000 | Total reward = 51.61
2022-01-26 14:17:50.964 | DEBUG    | __main__:trials:24 - Trial = 17522/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.965 | DEBUG    | __main__:trials:29 - Trial = 17522/30000 | Total reward = 45.52
2022-01-26 14:17:50.969 | DEBUG    | __main__:trials:24 - Trial = 17523/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.970 | DEBUG    | __main__:trials:29 - Trial = 17523/30000 | Total reward = 50.27
2022-01-26 14:17:50.973 | DEBUG    | __main__:trials:24 - Trial = 17524/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.974 | DEBUG    | __main__:trials:29 - Trial = 17524/30000 | Total reward = 54.23
2022-01-26 14:17:50.977 | DEBUG    | __main__:trials:24 - Trial = 17525/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.979 | DEBUG    | __main__:trials:29 - Trial = 17525/30000 | Total reward = 48.35
2022-01-26 14:17:50.981 | DEBUG    | __main__:trials:24 - Trial = 17526/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.983 | DEBUG    | __main__:trials:29 - Trial = 17526/30000 | Total reward = 46.34
2022-01-26 14:17:50.986 | DEBUG    | __main__:trials:24 - Trial = 17527/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.987 | DEBUG    | __main__:trials:29 - Trial = 17527/30000 | Total reward = 34.48
2022-01-26 14:17:50.990 | DEBUG    | __main__:trials:24 - Trial = 17528/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.992 | DEBUG    | __main__:trials:29 - Trial = 17528/30000 | Total reward = 61.25
2022-01-26 14:17:50.996 | DEBUG    | __main__:trials:24 - Trial = 17529/30000 | Max number of steps (20) reached
2022-01-26 14:17:50.996 | DEBUG    | __main__:trials:29 - Trial = 17529/30000 | Total reward = 48.55
2022-01-26 14:17:51.001 | DEBUG    | __main__:trials:24 - Trial = 17530/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.002 | DEBUG    | __main__:trials:29 - Trial = 17530/30000 | Total reward = 22.06
2022-01-26 14:17:51.006 | DEBUG    | __main__:trials:24 - Trial = 17531/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.007 | DEBUG    | __main__:trials:29 - Trial = 17531/30000 | Total reward = 48.02
2022-01-26 14:17:51.010 | DEBUG    | __main__:trials:24 - Trial = 17532/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.012 | DEBUG    | __main__:trials:29 - Trial = 17532/30000 | Total reward = 52.45
2022-01-26 14:17:51.016 | DEBUG    | __main__:trials:24 - Trial = 17533/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.016 | DEBUG    | __main__:trials:29 - Trial = 17533/30000 | Total reward = 45.52
2022-01-26 14:17:51.021 | DEBUG    | __main__:trials:24 - Trial = 17534/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.022 | DEBUG    | __main__:trials:29 - Trial = 17534/30000 | Total reward = 37.78
2022-01-26 14:17:51.025 | DEBUG    | __main__:trials:24 - Trial = 17535/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.026 | DEBUG    | __main__:trials:29 - Trial = 17535/30000 | Total reward = 47.17
2022-01-26 14:17:51.029 | DEBUG    | __main__:trials:24 - Trial = 17536/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.030 | DEBUG    | __main__:trials:29 - Trial = 17536/30000 | Total reward = 61.64
2022-01-26 14:17:51.033 | DEBUG    | __main__:trials:24 - Trial = 17537/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.035 | DEBUG    | __main__:trials:29 - Trial = 17537/30000 | Total reward = 46.45
2022-01-26 14:17:51.038 | DEBUG    | __main__:trials:24 - Trial = 17538/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.040 | DEBUG    | __main__:trials:29 - Trial = 17538/30000 | Total reward = 45.56
2022-01-26 14:17:51.043 | DEBUG    | __main__:trials:24 - Trial = 17539/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.045 | DEBUG    | __main__:trials:29 - Trial = 17539/30000 | Total reward = 51.66
2022-01-26 14:17:51.048 | DEBUG    | __main__:trials:24 - Trial = 17540/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.049 | DEBUG    | __main__:trials:29 - Trial = 17540/30000 | Total reward = 51.43
2022-01-26 14:17:51.052 | DEBUG    | __main__:trials:24 - Trial = 17541/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.054 | DEBUG    | __main__:trials:29 - Trial = 17541/30000 | Total reward = 54.52
2022-01-26 14:17:51.057 | DEBUG    | __main__:trials:24 - Trial = 17542/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.058 | DEBUG    | __main__:trials:29 - Trial = 17542/30000 | Total reward = 44.16
2022-01-26 14:17:51.061 | DEBUG    | __main__:trials:24 - Trial = 17543/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.062 | DEBUG    | __main__:trials:29 - Trial = 17543/30000 | Total reward = 25.87
2022-01-26 14:17:51.066 | DEBUG    | __main__:trials:24 - Trial = 17544/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.066 | DEBUG    | __main__:trials:29 - Trial = 17544/30000 | Total reward = 47.55
2022-01-26 14:17:51.070 | DEBUG    | __main__:trials:24 - Trial = 17545/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.072 | DEBUG    | __main__:trials:29 - Trial = 17545/30000 | Total reward = 47.62
2022-01-26 14:17:51.075 | DEBUG    | __main__:trials:24 - Trial = 17546/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.075 | DEBUG    | __main__:trials:29 - Trial = 17546/30000 | Total reward = 53.65
2022-01-26 14:17:51.079 | DEBUG    | __main__:trials:24 - Trial = 17547/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.080 | DEBUG    | __main__:trials:29 - Trial = 17547/30000 | Total reward = 34.91
2022-01-26 14:17:51.084 | DEBUG    | __main__:trials:24 - Trial = 17548/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.086 | DEBUG    | __main__:trials:29 - Trial = 17548/30000 | Total reward = 45.56
2022-01-26 14:17:51.089 | DEBUG    | __main__:trials:24 - Trial = 17549/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.090 | DEBUG    | __main__:trials:29 - Trial = 17549/30000 | Total reward = 47.01
2022-01-26 14:17:51.094 | DEBUG    | __main__:trials:24 - Trial = 17550/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.096 | DEBUG    | __main__:trials:29 - Trial = 17550/30000 | Total reward = 47.01
2022-01-26 14:17:51.099 | DEBUG    | __main__:trials:24 - Trial = 17551/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.101 | DEBUG    | __main__:trials:29 - Trial = 17551/30000 | Total reward = 45.25
2022-01-26 14:17:51.104 | DEBUG    | __main__:trials:24 - Trial = 17552/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.106 | DEBUG    | __main__:trials:29 - Trial = 17552/30000 | Total reward = 53.00
2022-01-26 14:17:51.109 | DEBUG    | __main__:trials:24 - Trial = 17553/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.111 | DEBUG    | __main__:trials:29 - Trial = 17553/30000 | Total reward = 51.47
2022-01-26 14:17:51.115 | DEBUG    | __main__:trials:24 - Trial = 17554/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.115 | DEBUG    | __main__:trials:29 - Trial = 17554/30000 | Total reward = 47.81
2022-01-26 14:17:51.120 | DEBUG    | __main__:trials:24 - Trial = 17555/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.121 | DEBUG    | __main__:trials:29 - Trial = 17555/30000 | Total reward = 58.42
2022-01-26 14:17:51.125 | DEBUG    | __main__:trials:24 - Trial = 17556/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.126 | DEBUG    | __main__:trials:29 - Trial = 17556/30000 | Total reward = 59.14
2022-01-26 14:17:51.130 | DEBUG    | __main__:trials:24 - Trial = 17557/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.132 | DEBUG    | __main__:trials:29 - Trial = 17557/30000 | Total reward = 48.03
2022-01-26 14:17:51.135 | DEBUG    | __main__:trials:24 - Trial = 17558/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.136 | DEBUG    | __main__:trials:29 - Trial = 17558/30000 | Total reward = 37.78
2022-01-26 14:17:51.139 | DEBUG    | __main__:trials:24 - Trial = 17559/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.140 | DEBUG    | __main__:trials:29 - Trial = 17559/30000 | Total reward = 50.79
2022-01-26 14:17:51.144 | DEBUG    | __main__:trials:24 - Trial = 17560/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.145 | DEBUG    | __main__:trials:29 - Trial = 17560/30000 | Total reward = 48.35
2022-01-26 14:17:51.148 | DEBUG    | __main__:trials:24 - Trial = 17561/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.149 | DEBUG    | __main__:trials:29 - Trial = 17561/30000 | Total reward = 47.01
2022-01-26 14:17:51.153 | DEBUG    | __main__:trials:24 - Trial = 17562/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.155 | DEBUG    | __main__:trials:29 - Trial = 17562/30000 | Total reward = 45.56
2022-01-26 14:17:51.158 | DEBUG    | __main__:trials:24 - Trial = 17563/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.160 | DEBUG    | __main__:trials:29 - Trial = 17563/30000 | Total reward = 47.43
2022-01-26 14:17:51.163 | DEBUG    | __main__:trials:24 - Trial = 17564/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.165 | DEBUG    | __main__:trials:29 - Trial = 17564/30000 | Total reward = 59.72
2022-01-26 14:17:51.168 | DEBUG    | __main__:trials:24 - Trial = 17565/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.169 | DEBUG    | __main__:trials:29 - Trial = 17565/30000 | Total reward = 45.81
2022-01-26 14:17:51.174 | DEBUG    | __main__:trials:24 - Trial = 17566/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.175 | DEBUG    | __main__:trials:29 - Trial = 17566/30000 | Total reward = 34.56
2022-01-26 14:17:51.179 | DEBUG    | __main__:trials:24 - Trial = 17567/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.181 | DEBUG    | __main__:trials:29 - Trial = 17567/30000 | Total reward = 29.80
2022-01-26 14:17:51.184 | DEBUG    | __main__:trials:24 - Trial = 17568/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.185 | DEBUG    | __main__:trials:29 - Trial = 17568/30000 | Total reward = 65.17
2022-01-26 14:17:51.189 | DEBUG    | __main__:trials:24 - Trial = 17569/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.191 | DEBUG    | __main__:trials:29 - Trial = 17569/30000 | Total reward = 34.34
2022-01-26 14:17:51.194 | DEBUG    | __main__:trials:24 - Trial = 17570/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.196 | DEBUG    | __main__:trials:29 - Trial = 17570/30000 | Total reward = 56.99
2022-01-26 14:17:51.200 | DEBUG    | __main__:trials:24 - Trial = 17571/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.201 | DEBUG    | __main__:trials:29 - Trial = 17571/30000 | Total reward = 39.99
2022-01-26 14:17:51.205 | DEBUG    | __main__:trials:24 - Trial = 17572/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.205 | DEBUG    | __main__:trials:29 - Trial = 17572/30000 | Total reward = 49.38
2022-01-26 14:17:51.210 | DEBUG    | __main__:trials:24 - Trial = 17573/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.211 | DEBUG    | __main__:trials:29 - Trial = 17573/30000 | Total reward = 45.78
2022-01-26 14:17:51.215 | DEBUG    | __main__:trials:24 - Trial = 17574/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.216 | DEBUG    | __main__:trials:29 - Trial = 17574/30000 | Total reward = 43.34
2022-01-26 14:17:51.220 | DEBUG    | __main__:trials:24 - Trial = 17575/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.221 | DEBUG    | __main__:trials:29 - Trial = 17575/30000 | Total reward = 57.08
2022-01-26 14:17:51.225 | DEBUG    | __main__:trials:24 - Trial = 17576/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.226 | DEBUG    | __main__:trials:29 - Trial = 17576/30000 | Total reward = 51.72
2022-01-26 14:17:51.230 | DEBUG    | __main__:trials:24 - Trial = 17577/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.231 | DEBUG    | __main__:trials:29 - Trial = 17577/30000 | Total reward = 56.00
2022-01-26 14:17:51.235 | DEBUG    | __main__:trials:24 - Trial = 17578/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.236 | DEBUG    | __main__:trials:29 - Trial = 17578/30000 | Total reward = 41.20
2022-01-26 14:17:51.240 | DEBUG    | __main__:trials:24 - Trial = 17579/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.242 | DEBUG    | __main__:trials:29 - Trial = 17579/30000 | Total reward = 40.26
2022-01-26 14:17:51.245 | DEBUG    | __main__:trials:24 - Trial = 17580/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.246 | DEBUG    | __main__:trials:29 - Trial = 17580/30000 | Total reward = 55.71
2022-01-26 14:17:51.250 | DEBUG    | __main__:trials:24 - Trial = 17581/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.251 | DEBUG    | __main__:trials:29 - Trial = 17581/30000 | Total reward = 43.87
2022-01-26 14:17:51.255 | DEBUG    | __main__:trials:24 - Trial = 17582/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.257 | DEBUG    | __main__:trials:29 - Trial = 17582/30000 | Total reward = 42.29
2022-01-26 14:17:51.260 | DEBUG    | __main__:trials:24 - Trial = 17583/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.262 | DEBUG    | __main__:trials:29 - Trial = 17583/30000 | Total reward = 49.78
2022-01-26 14:17:51.266 | DEBUG    | __main__:trials:24 - Trial = 17584/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.267 | DEBUG    | __main__:trials:29 - Trial = 17584/30000 | Total reward = 61.50
2022-01-26 14:17:51.271 | DEBUG    | __main__:trials:24 - Trial = 17585/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.271 | DEBUG    | __main__:trials:29 - Trial = 17585/30000 | Total reward = 48.80
2022-01-26 14:17:51.275 | DEBUG    | __main__:trials:24 - Trial = 17586/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.276 | DEBUG    | __main__:trials:29 - Trial = 17586/30000 | Total reward = 54.11
2022-01-26 14:17:51.280 | DEBUG    | __main__:trials:24 - Trial = 17587/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.282 | DEBUG    | __main__:trials:29 - Trial = 17587/30000 | Total reward = 45.52
2022-01-26 14:17:51.285 | DEBUG    | __main__:trials:26 - Trial = 17588/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:51.287 | DEBUG    | __main__:trials:29 - Trial = 17588/30000 | Total reward = 28.86
2022-01-26 14:17:51.290 | DEBUG    | __main__:trials:24 - Trial = 17589/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.292 | DEBUG    | __main__:trials:29 - Trial = 17589/30000 | Total reward = 52.60
2022-01-26 14:17:51.295 | DEBUG    | __main__:trials:24 - Trial = 17590/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.297 | DEBUG    | __main__:trials:29 - Trial = 17590/30000 | Total reward = 55.46
2022-01-26 14:17:51.300 | DEBUG    | __main__:trials:24 - Trial = 17591/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.301 | DEBUG    | __main__:trials:29 - Trial = 17591/30000 | Total reward = 46.03
2022-01-26 14:17:51.305 | DEBUG    | __main__:trials:24 - Trial = 17592/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.307 | DEBUG    | __main__:trials:29 - Trial = 17592/30000 | Total reward = 37.84
2022-01-26 14:17:51.309 | DEBUG    | __main__:trials:24 - Trial = 17593/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.311 | DEBUG    | __main__:trials:29 - Trial = 17593/30000 | Total reward = 44.34
2022-01-26 14:17:51.315 | DEBUG    | __main__:trials:24 - Trial = 17594/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.316 | DEBUG    | __main__:trials:29 - Trial = 17594/30000 | Total reward = 37.17
2022-01-26 14:17:51.320 | DEBUG    | __main__:trials:24 - Trial = 17595/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.320 | DEBUG    | __main__:trials:29 - Trial = 17595/30000 | Total reward = 35.35
2022-01-26 14:17:51.325 | DEBUG    | __main__:trials:24 - Trial = 17596/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.326 | DEBUG    | __main__:trials:29 - Trial = 17596/30000 | Total reward = 47.11
2022-01-26 14:17:51.330 | DEBUG    | __main__:trials:24 - Trial = 17597/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.330 | DEBUG    | __main__:trials:29 - Trial = 17597/30000 | Total reward = 60.57
2022-01-26 14:17:51.335 | DEBUG    | __main__:trials:24 - Trial = 17598/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.336 | DEBUG    | __main__:trials:29 - Trial = 17598/30000 | Total reward = 59.24
2022-01-26 14:17:51.339 | DEBUG    | __main__:trials:24 - Trial = 17599/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.339 | DEBUG    | __main__:trials:29 - Trial = 17599/30000 | Total reward = 47.07
2022-01-26 14:17:51.343 | DEBUG    | __main__:trials:24 - Trial = 17600/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.345 | DEBUG    | __main__:trials:29 - Trial = 17600/30000 | Total reward = 52.84
2022-01-26 14:17:51.348 | DEBUG    | __main__:trials:24 - Trial = 17601/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.349 | DEBUG    | __main__:trials:29 - Trial = 17601/30000 | Total reward = 52.47
2022-01-26 14:17:51.353 | DEBUG    | __main__:trials:24 - Trial = 17602/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.355 | DEBUG    | __main__:trials:29 - Trial = 17602/30000 | Total reward = 51.09
2022-01-26 14:17:51.358 | DEBUG    | __main__:trials:24 - Trial = 17603/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.359 | DEBUG    | __main__:trials:29 - Trial = 17603/30000 | Total reward = 57.39
2022-01-26 14:17:51.363 | DEBUG    | __main__:trials:24 - Trial = 17604/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.364 | DEBUG    | __main__:trials:29 - Trial = 17604/30000 | Total reward = 48.23
2022-01-26 14:17:51.368 | DEBUG    | __main__:trials:24 - Trial = 17605/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.370 | DEBUG    | __main__:trials:29 - Trial = 17605/30000 | Total reward = 51.97
2022-01-26 14:17:51.374 | DEBUG    | __main__:trials:24 - Trial = 17606/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.375 | DEBUG    | __main__:trials:29 - Trial = 17606/30000 | Total reward = 58.24
2022-01-26 14:17:51.379 | DEBUG    | __main__:trials:24 - Trial = 17607/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.379 | DEBUG    | __main__:trials:29 - Trial = 17607/30000 | Total reward = 55.71
2022-01-26 14:17:51.383 | DEBUG    | __main__:trials:24 - Trial = 17608/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.384 | DEBUG    | __main__:trials:29 - Trial = 17608/30000 | Total reward = 40.94
2022-01-26 14:17:51.389 | DEBUG    | __main__:trials:24 - Trial = 17609/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.390 | DEBUG    | __main__:trials:29 - Trial = 17609/30000 | Total reward = 38.53
2022-01-26 14:17:51.394 | DEBUG    | __main__:trials:24 - Trial = 17610/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.395 | DEBUG    | __main__:trials:29 - Trial = 17610/30000 | Total reward = 44.77
2022-01-26 14:17:51.399 | DEBUG    | __main__:trials:24 - Trial = 17611/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.400 | DEBUG    | __main__:trials:29 - Trial = 17611/30000 | Total reward = 52.76
2022-01-26 14:17:51.404 | DEBUG    | __main__:trials:24 - Trial = 17612/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.404 | DEBUG    | __main__:trials:29 - Trial = 17612/30000 | Total reward = 47.25
2022-01-26 14:17:51.409 | DEBUG    | __main__:trials:24 - Trial = 17613/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.410 | DEBUG    | __main__:trials:29 - Trial = 17613/30000 | Total reward = 53.50
2022-01-26 14:17:51.414 | DEBUG    | __main__:trials:24 - Trial = 17614/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.415 | DEBUG    | __main__:trials:29 - Trial = 17614/30000 | Total reward = 37.38
2022-01-26 14:17:51.419 | DEBUG    | __main__:trials:24 - Trial = 17615/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.421 | DEBUG    | __main__:trials:29 - Trial = 17615/30000 | Total reward = 38.01
2022-01-26 14:17:51.424 | DEBUG    | __main__:trials:24 - Trial = 17616/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.426 | DEBUG    | __main__:trials:29 - Trial = 17616/30000 | Total reward = 57.49
2022-01-26 14:17:51.429 | DEBUG    | __main__:trials:24 - Trial = 17617/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.431 | DEBUG    | __main__:trials:29 - Trial = 17617/30000 | Total reward = 41.40
2022-01-26 14:17:51.435 | DEBUG    | __main__:trials:24 - Trial = 17618/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.435 | DEBUG    | __main__:trials:29 - Trial = 17618/30000 | Total reward = 55.75
2022-01-26 14:17:51.440 | DEBUG    | __main__:trials:24 - Trial = 17619/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.441 | DEBUG    | __main__:trials:29 - Trial = 17619/30000 | Total reward = 38.14
2022-01-26 14:17:51.444 | DEBUG    | __main__:trials:24 - Trial = 17620/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.446 | DEBUG    | __main__:trials:29 - Trial = 17620/30000 | Total reward = 48.39
2022-01-26 14:17:51.449 | DEBUG    | __main__:trials:24 - Trial = 17621/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.450 | DEBUG    | __main__:trials:29 - Trial = 17621/30000 | Total reward = 37.25
2022-01-26 14:17:51.454 | DEBUG    | __main__:trials:24 - Trial = 17622/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.456 | DEBUG    | __main__:trials:29 - Trial = 17622/30000 | Total reward = 40.54
2022-01-26 14:17:51.459 | DEBUG    | __main__:trials:24 - Trial = 17623/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.460 | DEBUG    | __main__:trials:29 - Trial = 17623/30000 | Total reward = 57.09
2022-01-26 14:17:51.465 | DEBUG    | __main__:trials:24 - Trial = 17624/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.465 | DEBUG    | __main__:trials:29 - Trial = 17624/30000 | Total reward = 55.29
2022-01-26 14:17:51.470 | DEBUG    | __main__:trials:24 - Trial = 17625/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.471 | DEBUG    | __main__:trials:29 - Trial = 17625/30000 | Total reward = 44.19
2022-01-26 14:17:51.475 | DEBUG    | __main__:trials:24 - Trial = 17626/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.475 | DEBUG    | __main__:trials:29 - Trial = 17626/30000 | Total reward = 40.55
2022-01-26 14:17:51.478 | DEBUG    | __main__:trials:26 - Trial = 17627/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:51.480 | DEBUG    | __main__:trials:29 - Trial = 17627/30000 | Total reward = 22.84
2022-01-26 14:17:51.483 | DEBUG    | __main__:trials:24 - Trial = 17628/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.485 | DEBUG    | __main__:trials:29 - Trial = 17628/30000 | Total reward = 56.49
2022-01-26 14:17:51.488 | DEBUG    | __main__:trials:24 - Trial = 17629/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.490 | DEBUG    | __main__:trials:29 - Trial = 17629/30000 | Total reward = 42.10
2022-01-26 14:17:51.494 | DEBUG    | __main__:trials:24 - Trial = 17630/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.494 | DEBUG    | __main__:trials:29 - Trial = 17630/30000 | Total reward = 52.96
2022-01-26 14:17:51.499 | DEBUG    | __main__:trials:24 - Trial = 17631/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.499 | DEBUG    | __main__:trials:29 - Trial = 17631/30000 | Total reward = 51.21
2022-01-26 14:17:51.504 | DEBUG    | __main__:trials:24 - Trial = 17632/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.504 | DEBUG    | __main__:trials:29 - Trial = 17632/30000 | Total reward = 54.52
2022-01-26 14:17:51.509 | DEBUG    | __main__:trials:24 - Trial = 17633/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.511 | DEBUG    | __main__:trials:29 - Trial = 17633/30000 | Total reward = 50.08
2022-01-26 14:17:51.514 | DEBUG    | __main__:trials:24 - Trial = 17634/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.515 | DEBUG    | __main__:trials:29 - Trial = 17634/30000 | Total reward = 34.67
2022-01-26 14:17:51.519 | DEBUG    | __main__:trials:24 - Trial = 17635/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.520 | DEBUG    | __main__:trials:29 - Trial = 17635/30000 | Total reward = 40.82
2022-01-26 14:17:51.524 | DEBUG    | __main__:trials:24 - Trial = 17636/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.526 | DEBUG    | __main__:trials:29 - Trial = 17636/30000 | Total reward = 40.51
2022-01-26 14:17:51.530 | DEBUG    | __main__:trials:24 - Trial = 17637/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.530 | DEBUG    | __main__:trials:29 - Trial = 17637/30000 | Total reward = 43.06
2022-01-26 14:17:51.535 | DEBUG    | __main__:trials:24 - Trial = 17638/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.536 | DEBUG    | __main__:trials:29 - Trial = 17638/30000 | Total reward = 33.79
2022-01-26 14:17:51.540 | DEBUG    | __main__:trials:24 - Trial = 17639/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.542 | DEBUG    | __main__:trials:29 - Trial = 17639/30000 | Total reward = 48.35
2022-01-26 14:17:51.545 | DEBUG    | __main__:trials:24 - Trial = 17640/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.546 | DEBUG    | __main__:trials:29 - Trial = 17640/30000 | Total reward = 44.51
2022-01-26 14:17:51.551 | DEBUG    | __main__:trials:24 - Trial = 17641/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.552 | DEBUG    | __main__:trials:29 - Trial = 17641/30000 | Total reward = 47.01
2022-01-26 14:17:51.556 | DEBUG    | __main__:trials:24 - Trial = 17642/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.557 | DEBUG    | __main__:trials:29 - Trial = 17642/30000 | Total reward = 46.58
2022-01-26 14:17:51.561 | DEBUG    | __main__:trials:24 - Trial = 17643/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.563 | DEBUG    | __main__:trials:29 - Trial = 17643/30000 | Total reward = 58.54
2022-01-26 14:17:51.567 | DEBUG    | __main__:trials:24 - Trial = 17644/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.567 | DEBUG    | __main__:trials:29 - Trial = 17644/30000 | Total reward = 45.17
2022-01-26 14:17:51.571 | DEBUG    | __main__:trials:26 - Trial = 17645/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:51.573 | DEBUG    | __main__:trials:29 - Trial = 17645/30000 | Total reward = 29.56
2022-01-26 14:17:51.576 | DEBUG    | __main__:trials:24 - Trial = 17646/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.577 | DEBUG    | __main__:trials:29 - Trial = 17646/30000 | Total reward = 61.49
2022-01-26 14:17:51.581 | DEBUG    | __main__:trials:24 - Trial = 17647/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.581 | DEBUG    | __main__:trials:29 - Trial = 17647/30000 | Total reward = 40.02
2022-01-26 14:17:51.586 | DEBUG    | __main__:trials:24 - Trial = 17648/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.586 | DEBUG    | __main__:trials:29 - Trial = 17648/30000 | Total reward = 47.44
2022-01-26 14:17:51.591 | DEBUG    | __main__:trials:24 - Trial = 17649/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.592 | DEBUG    | __main__:trials:29 - Trial = 17649/30000 | Total reward = 57.95
2022-01-26 14:17:51.596 | DEBUG    | __main__:trials:24 - Trial = 17650/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.597 | DEBUG    | __main__:trials:29 - Trial = 17650/30000 | Total reward = 60.78
2022-01-26 14:17:51.601 | DEBUG    | __main__:trials:24 - Trial = 17651/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.603 | DEBUG    | __main__:trials:29 - Trial = 17651/30000 | Total reward = 45.94
2022-01-26 14:17:51.606 | DEBUG    | __main__:trials:24 - Trial = 17652/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.608 | DEBUG    | __main__:trials:29 - Trial = 17652/30000 | Total reward = 38.62
2022-01-26 14:17:51.611 | DEBUG    | __main__:trials:24 - Trial = 17653/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.613 | DEBUG    | __main__:trials:29 - Trial = 17653/30000 | Total reward = 48.22
2022-01-26 14:17:51.616 | DEBUG    | __main__:trials:24 - Trial = 17654/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.617 | DEBUG    | __main__:trials:29 - Trial = 17654/30000 | Total reward = 42.32
2022-01-26 14:17:51.620 | DEBUG    | __main__:trials:24 - Trial = 17655/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.622 | DEBUG    | __main__:trials:29 - Trial = 17655/30000 | Total reward = 51.59
2022-01-26 14:17:51.626 | DEBUG    | __main__:trials:24 - Trial = 17656/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.628 | DEBUG    | __main__:trials:29 - Trial = 17656/30000 | Total reward = 45.90
2022-01-26 14:17:51.631 | DEBUG    | __main__:trials:24 - Trial = 17657/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.632 | DEBUG    | __main__:trials:29 - Trial = 17657/30000 | Total reward = 48.45
2022-01-26 14:17:51.637 | DEBUG    | __main__:trials:24 - Trial = 17658/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.638 | DEBUG    | __main__:trials:29 - Trial = 17658/30000 | Total reward = 45.53
2022-01-26 14:17:51.642 | DEBUG    | __main__:trials:24 - Trial = 17659/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.642 | DEBUG    | __main__:trials:29 - Trial = 17659/30000 | Total reward = 37.23
2022-01-26 14:17:51.647 | DEBUG    | __main__:trials:24 - Trial = 17660/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.648 | DEBUG    | __main__:trials:29 - Trial = 17660/30000 | Total reward = 45.54
2022-01-26 14:17:51.652 | DEBUG    | __main__:trials:24 - Trial = 17661/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.654 | DEBUG    | __main__:trials:29 - Trial = 17661/30000 | Total reward = 46.54
2022-01-26 14:17:51.658 | DEBUG    | __main__:trials:24 - Trial = 17662/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.659 | DEBUG    | __main__:trials:29 - Trial = 17662/30000 | Total reward = 40.49
2022-01-26 14:17:51.663 | DEBUG    | __main__:trials:24 - Trial = 17663/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.664 | DEBUG    | __main__:trials:29 - Trial = 17663/30000 | Total reward = 37.57
2022-01-26 14:17:51.668 | DEBUG    | __main__:trials:24 - Trial = 17664/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.669 | DEBUG    | __main__:trials:29 - Trial = 17664/30000 | Total reward = 47.63
2022-01-26 14:17:51.672 | DEBUG    | __main__:trials:24 - Trial = 17665/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.674 | DEBUG    | __main__:trials:29 - Trial = 17665/30000 | Total reward = 35.04
2022-01-26 14:17:51.677 | DEBUG    | __main__:trials:24 - Trial = 17666/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.678 | DEBUG    | __main__:trials:29 - Trial = 17666/30000 | Total reward = 47.33
2022-01-26 14:17:51.681 | DEBUG    | __main__:trials:24 - Trial = 17667/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.683 | DEBUG    | __main__:trials:29 - Trial = 17667/30000 | Total reward = 43.39
2022-01-26 14:17:51.686 | DEBUG    | __main__:trials:24 - Trial = 17668/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.687 | DEBUG    | __main__:trials:29 - Trial = 17668/30000 | Total reward = 42.59
2022-01-26 14:17:51.691 | DEBUG    | __main__:trials:24 - Trial = 17669/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.693 | DEBUG    | __main__:trials:29 - Trial = 17669/30000 | Total reward = 49.15
2022-01-26 14:17:51.697 | DEBUG    | __main__:trials:24 - Trial = 17670/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.698 | DEBUG    | __main__:trials:29 - Trial = 17670/30000 | Total reward = 43.50
2022-01-26 14:17:51.702 | DEBUG    | __main__:trials:24 - Trial = 17671/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.703 | DEBUG    | __main__:trials:29 - Trial = 17671/30000 | Total reward = 44.99
2022-01-26 14:17:51.708 | DEBUG    | __main__:trials:24 - Trial = 17672/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.709 | DEBUG    | __main__:trials:29 - Trial = 17672/30000 | Total reward = 55.90
2022-01-26 14:17:51.713 | DEBUG    | __main__:trials:24 - Trial = 17673/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.714 | DEBUG    | __main__:trials:29 - Trial = 17673/30000 | Total reward = 41.42
2022-01-26 14:17:51.717 | DEBUG    | __main__:trials:24 - Trial = 17674/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.719 | DEBUG    | __main__:trials:29 - Trial = 17674/30000 | Total reward = 51.91
2022-01-26 14:17:51.722 | DEBUG    | __main__:trials:24 - Trial = 17675/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.724 | DEBUG    | __main__:trials:29 - Trial = 17675/30000 | Total reward = 42.53
2022-01-26 14:17:51.727 | DEBUG    | __main__:trials:24 - Trial = 17676/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.729 | DEBUG    | __main__:trials:29 - Trial = 17676/30000 | Total reward = 48.90
2022-01-26 14:17:51.733 | DEBUG    | __main__:trials:24 - Trial = 17677/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.734 | DEBUG    | __main__:trials:29 - Trial = 17677/30000 | Total reward = 60.46
2022-01-26 14:17:51.738 | DEBUG    | __main__:trials:24 - Trial = 17678/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.739 | DEBUG    | __main__:trials:29 - Trial = 17678/30000 | Total reward = 37.00
2022-01-26 14:17:51.743 | DEBUG    | __main__:trials:24 - Trial = 17679/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.745 | DEBUG    | __main__:trials:29 - Trial = 17679/30000 | Total reward = 47.52
2022-01-26 14:17:51.748 | DEBUG    | __main__:trials:24 - Trial = 17680/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.750 | DEBUG    | __main__:trials:29 - Trial = 17680/30000 | Total reward = 37.05
2022-01-26 14:17:51.754 | DEBUG    | __main__:trials:24 - Trial = 17681/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.755 | DEBUG    | __main__:trials:29 - Trial = 17681/30000 | Total reward = 36.85
2022-01-26 14:17:51.759 | DEBUG    | __main__:trials:24 - Trial = 17682/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.761 | DEBUG    | __main__:trials:29 - Trial = 17682/30000 | Total reward = 46.19
2022-01-26 14:17:51.764 | DEBUG    | __main__:trials:24 - Trial = 17683/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.765 | DEBUG    | __main__:trials:29 - Trial = 17683/30000 | Total reward = 47.32
2022-01-26 14:17:51.770 | DEBUG    | __main__:trials:24 - Trial = 17684/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.771 | DEBUG    | __main__:trials:29 - Trial = 17684/30000 | Total reward = 50.44
2022-01-26 14:17:51.775 | DEBUG    | __main__:trials:24 - Trial = 17685/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.776 | DEBUG    | __main__:trials:29 - Trial = 17685/30000 | Total reward = 49.89
2022-01-26 14:17:51.780 | DEBUG    | __main__:trials:24 - Trial = 17686/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.782 | DEBUG    | __main__:trials:29 - Trial = 17686/30000 | Total reward = 55.87
2022-01-26 14:17:51.785 | DEBUG    | __main__:trials:24 - Trial = 17687/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.787 | DEBUG    | __main__:trials:29 - Trial = 17687/30000 | Total reward = 41.69
2022-01-26 14:17:51.791 | DEBUG    | __main__:trials:24 - Trial = 17688/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.791 | DEBUG    | __main__:trials:29 - Trial = 17688/30000 | Total reward = 48.37
2022-01-26 14:17:51.796 | DEBUG    | __main__:trials:24 - Trial = 17689/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.797 | DEBUG    | __main__:trials:29 - Trial = 17689/30000 | Total reward = 46.68
2022-01-26 14:17:51.800 | DEBUG    | __main__:trials:24 - Trial = 17690/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.802 | DEBUG    | __main__:trials:29 - Trial = 17690/30000 | Total reward = 33.36
2022-01-26 14:17:51.805 | DEBUG    | __main__:trials:24 - Trial = 17691/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.806 | DEBUG    | __main__:trials:29 - Trial = 17691/30000 | Total reward = 39.60
2022-01-26 14:17:51.810 | DEBUG    | __main__:trials:24 - Trial = 17692/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.812 | DEBUG    | __main__:trials:29 - Trial = 17692/30000 | Total reward = 49.80
2022-01-26 14:17:51.815 | DEBUG    | __main__:trials:26 - Trial = 17693/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:51.817 | DEBUG    | __main__:trials:29 - Trial = 17693/30000 | Total reward = 24.61
2022-01-26 14:17:51.820 | DEBUG    | __main__:trials:24 - Trial = 17694/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.821 | DEBUG    | __main__:trials:29 - Trial = 17694/30000 | Total reward = 47.20
2022-01-26 14:17:51.825 | DEBUG    | __main__:trials:24 - Trial = 17695/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.827 | DEBUG    | __main__:trials:29 - Trial = 17695/30000 | Total reward = 45.55
2022-01-26 14:17:51.830 | DEBUG    | __main__:trials:24 - Trial = 17696/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.832 | DEBUG    | __main__:trials:29 - Trial = 17696/30000 | Total reward = 36.77
2022-01-26 14:17:51.835 | DEBUG    | __main__:trials:24 - Trial = 17697/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.837 | DEBUG    | __main__:trials:29 - Trial = 17697/30000 | Total reward = 47.61
2022-01-26 14:17:51.840 | DEBUG    | __main__:trials:24 - Trial = 17698/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.841 | DEBUG    | __main__:trials:29 - Trial = 17698/30000 | Total reward = 44.80
2022-01-26 14:17:51.845 | DEBUG    | __main__:trials:24 - Trial = 17699/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.847 | DEBUG    | __main__:trials:29 - Trial = 17699/30000 | Total reward = 67.89
2022-01-26 14:17:51.851 | DEBUG    | __main__:trials:24 - Trial = 17700/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.852 | DEBUG    | __main__:trials:29 - Trial = 17700/30000 | Total reward = 43.96
2022-01-26 14:17:51.856 | DEBUG    | __main__:trials:24 - Trial = 17701/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.858 | DEBUG    | __main__:trials:29 - Trial = 17701/30000 | Total reward = 48.79
2022-01-26 14:17:51.860 | DEBUG    | __main__:trials:24 - Trial = 17702/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.862 | DEBUG    | __main__:trials:29 - Trial = 17702/30000 | Total reward = 50.83
2022-01-26 14:17:51.866 | DEBUG    | __main__:trials:24 - Trial = 17703/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.867 | DEBUG    | __main__:trials:29 - Trial = 17703/30000 | Total reward = 47.30
2022-01-26 14:17:51.871 | DEBUG    | __main__:trials:24 - Trial = 17704/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.871 | DEBUG    | __main__:trials:29 - Trial = 17704/30000 | Total reward = 47.81
2022-01-26 14:17:51.875 | DEBUG    | __main__:trials:24 - Trial = 17705/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.875 | DEBUG    | __main__:trials:29 - Trial = 17705/30000 | Total reward = 44.41
2022-01-26 14:17:51.879 | DEBUG    | __main__:trials:24 - Trial = 17706/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.879 | DEBUG    | __main__:trials:29 - Trial = 17706/30000 | Total reward = 34.63
2022-01-26 14:17:51.883 | DEBUG    | __main__:trials:24 - Trial = 17707/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.884 | DEBUG    | __main__:trials:29 - Trial = 17707/30000 | Total reward = 42.05
2022-01-26 14:17:51.888 | DEBUG    | __main__:trials:24 - Trial = 17708/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.889 | DEBUG    | __main__:trials:29 - Trial = 17708/30000 | Total reward = 40.56
2022-01-26 14:17:51.892 | DEBUG    | __main__:trials:24 - Trial = 17709/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.894 | DEBUG    | __main__:trials:29 - Trial = 17709/30000 | Total reward = 51.51
2022-01-26 14:17:51.898 | DEBUG    | __main__:trials:24 - Trial = 17710/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.898 | DEBUG    | __main__:trials:29 - Trial = 17710/30000 | Total reward = 52.29
2022-01-26 14:17:51.903 | DEBUG    | __main__:trials:24 - Trial = 17711/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.904 | DEBUG    | __main__:trials:29 - Trial = 17711/30000 | Total reward = 42.24
2022-01-26 14:17:51.908 | DEBUG    | __main__:trials:24 - Trial = 17712/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.909 | DEBUG    | __main__:trials:29 - Trial = 17712/30000 | Total reward = 39.35
2022-01-26 14:17:51.912 | DEBUG    | __main__:trials:24 - Trial = 17713/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.914 | DEBUG    | __main__:trials:29 - Trial = 17713/30000 | Total reward = 51.96
2022-01-26 14:17:51.917 | DEBUG    | __main__:trials:24 - Trial = 17714/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.918 | DEBUG    | __main__:trials:29 - Trial = 17714/30000 | Total reward = 47.87
2022-01-26 14:17:51.922 | DEBUG    | __main__:trials:24 - Trial = 17715/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.924 | DEBUG    | __main__:trials:29 - Trial = 17715/30000 | Total reward = 57.37
2022-01-26 14:17:51.927 | DEBUG    | __main__:trials:24 - Trial = 17716/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.928 | DEBUG    | __main__:trials:29 - Trial = 17716/30000 | Total reward = 37.39
2022-01-26 14:17:51.932 | DEBUG    | __main__:trials:24 - Trial = 17717/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.933 | DEBUG    | __main__:trials:29 - Trial = 17717/30000 | Total reward = 55.87
2022-01-26 14:17:51.936 | DEBUG    | __main__:trials:24 - Trial = 17718/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.938 | DEBUG    | __main__:trials:29 - Trial = 17718/30000 | Total reward = 53.79
2022-01-26 14:17:51.942 | DEBUG    | __main__:trials:24 - Trial = 17719/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.942 | DEBUG    | __main__:trials:29 - Trial = 17719/30000 | Total reward = 49.84
2022-01-26 14:17:51.947 | DEBUG    | __main__:trials:24 - Trial = 17720/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.948 | DEBUG    | __main__:trials:29 - Trial = 17720/30000 | Total reward = 54.85
2022-01-26 14:17:51.952 | DEBUG    | __main__:trials:24 - Trial = 17721/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.954 | DEBUG    | __main__:trials:29 - Trial = 17721/30000 | Total reward = 58.27
2022-01-26 14:17:51.957 | DEBUG    | __main__:trials:24 - Trial = 17722/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.959 | DEBUG    | __main__:trials:29 - Trial = 17722/30000 | Total reward = 22.22
2022-01-26 14:17:51.963 | DEBUG    | __main__:trials:24 - Trial = 17723/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.963 | DEBUG    | __main__:trials:29 - Trial = 17723/30000 | Total reward = 38.01
2022-01-26 14:17:51.968 | DEBUG    | __main__:trials:24 - Trial = 17724/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.969 | DEBUG    | __main__:trials:29 - Trial = 17724/30000 | Total reward = 54.25
2022-01-26 14:17:51.973 | DEBUG    | __main__:trials:24 - Trial = 17725/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.974 | DEBUG    | __main__:trials:29 - Trial = 17725/30000 | Total reward = 54.55
2022-01-26 14:17:51.978 | DEBUG    | __main__:trials:24 - Trial = 17726/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.979 | DEBUG    | __main__:trials:29 - Trial = 17726/30000 | Total reward = 53.03
2022-01-26 14:17:51.983 | DEBUG    | __main__:trials:24 - Trial = 17727/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.984 | DEBUG    | __main__:trials:29 - Trial = 17727/30000 | Total reward = 33.34
2022-01-26 14:17:51.987 | DEBUG    | __main__:trials:24 - Trial = 17728/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.989 | DEBUG    | __main__:trials:29 - Trial = 17728/30000 | Total reward = 35.79
2022-01-26 14:17:51.992 | DEBUG    | __main__:trials:24 - Trial = 17729/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.994 | DEBUG    | __main__:trials:29 - Trial = 17729/30000 | Total reward = 52.83
2022-01-26 14:17:51.997 | DEBUG    | __main__:trials:24 - Trial = 17730/30000 | Max number of steps (20) reached
2022-01-26 14:17:51.999 | DEBUG    | __main__:trials:29 - Trial = 17730/30000 | Total reward = 41.41
2022-01-26 14:17:52.003 | DEBUG    | __main__:trials:24 - Trial = 17731/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.003 | DEBUG    | __main__:trials:29 - Trial = 17731/30000 | Total reward = 50.18
2022-01-26 14:17:52.008 | DEBUG    | __main__:trials:24 - Trial = 17732/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.009 | DEBUG    | __main__:trials:29 - Trial = 17732/30000 | Total reward = 35.51
2022-01-26 14:17:52.012 | DEBUG    | __main__:trials:24 - Trial = 17733/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.014 | DEBUG    | __main__:trials:29 - Trial = 17733/30000 | Total reward = 33.06
2022-01-26 14:17:52.018 | DEBUG    | __main__:trials:24 - Trial = 17734/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.018 | DEBUG    | __main__:trials:29 - Trial = 17734/30000 | Total reward = 47.26
2022-01-26 14:17:52.023 | DEBUG    | __main__:trials:24 - Trial = 17735/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.024 | DEBUG    | __main__:trials:29 - Trial = 17735/30000 | Total reward = 40.06
2022-01-26 14:17:52.027 | DEBUG    | __main__:trials:26 - Trial = 17736/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:52.028 | DEBUG    | __main__:trials:29 - Trial = 17736/30000 | Total reward = 26.68
2022-01-26 14:17:52.031 | DEBUG    | __main__:trials:24 - Trial = 17737/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.033 | DEBUG    | __main__:trials:29 - Trial = 17737/30000 | Total reward = 34.89
2022-01-26 14:17:52.036 | DEBUG    | __main__:trials:24 - Trial = 17738/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.037 | DEBUG    | __main__:trials:29 - Trial = 17738/30000 | Total reward = 52.64
2022-01-26 14:17:52.040 | DEBUG    | __main__:trials:24 - Trial = 17739/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.041 | DEBUG    | __main__:trials:29 - Trial = 17739/30000 | Total reward = 40.60
2022-01-26 14:17:52.044 | DEBUG    | __main__:trials:24 - Trial = 17740/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.045 | DEBUG    | __main__:trials:29 - Trial = 17740/30000 | Total reward = 28.29
2022-01-26 14:17:52.048 | DEBUG    | __main__:trials:24 - Trial = 17741/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.049 | DEBUG    | __main__:trials:29 - Trial = 17741/30000 | Total reward = 54.68
2022-01-26 14:17:52.053 | DEBUG    | __main__:trials:24 - Trial = 17742/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.053 | DEBUG    | __main__:trials:29 - Trial = 17742/30000 | Total reward = 47.01
2022-01-26 14:17:52.057 | DEBUG    | __main__:trials:24 - Trial = 17743/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.058 | DEBUG    | __main__:trials:29 - Trial = 17743/30000 | Total reward = 27.02
2022-01-26 14:17:52.061 | DEBUG    | __main__:trials:24 - Trial = 17744/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.062 | DEBUG    | __main__:trials:29 - Trial = 17744/30000 | Total reward = 62.28
2022-01-26 14:17:52.065 | DEBUG    | __main__:trials:24 - Trial = 17745/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.066 | DEBUG    | __main__:trials:29 - Trial = 17745/30000 | Total reward = 48.66
2022-01-26 14:17:52.069 | DEBUG    | __main__:trials:24 - Trial = 17746/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.071 | DEBUG    | __main__:trials:29 - Trial = 17746/30000 | Total reward = 48.61
2022-01-26 14:17:52.074 | DEBUG    | __main__:trials:24 - Trial = 17747/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.076 | DEBUG    | __main__:trials:29 - Trial = 17747/30000 | Total reward = 44.98
2022-01-26 14:17:52.079 | DEBUG    | __main__:trials:24 - Trial = 17748/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.081 | DEBUG    | __main__:trials:29 - Trial = 17748/30000 | Total reward = 50.13
2022-01-26 14:17:52.085 | DEBUG    | __main__:trials:24 - Trial = 17749/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.087 | DEBUG    | __main__:trials:29 - Trial = 17749/30000 | Total reward = 36.26
2022-01-26 14:17:52.090 | DEBUG    | __main__:trials:24 - Trial = 17750/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.092 | DEBUG    | __main__:trials:29 - Trial = 17750/30000 | Total reward = 48.78
2022-01-26 14:17:52.096 | DEBUG    | __main__:trials:24 - Trial = 17751/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.097 | DEBUG    | __main__:trials:29 - Trial = 17751/30000 | Total reward = 34.27
2022-01-26 14:17:52.100 | DEBUG    | __main__:trials:24 - Trial = 17752/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.102 | DEBUG    | __main__:trials:29 - Trial = 17752/30000 | Total reward = 63.18
2022-01-26 14:17:52.106 | DEBUG    | __main__:trials:24 - Trial = 17753/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.107 | DEBUG    | __main__:trials:29 - Trial = 17753/30000 | Total reward = 61.89
2022-01-26 14:17:52.110 | DEBUG    | __main__:trials:24 - Trial = 17754/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.112 | DEBUG    | __main__:trials:29 - Trial = 17754/30000 | Total reward = 61.44
2022-01-26 14:17:52.115 | DEBUG    | __main__:trials:24 - Trial = 17755/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.117 | DEBUG    | __main__:trials:29 - Trial = 17755/30000 | Total reward = 36.67
2022-01-26 14:17:52.120 | DEBUG    | __main__:trials:24 - Trial = 17756/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.121 | DEBUG    | __main__:trials:29 - Trial = 17756/30000 | Total reward = 60.54
2022-01-26 14:17:52.124 | DEBUG    | __main__:trials:24 - Trial = 17757/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.125 | DEBUG    | __main__:trials:29 - Trial = 17757/30000 | Total reward = 58.66
2022-01-26 14:17:52.129 | DEBUG    | __main__:trials:24 - Trial = 17758/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.130 | DEBUG    | __main__:trials:29 - Trial = 17758/30000 | Total reward = 38.02
2022-01-26 14:17:52.133 | DEBUG    | __main__:trials:24 - Trial = 17759/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.135 | DEBUG    | __main__:trials:29 - Trial = 17759/30000 | Total reward = 54.27
2022-01-26 14:17:52.139 | DEBUG    | __main__:trials:24 - Trial = 17760/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.141 | DEBUG    | __main__:trials:29 - Trial = 17760/30000 | Total reward = 59.80
2022-01-26 14:17:52.143 | DEBUG    | __main__:trials:24 - Trial = 17761/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.145 | DEBUG    | __main__:trials:29 - Trial = 17761/30000 | Total reward = 64.39
2022-01-26 14:17:52.148 | DEBUG    | __main__:trials:24 - Trial = 17762/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.149 | DEBUG    | __main__:trials:29 - Trial = 17762/30000 | Total reward = 64.33
2022-01-26 14:17:52.152 | DEBUG    | __main__:trials:24 - Trial = 17763/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.154 | DEBUG    | __main__:trials:29 - Trial = 17763/30000 | Total reward = 49.23
2022-01-26 14:17:52.157 | DEBUG    | __main__:trials:24 - Trial = 17764/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.159 | DEBUG    | __main__:trials:29 - Trial = 17764/30000 | Total reward = 61.54
2022-01-26 14:17:52.163 | DEBUG    | __main__:trials:24 - Trial = 17765/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.164 | DEBUG    | __main__:trials:29 - Trial = 17765/30000 | Total reward = 40.27
2022-01-26 14:17:52.168 | DEBUG    | __main__:trials:24 - Trial = 17766/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.169 | DEBUG    | __main__:trials:29 - Trial = 17766/30000 | Total reward = 58.32
2022-01-26 14:17:52.173 | DEBUG    | __main__:trials:24 - Trial = 17767/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.174 | DEBUG    | __main__:trials:29 - Trial = 17767/30000 | Total reward = 35.24
2022-01-26 14:17:52.178 | DEBUG    | __main__:trials:24 - Trial = 17768/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.180 | DEBUG    | __main__:trials:29 - Trial = 17768/30000 | Total reward = 66.57
2022-01-26 14:17:52.183 | DEBUG    | __main__:trials:24 - Trial = 17769/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.184 | DEBUG    | __main__:trials:29 - Trial = 17769/30000 | Total reward = 46.06
2022-01-26 14:17:52.188 | DEBUG    | __main__:trials:24 - Trial = 17770/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.189 | DEBUG    | __main__:trials:29 - Trial = 17770/30000 | Total reward = 42.48
2022-01-26 14:17:52.194 | DEBUG    | __main__:trials:24 - Trial = 17771/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.195 | DEBUG    | __main__:trials:29 - Trial = 17771/30000 | Total reward = 38.94
2022-01-26 14:17:52.198 | DEBUG    | __main__:trials:24 - Trial = 17772/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.200 | DEBUG    | __main__:trials:29 - Trial = 17772/30000 | Total reward = 46.40
2022-01-26 14:17:52.203 | DEBUG    | __main__:trials:24 - Trial = 17773/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.205 | DEBUG    | __main__:trials:29 - Trial = 17773/30000 | Total reward = 49.42
2022-01-26 14:17:52.209 | DEBUG    | __main__:trials:24 - Trial = 17774/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.209 | DEBUG    | __main__:trials:29 - Trial = 17774/30000 | Total reward = 42.67
2022-01-26 14:17:52.214 | DEBUG    | __main__:trials:24 - Trial = 17775/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.215 | DEBUG    | __main__:trials:29 - Trial = 17775/30000 | Total reward = 57.91
2022-01-26 14:17:52.218 | DEBUG    | __main__:trials:24 - Trial = 17776/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.220 | DEBUG    | __main__:trials:29 - Trial = 17776/30000 | Total reward = 53.25
2022-01-26 14:17:52.223 | DEBUG    | __main__:trials:24 - Trial = 17777/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.225 | DEBUG    | __main__:trials:29 - Trial = 17777/30000 | Total reward = 47.01
2022-01-26 14:17:52.228 | DEBUG    | __main__:trials:24 - Trial = 17778/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.230 | DEBUG    | __main__:trials:29 - Trial = 17778/30000 | Total reward = 46.53
2022-01-26 14:17:52.233 | DEBUG    | __main__:trials:24 - Trial = 17779/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.234 | DEBUG    | __main__:trials:29 - Trial = 17779/30000 | Total reward = 56.52
2022-01-26 14:17:52.238 | DEBUG    | __main__:trials:24 - Trial = 17780/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.239 | DEBUG    | __main__:trials:29 - Trial = 17780/30000 | Total reward = 40.70
2022-01-26 14:17:52.243 | DEBUG    | __main__:trials:24 - Trial = 17781/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.245 | DEBUG    | __main__:trials:29 - Trial = 17781/30000 | Total reward = 45.96
2022-01-26 14:17:52.248 | DEBUG    | __main__:trials:24 - Trial = 17782/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.250 | DEBUG    | __main__:trials:29 - Trial = 17782/30000 | Total reward = 41.34
2022-01-26 14:17:52.253 | DEBUG    | __main__:trials:24 - Trial = 17783/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.254 | DEBUG    | __main__:trials:29 - Trial = 17783/30000 | Total reward = 46.99
2022-01-26 14:17:52.259 | DEBUG    | __main__:trials:24 - Trial = 17784/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.259 | DEBUG    | __main__:trials:29 - Trial = 17784/30000 | Total reward = 38.37
2022-01-26 14:17:52.264 | DEBUG    | __main__:trials:24 - Trial = 17785/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.265 | DEBUG    | __main__:trials:29 - Trial = 17785/30000 | Total reward = 45.24
2022-01-26 14:17:52.269 | DEBUG    | __main__:trials:24 - Trial = 17786/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.271 | DEBUG    | __main__:trials:29 - Trial = 17786/30000 | Total reward = 38.76
2022-01-26 14:17:52.275 | DEBUG    | __main__:trials:24 - Trial = 17787/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.276 | DEBUG    | __main__:trials:29 - Trial = 17787/30000 | Total reward = 44.33
2022-01-26 14:17:52.280 | DEBUG    | __main__:trials:24 - Trial = 17788/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.281 | DEBUG    | __main__:trials:29 - Trial = 17788/30000 | Total reward = 47.53
2022-01-26 14:17:52.285 | DEBUG    | __main__:trials:24 - Trial = 17789/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.286 | DEBUG    | __main__:trials:29 - Trial = 17789/30000 | Total reward = 34.44
2022-01-26 14:17:52.290 | DEBUG    | __main__:trials:24 - Trial = 17790/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.291 | DEBUG    | __main__:trials:29 - Trial = 17790/30000 | Total reward = 53.05
2022-01-26 14:17:52.295 | DEBUG    | __main__:trials:24 - Trial = 17791/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.296 | DEBUG    | __main__:trials:29 - Trial = 17791/30000 | Total reward = 60.86
2022-01-26 14:17:52.300 | DEBUG    | __main__:trials:24 - Trial = 17792/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.301 | DEBUG    | __main__:trials:29 - Trial = 17792/30000 | Total reward = 41.07
2022-01-26 14:17:52.306 | DEBUG    | __main__:trials:24 - Trial = 17793/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.306 | DEBUG    | __main__:trials:29 - Trial = 17793/30000 | Total reward = 49.64
2022-01-26 14:17:52.311 | DEBUG    | __main__:trials:24 - Trial = 17794/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.311 | DEBUG    | __main__:trials:29 - Trial = 17794/30000 | Total reward = 33.92
2022-01-26 14:17:52.316 | DEBUG    | __main__:trials:24 - Trial = 17795/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.317 | DEBUG    | __main__:trials:29 - Trial = 17795/30000 | Total reward = 57.53
2022-01-26 14:17:52.321 | DEBUG    | __main__:trials:24 - Trial = 17796/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.321 | DEBUG    | __main__:trials:29 - Trial = 17796/30000 | Total reward = 47.09
2022-01-26 14:17:52.326 | DEBUG    | __main__:trials:24 - Trial = 17797/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.328 | DEBUG    | __main__:trials:29 - Trial = 17797/30000 | Total reward = 44.40
2022-01-26 14:17:52.331 | DEBUG    | __main__:trials:24 - Trial = 17798/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.332 | DEBUG    | __main__:trials:29 - Trial = 17798/30000 | Total reward = 52.75
2022-01-26 14:17:52.336 | DEBUG    | __main__:trials:24 - Trial = 17799/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.337 | DEBUG    | __main__:trials:29 - Trial = 17799/30000 | Total reward = 55.07
2022-01-26 14:17:52.341 | DEBUG    | __main__:trials:24 - Trial = 17800/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.342 | DEBUG    | __main__:trials:29 - Trial = 17800/30000 | Total reward = 46.41
2022-01-26 14:17:52.346 | DEBUG    | __main__:trials:24 - Trial = 17801/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.348 | DEBUG    | __main__:trials:29 - Trial = 17801/30000 | Total reward = 42.77
2022-01-26 14:17:52.351 | DEBUG    | __main__:trials:26 - Trial = 17802/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:52.353 | DEBUG    | __main__:trials:29 - Trial = 17802/30000 | Total reward = 30.64
2022-01-26 14:17:52.356 | DEBUG    | __main__:trials:24 - Trial = 17803/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.357 | DEBUG    | __main__:trials:29 - Trial = 17803/30000 | Total reward = 45.59
2022-01-26 14:17:52.362 | DEBUG    | __main__:trials:24 - Trial = 17804/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.362 | DEBUG    | __main__:trials:29 - Trial = 17804/30000 | Total reward = 47.74
2022-01-26 14:17:52.367 | DEBUG    | __main__:trials:24 - Trial = 17805/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.368 | DEBUG    | __main__:trials:29 - Trial = 17805/30000 | Total reward = 29.59
2022-01-26 14:17:52.371 | DEBUG    | __main__:trials:24 - Trial = 17806/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.373 | DEBUG    | __main__:trials:29 - Trial = 17806/30000 | Total reward = 42.14
2022-01-26 14:17:52.377 | DEBUG    | __main__:trials:24 - Trial = 17807/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.379 | DEBUG    | __main__:trials:29 - Trial = 17807/30000 | Total reward = 47.01
2022-01-26 14:17:52.382 | DEBUG    | __main__:trials:24 - Trial = 17808/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.383 | DEBUG    | __main__:trials:29 - Trial = 17808/30000 | Total reward = 53.77
2022-01-26 14:17:52.387 | DEBUG    | __main__:trials:24 - Trial = 17809/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.389 | DEBUG    | __main__:trials:29 - Trial = 17809/30000 | Total reward = 55.64
2022-01-26 14:17:52.392 | DEBUG    | __main__:trials:24 - Trial = 17810/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.393 | DEBUG    | __main__:trials:29 - Trial = 17810/30000 | Total reward = 40.76
2022-01-26 14:17:52.397 | DEBUG    | __main__:trials:24 - Trial = 17811/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.398 | DEBUG    | __main__:trials:29 - Trial = 17811/30000 | Total reward = 56.20
2022-01-26 14:17:52.401 | DEBUG    | __main__:trials:24 - Trial = 17812/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.403 | DEBUG    | __main__:trials:29 - Trial = 17812/30000 | Total reward = 47.01
2022-01-26 14:17:52.406 | DEBUG    | __main__:trials:24 - Trial = 17813/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.407 | DEBUG    | __main__:trials:29 - Trial = 17813/30000 | Total reward = 46.86
2022-01-26 14:17:52.410 | DEBUG    | __main__:trials:24 - Trial = 17814/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.412 | DEBUG    | __main__:trials:29 - Trial = 17814/30000 | Total reward = 41.37
2022-01-26 14:17:52.416 | DEBUG    | __main__:trials:24 - Trial = 17815/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.416 | DEBUG    | __main__:trials:29 - Trial = 17815/30000 | Total reward = 61.36
2022-01-26 14:17:52.420 | DEBUG    | __main__:trials:24 - Trial = 17816/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.422 | DEBUG    | __main__:trials:29 - Trial = 17816/30000 | Total reward = 47.08
2022-01-26 14:17:52.425 | DEBUG    | __main__:trials:24 - Trial = 17817/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.426 | DEBUG    | __main__:trials:29 - Trial = 17817/30000 | Total reward = 47.01
2022-01-26 14:17:52.429 | DEBUG    | __main__:trials:24 - Trial = 17818/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.431 | DEBUG    | __main__:trials:29 - Trial = 17818/30000 | Total reward = 38.58
2022-01-26 14:17:52.434 | DEBUG    | __main__:trials:24 - Trial = 17819/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.436 | DEBUG    | __main__:trials:29 - Trial = 17819/30000 | Total reward = 47.01
2022-01-26 14:17:52.439 | DEBUG    | __main__:trials:24 - Trial = 17820/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.440 | DEBUG    | __main__:trials:29 - Trial = 17820/30000 | Total reward = 41.12
2022-01-26 14:17:52.443 | DEBUG    | __main__:trials:24 - Trial = 17821/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.445 | DEBUG    | __main__:trials:29 - Trial = 17821/30000 | Total reward = 38.45
2022-01-26 14:17:52.449 | DEBUG    | __main__:trials:24 - Trial = 17822/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.449 | DEBUG    | __main__:trials:29 - Trial = 17822/30000 | Total reward = 58.99
2022-01-26 14:17:52.453 | DEBUG    | __main__:trials:24 - Trial = 17823/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.454 | DEBUG    | __main__:trials:29 - Trial = 17823/30000 | Total reward = 31.29
2022-01-26 14:17:52.458 | DEBUG    | __main__:trials:24 - Trial = 17824/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.458 | DEBUG    | __main__:trials:29 - Trial = 17824/30000 | Total reward = 57.69
2022-01-26 14:17:52.461 | DEBUG    | __main__:trials:24 - Trial = 17825/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.463 | DEBUG    | __main__:trials:29 - Trial = 17825/30000 | Total reward = 59.24
2022-01-26 14:17:52.467 | DEBUG    | __main__:trials:24 - Trial = 17826/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.468 | DEBUG    | __main__:trials:29 - Trial = 17826/30000 | Total reward = 40.43
2022-01-26 14:17:52.471 | DEBUG    | __main__:trials:24 - Trial = 17827/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.472 | DEBUG    | __main__:trials:29 - Trial = 17827/30000 | Total reward = 63.34
2022-01-26 14:17:52.476 | DEBUG    | __main__:trials:24 - Trial = 17828/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.476 | DEBUG    | __main__:trials:29 - Trial = 17828/30000 | Total reward = 51.37
2022-01-26 14:17:52.480 | DEBUG    | __main__:trials:24 - Trial = 17829/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.481 | DEBUG    | __main__:trials:29 - Trial = 17829/30000 | Total reward = 50.56
2022-01-26 14:17:52.484 | DEBUG    | __main__:trials:24 - Trial = 17830/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.486 | DEBUG    | __main__:trials:29 - Trial = 17830/30000 | Total reward = 47.01
2022-01-26 14:17:52.489 | DEBUG    | __main__:trials:24 - Trial = 17831/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.490 | DEBUG    | __main__:trials:29 - Trial = 17831/30000 | Total reward = 47.70
2022-01-26 14:17:52.493 | DEBUG    | __main__:trials:24 - Trial = 17832/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.494 | DEBUG    | __main__:trials:29 - Trial = 17832/30000 | Total reward = 39.89
2022-01-26 14:17:52.497 | DEBUG    | __main__:trials:24 - Trial = 17833/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.498 | DEBUG    | __main__:trials:29 - Trial = 17833/30000 | Total reward = 36.12
2022-01-26 14:17:52.501 | DEBUG    | __main__:trials:24 - Trial = 17834/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.502 | DEBUG    | __main__:trials:29 - Trial = 17834/30000 | Total reward = 35.42
2022-01-26 14:17:52.506 | DEBUG    | __main__:trials:24 - Trial = 17835/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.507 | DEBUG    | __main__:trials:29 - Trial = 17835/30000 | Total reward = 58.36
2022-01-26 14:17:52.510 | DEBUG    | __main__:trials:24 - Trial = 17836/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.511 | DEBUG    | __main__:trials:29 - Trial = 17836/30000 | Total reward = 33.57
2022-01-26 14:17:52.514 | DEBUG    | __main__:trials:26 - Trial = 17837/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:52.514 | DEBUG    | __main__:trials:29 - Trial = 17837/30000 | Total reward = 30.48
2022-01-26 14:17:52.518 | DEBUG    | __main__:trials:24 - Trial = 17838/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.519 | DEBUG    | __main__:trials:29 - Trial = 17838/30000 | Total reward = 41.26
2022-01-26 14:17:52.523 | DEBUG    | __main__:trials:24 - Trial = 17839/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.524 | DEBUG    | __main__:trials:29 - Trial = 17839/30000 | Total reward = 38.46
2022-01-26 14:17:52.527 | DEBUG    | __main__:trials:24 - Trial = 17840/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.529 | DEBUG    | __main__:trials:29 - Trial = 17840/30000 | Total reward = 49.43
2022-01-26 14:17:52.532 | DEBUG    | __main__:trials:24 - Trial = 17841/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.533 | DEBUG    | __main__:trials:29 - Trial = 17841/30000 | Total reward = 41.23
2022-01-26 14:17:52.536 | DEBUG    | __main__:trials:24 - Trial = 17842/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.538 | DEBUG    | __main__:trials:29 - Trial = 17842/30000 | Total reward = 41.57
2022-01-26 14:17:52.541 | DEBUG    | __main__:trials:24 - Trial = 17843/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.543 | DEBUG    | __main__:trials:29 - Trial = 17843/30000 | Total reward = 47.04
2022-01-26 14:17:52.546 | DEBUG    | __main__:trials:24 - Trial = 17844/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.548 | DEBUG    | __main__:trials:29 - Trial = 17844/30000 | Total reward = 43.96
2022-01-26 14:17:52.551 | DEBUG    | __main__:trials:24 - Trial = 17845/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.552 | DEBUG    | __main__:trials:29 - Trial = 17845/30000 | Total reward = 45.96
2022-01-26 14:17:52.555 | DEBUG    | __main__:trials:24 - Trial = 17846/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.557 | DEBUG    | __main__:trials:29 - Trial = 17846/30000 | Total reward = 43.83
2022-01-26 14:17:52.561 | DEBUG    | __main__:trials:24 - Trial = 17847/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.562 | DEBUG    | __main__:trials:29 - Trial = 17847/30000 | Total reward = 47.14
2022-01-26 14:17:52.565 | DEBUG    | __main__:trials:24 - Trial = 17848/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.566 | DEBUG    | __main__:trials:29 - Trial = 17848/30000 | Total reward = 46.05
2022-01-26 14:17:52.569 | DEBUG    | __main__:trials:24 - Trial = 17849/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.571 | DEBUG    | __main__:trials:29 - Trial = 17849/30000 | Total reward = 47.21
2022-01-26 14:17:52.574 | DEBUG    | __main__:trials:24 - Trial = 17850/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.575 | DEBUG    | __main__:trials:29 - Trial = 17850/30000 | Total reward = 46.33
2022-01-26 14:17:52.580 | DEBUG    | __main__:trials:24 - Trial = 17851/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.580 | DEBUG    | __main__:trials:29 - Trial = 17851/30000 | Total reward = 58.14
2022-01-26 14:17:52.584 | DEBUG    | __main__:trials:24 - Trial = 17852/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.585 | DEBUG    | __main__:trials:29 - Trial = 17852/30000 | Total reward = 60.30
2022-01-26 14:17:52.589 | DEBUG    | __main__:trials:24 - Trial = 17853/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.590 | DEBUG    | __main__:trials:29 - Trial = 17853/30000 | Total reward = 41.02
2022-01-26 14:17:52.594 | DEBUG    | __main__:trials:24 - Trial = 17854/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.596 | DEBUG    | __main__:trials:29 - Trial = 17854/30000 | Total reward = 32.01
2022-01-26 14:17:52.598 | DEBUG    | __main__:trials:24 - Trial = 17855/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.600 | DEBUG    | __main__:trials:29 - Trial = 17855/30000 | Total reward = 63.75
2022-01-26 14:17:52.603 | DEBUG    | __main__:trials:24 - Trial = 17856/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.605 | DEBUG    | __main__:trials:29 - Trial = 17856/30000 | Total reward = 46.61
2022-01-26 14:17:52.608 | DEBUG    | __main__:trials:24 - Trial = 17857/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.610 | DEBUG    | __main__:trials:29 - Trial = 17857/30000 | Total reward = 47.25
2022-01-26 14:17:52.613 | DEBUG    | __main__:trials:24 - Trial = 17858/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.614 | DEBUG    | __main__:trials:29 - Trial = 17858/30000 | Total reward = 50.81
2022-01-26 14:17:52.617 | DEBUG    | __main__:trials:24 - Trial = 17859/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.619 | DEBUG    | __main__:trials:29 - Trial = 17859/30000 | Total reward = 47.55
2022-01-26 14:17:52.623 | DEBUG    | __main__:trials:24 - Trial = 17860/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.624 | DEBUG    | __main__:trials:29 - Trial = 17860/30000 | Total reward = 46.35
2022-01-26 14:17:52.628 | DEBUG    | __main__:trials:24 - Trial = 17861/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.628 | DEBUG    | __main__:trials:29 - Trial = 17861/30000 | Total reward = 39.11
2022-01-26 14:17:52.632 | DEBUG    | __main__:trials:24 - Trial = 17862/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.633 | DEBUG    | __main__:trials:29 - Trial = 17862/30000 | Total reward = 47.06
2022-01-26 14:17:52.636 | DEBUG    | __main__:trials:24 - Trial = 17863/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.637 | DEBUG    | __main__:trials:29 - Trial = 17863/30000 | Total reward = 48.23
2022-01-26 14:17:52.640 | DEBUG    | __main__:trials:24 - Trial = 17864/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.641 | DEBUG    | __main__:trials:29 - Trial = 17864/30000 | Total reward = 42.76
2022-01-26 14:17:52.644 | DEBUG    | __main__:trials:24 - Trial = 17865/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.646 | DEBUG    | __main__:trials:29 - Trial = 17865/30000 | Total reward = 49.22
2022-01-26 14:17:52.649 | DEBUG    | __main__:trials:24 - Trial = 17866/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.650 | DEBUG    | __main__:trials:29 - Trial = 17866/30000 | Total reward = 35.91
2022-01-26 14:17:52.653 | DEBUG    | __main__:trials:24 - Trial = 17867/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.653 | DEBUG    | __main__:trials:29 - Trial = 17867/30000 | Total reward = 39.61
2022-01-26 14:17:52.658 | DEBUG    | __main__:trials:24 - Trial = 17868/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.658 | DEBUG    | __main__:trials:29 - Trial = 17868/30000 | Total reward = 47.01
2022-01-26 14:17:52.662 | DEBUG    | __main__:trials:24 - Trial = 17869/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.663 | DEBUG    | __main__:trials:29 - Trial = 17869/30000 | Total reward = 36.54
2022-01-26 14:17:52.667 | DEBUG    | __main__:trials:24 - Trial = 17870/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.669 | DEBUG    | __main__:trials:29 - Trial = 17870/30000 | Total reward = 62.87
2022-01-26 14:17:52.672 | DEBUG    | __main__:trials:24 - Trial = 17871/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.673 | DEBUG    | __main__:trials:29 - Trial = 17871/30000 | Total reward = 54.30
2022-01-26 14:17:52.676 | DEBUG    | __main__:trials:24 - Trial = 17872/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.678 | DEBUG    | __main__:trials:29 - Trial = 17872/30000 | Total reward = 43.40
2022-01-26 14:17:52.681 | DEBUG    | __main__:trials:24 - Trial = 17873/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.683 | DEBUG    | __main__:trials:29 - Trial = 17873/30000 | Total reward = 59.66
2022-01-26 14:17:52.686 | DEBUG    | __main__:trials:24 - Trial = 17874/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.687 | DEBUG    | __main__:trials:29 - Trial = 17874/30000 | Total reward = 58.45
2022-01-26 14:17:52.690 | DEBUG    | __main__:trials:24 - Trial = 17875/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.692 | DEBUG    | __main__:trials:29 - Trial = 17875/30000 | Total reward = 44.64
2022-01-26 14:17:52.695 | DEBUG    | __main__:trials:24 - Trial = 17876/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.696 | DEBUG    | __main__:trials:29 - Trial = 17876/30000 | Total reward = 40.92
2022-01-26 14:17:52.701 | DEBUG    | __main__:trials:24 - Trial = 17877/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.701 | DEBUG    | __main__:trials:29 - Trial = 17877/30000 | Total reward = 47.64
2022-01-26 14:17:52.705 | DEBUG    | __main__:trials:24 - Trial = 17878/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.706 | DEBUG    | __main__:trials:29 - Trial = 17878/30000 | Total reward = 44.21
2022-01-26 14:17:52.710 | DEBUG    | __main__:trials:24 - Trial = 17879/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.711 | DEBUG    | __main__:trials:29 - Trial = 17879/30000 | Total reward = 59.89
2022-01-26 14:17:52.715 | DEBUG    | __main__:trials:24 - Trial = 17880/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.716 | DEBUG    | __main__:trials:29 - Trial = 17880/30000 | Total reward = 47.29
2022-01-26 14:17:52.719 | DEBUG    | __main__:trials:24 - Trial = 17881/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.721 | DEBUG    | __main__:trials:29 - Trial = 17881/30000 | Total reward = 37.10
2022-01-26 14:17:52.724 | DEBUG    | __main__:trials:24 - Trial = 17882/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.726 | DEBUG    | __main__:trials:29 - Trial = 17882/30000 | Total reward = 47.25
2022-01-26 14:17:52.729 | DEBUG    | __main__:trials:24 - Trial = 17883/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.730 | DEBUG    | __main__:trials:29 - Trial = 17883/30000 | Total reward = 46.21
2022-01-26 14:17:52.734 | DEBUG    | __main__:trials:24 - Trial = 17884/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.735 | DEBUG    | __main__:trials:29 - Trial = 17884/30000 | Total reward = 42.03
2022-01-26 14:17:52.739 | DEBUG    | __main__:trials:24 - Trial = 17885/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.741 | DEBUG    | __main__:trials:29 - Trial = 17885/30000 | Total reward = 42.51
2022-01-26 14:17:52.745 | DEBUG    | __main__:trials:24 - Trial = 17886/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.746 | DEBUG    | __main__:trials:29 - Trial = 17886/30000 | Total reward = 47.04
2022-01-26 14:17:52.750 | DEBUG    | __main__:trials:24 - Trial = 17887/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.752 | DEBUG    | __main__:trials:29 - Trial = 17887/30000 | Total reward = 64.89
2022-01-26 14:17:52.755 | DEBUG    | __main__:trials:24 - Trial = 17888/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.755 | DEBUG    | __main__:trials:29 - Trial = 17888/30000 | Total reward = 43.32
2022-01-26 14:17:52.760 | DEBUG    | __main__:trials:24 - Trial = 17889/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.761 | DEBUG    | __main__:trials:29 - Trial = 17889/30000 | Total reward = 39.70
2022-01-26 14:17:52.764 | DEBUG    | __main__:trials:26 - Trial = 17890/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:52.764 | DEBUG    | __main__:trials:29 - Trial = 17890/30000 | Total reward = 15.63
2022-01-26 14:17:52.768 | DEBUG    | __main__:trials:24 - Trial = 17891/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.769 | DEBUG    | __main__:trials:29 - Trial = 17891/30000 | Total reward = 55.24
2022-01-26 14:17:52.773 | DEBUG    | __main__:trials:24 - Trial = 17892/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.774 | DEBUG    | __main__:trials:29 - Trial = 17892/30000 | Total reward = 39.82
2022-01-26 14:17:52.778 | DEBUG    | __main__:trials:24 - Trial = 17893/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.779 | DEBUG    | __main__:trials:29 - Trial = 17893/30000 | Total reward = 52.24
2022-01-26 14:17:52.783 | DEBUG    | __main__:trials:26 - Trial = 17894/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:52.784 | DEBUG    | __main__:trials:29 - Trial = 17894/30000 | Total reward = 34.27
2022-01-26 14:17:52.789 | DEBUG    | __main__:trials:24 - Trial = 17895/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.791 | DEBUG    | __main__:trials:29 - Trial = 17895/30000 | Total reward = 53.36
2022-01-26 14:17:52.794 | DEBUG    | __main__:trials:24 - Trial = 17896/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.795 | DEBUG    | __main__:trials:29 - Trial = 17896/30000 | Total reward = 38.23
2022-01-26 14:17:52.799 | DEBUG    | __main__:trials:24 - Trial = 17897/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.800 | DEBUG    | __main__:trials:29 - Trial = 17897/30000 | Total reward = 39.62
2022-01-26 14:17:52.805 | DEBUG    | __main__:trials:24 - Trial = 17898/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.805 | DEBUG    | __main__:trials:29 - Trial = 17898/30000 | Total reward = 57.91
2022-01-26 14:17:52.809 | DEBUG    | __main__:trials:24 - Trial = 17899/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.810 | DEBUG    | __main__:trials:29 - Trial = 17899/30000 | Total reward = 37.99
2022-01-26 14:17:52.814 | DEBUG    | __main__:trials:24 - Trial = 17900/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.816 | DEBUG    | __main__:trials:29 - Trial = 17900/30000 | Total reward = 53.23
2022-01-26 14:17:52.820 | DEBUG    | __main__:trials:24 - Trial = 17901/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.822 | DEBUG    | __main__:trials:29 - Trial = 17901/30000 | Total reward = 38.79
2022-01-26 14:17:52.825 | DEBUG    | __main__:trials:24 - Trial = 17902/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.827 | DEBUG    | __main__:trials:29 - Trial = 17902/30000 | Total reward = 57.69
2022-01-26 14:17:52.830 | DEBUG    | __main__:trials:24 - Trial = 17903/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.832 | DEBUG    | __main__:trials:29 - Trial = 17903/30000 | Total reward = 37.15
2022-01-26 14:17:52.835 | DEBUG    | __main__:trials:24 - Trial = 17904/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.837 | DEBUG    | __main__:trials:29 - Trial = 17904/30000 | Total reward = 45.69
2022-01-26 14:17:52.840 | DEBUG    | __main__:trials:24 - Trial = 17905/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.841 | DEBUG    | __main__:trials:29 - Trial = 17905/30000 | Total reward = 47.30
2022-01-26 14:17:52.845 | DEBUG    | __main__:trials:24 - Trial = 17906/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.846 | DEBUG    | __main__:trials:29 - Trial = 17906/30000 | Total reward = 45.57
2022-01-26 14:17:52.850 | DEBUG    | __main__:trials:24 - Trial = 17907/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.852 | DEBUG    | __main__:trials:29 - Trial = 17907/30000 | Total reward = 57.15
2022-01-26 14:17:52.855 | DEBUG    | __main__:trials:24 - Trial = 17908/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.857 | DEBUG    | __main__:trials:29 - Trial = 17908/30000 | Total reward = 46.73
2022-01-26 14:17:52.861 | DEBUG    | __main__:trials:24 - Trial = 17909/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.861 | DEBUG    | __main__:trials:29 - Trial = 17909/30000 | Total reward = 48.91
2022-01-26 14:17:52.865 | DEBUG    | __main__:trials:24 - Trial = 17910/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.867 | DEBUG    | __main__:trials:29 - Trial = 17910/30000 | Total reward = 46.16
2022-01-26 14:17:52.870 | DEBUG    | __main__:trials:24 - Trial = 17911/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.872 | DEBUG    | __main__:trials:29 - Trial = 17911/30000 | Total reward = 36.49
2022-01-26 14:17:52.876 | DEBUG    | __main__:trials:24 - Trial = 17912/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.878 | DEBUG    | __main__:trials:29 - Trial = 17912/30000 | Total reward = 53.51
2022-01-26 14:17:52.881 | DEBUG    | __main__:trials:24 - Trial = 17913/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.883 | DEBUG    | __main__:trials:29 - Trial = 17913/30000 | Total reward = 43.52
2022-01-26 14:17:52.887 | DEBUG    | __main__:trials:24 - Trial = 17914/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.888 | DEBUG    | __main__:trials:29 - Trial = 17914/30000 | Total reward = 46.99
2022-01-26 14:17:52.891 | DEBUG    | __main__:trials:24 - Trial = 17915/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.893 | DEBUG    | __main__:trials:29 - Trial = 17915/30000 | Total reward = 53.60
2022-01-26 14:17:52.897 | DEBUG    | __main__:trials:24 - Trial = 17916/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.898 | DEBUG    | __main__:trials:29 - Trial = 17916/30000 | Total reward = 41.98
2022-01-26 14:17:52.901 | DEBUG    | __main__:trials:24 - Trial = 17917/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.902 | DEBUG    | __main__:trials:29 - Trial = 17917/30000 | Total reward = 52.52
2022-01-26 14:17:52.905 | DEBUG    | __main__:trials:24 - Trial = 17918/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.906 | DEBUG    | __main__:trials:29 - Trial = 17918/30000 | Total reward = 43.26
2022-01-26 14:17:52.910 | DEBUG    | __main__:trials:24 - Trial = 17919/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.910 | DEBUG    | __main__:trials:29 - Trial = 17919/30000 | Total reward = 33.43
2022-01-26 14:17:52.914 | DEBUG    | __main__:trials:24 - Trial = 17920/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.915 | DEBUG    | __main__:trials:29 - Trial = 17920/30000 | Total reward = 54.55
2022-01-26 14:17:52.919 | DEBUG    | __main__:trials:24 - Trial = 17921/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.920 | DEBUG    | __main__:trials:29 - Trial = 17921/30000 | Total reward = 42.39
2022-01-26 14:17:52.924 | DEBUG    | __main__:trials:24 - Trial = 17922/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.925 | DEBUG    | __main__:trials:29 - Trial = 17922/30000 | Total reward = 38.17
2022-01-26 14:17:52.929 | DEBUG    | __main__:trials:24 - Trial = 17923/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.930 | DEBUG    | __main__:trials:29 - Trial = 17923/30000 | Total reward = 35.67
2022-01-26 14:17:52.934 | DEBUG    | __main__:trials:24 - Trial = 17924/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.935 | DEBUG    | __main__:trials:29 - Trial = 17924/30000 | Total reward = 46.99
2022-01-26 14:17:52.938 | DEBUG    | __main__:trials:24 - Trial = 17925/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.939 | DEBUG    | __main__:trials:29 - Trial = 17925/30000 | Total reward = 40.88
2022-01-26 14:17:52.942 | DEBUG    | __main__:trials:24 - Trial = 17926/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.943 | DEBUG    | __main__:trials:29 - Trial = 17926/30000 | Total reward = 32.61
2022-01-26 14:17:52.946 | DEBUG    | __main__:trials:24 - Trial = 17927/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.947 | DEBUG    | __main__:trials:29 - Trial = 17927/30000 | Total reward = 38.94
2022-01-26 14:17:52.950 | DEBUG    | __main__:trials:24 - Trial = 17928/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.952 | DEBUG    | __main__:trials:29 - Trial = 17928/30000 | Total reward = 59.37
2022-01-26 14:17:52.954 | DEBUG    | __main__:trials:26 - Trial = 17929/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:52.956 | DEBUG    | __main__:trials:29 - Trial = 17929/30000 | Total reward = 17.46
2022-01-26 14:17:52.959 | DEBUG    | __main__:trials:24 - Trial = 17930/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.960 | DEBUG    | __main__:trials:29 - Trial = 17930/30000 | Total reward = 39.97
2022-01-26 14:17:52.964 | DEBUG    | __main__:trials:24 - Trial = 17931/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.965 | DEBUG    | __main__:trials:29 - Trial = 17931/30000 | Total reward = 47.29
2022-01-26 14:17:52.969 | DEBUG    | __main__:trials:24 - Trial = 17932/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.970 | DEBUG    | __main__:trials:29 - Trial = 17932/30000 | Total reward = 35.44
2022-01-26 14:17:52.974 | DEBUG    | __main__:trials:24 - Trial = 17933/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.975 | DEBUG    | __main__:trials:29 - Trial = 17933/30000 | Total reward = 62.37
2022-01-26 14:17:52.978 | DEBUG    | __main__:trials:24 - Trial = 17934/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.980 | DEBUG    | __main__:trials:29 - Trial = 17934/30000 | Total reward = 37.32
2022-01-26 14:17:52.983 | DEBUG    | __main__:trials:24 - Trial = 17935/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.985 | DEBUG    | __main__:trials:29 - Trial = 17935/30000 | Total reward = 35.46
2022-01-26 14:17:52.989 | DEBUG    | __main__:trials:24 - Trial = 17936/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.991 | DEBUG    | __main__:trials:29 - Trial = 17936/30000 | Total reward = 48.78
2022-01-26 14:17:52.994 | DEBUG    | __main__:trials:24 - Trial = 17937/30000 | Max number of steps (20) reached
2022-01-26 14:17:52.996 | DEBUG    | __main__:trials:29 - Trial = 17937/30000 | Total reward = 36.74
2022-01-26 14:17:53.000 | DEBUG    | __main__:trials:24 - Trial = 17938/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.001 | DEBUG    | __main__:trials:29 - Trial = 17938/30000 | Total reward = 47.09
2022-01-26 14:17:53.005 | DEBUG    | __main__:trials:24 - Trial = 17939/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.007 | DEBUG    | __main__:trials:29 - Trial = 17939/30000 | Total reward = 47.69
2022-01-26 14:17:53.010 | DEBUG    | __main__:trials:24 - Trial = 17940/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.012 | DEBUG    | __main__:trials:29 - Trial = 17940/30000 | Total reward = 47.27
2022-01-26 14:17:53.016 | DEBUG    | __main__:trials:24 - Trial = 17941/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.018 | DEBUG    | __main__:trials:29 - Trial = 17941/30000 | Total reward = 57.11
2022-01-26 14:17:53.021 | DEBUG    | __main__:trials:24 - Trial = 17942/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.022 | DEBUG    | __main__:trials:29 - Trial = 17942/30000 | Total reward = 47.00
2022-01-26 14:17:53.027 | DEBUG    | __main__:trials:24 - Trial = 17943/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.028 | DEBUG    | __main__:trials:29 - Trial = 17943/30000 | Total reward = 44.45
2022-01-26 14:17:53.032 | DEBUG    | __main__:trials:24 - Trial = 17944/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.034 | DEBUG    | __main__:trials:29 - Trial = 17944/30000 | Total reward = 36.35
2022-01-26 14:17:53.037 | DEBUG    | __main__:trials:24 - Trial = 17945/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.038 | DEBUG    | __main__:trials:29 - Trial = 17945/30000 | Total reward = 38.79
2022-01-26 14:17:53.043 | DEBUG    | __main__:trials:24 - Trial = 17946/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.044 | DEBUG    | __main__:trials:29 - Trial = 17946/30000 | Total reward = 41.58
2022-01-26 14:17:53.048 | DEBUG    | __main__:trials:24 - Trial = 17947/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.050 | DEBUG    | __main__:trials:29 - Trial = 17947/30000 | Total reward = 58.64
2022-01-26 14:17:53.054 | DEBUG    | __main__:trials:24 - Trial = 17948/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.054 | DEBUG    | __main__:trials:29 - Trial = 17948/30000 | Total reward = 47.06
2022-01-26 14:17:53.059 | DEBUG    | __main__:trials:24 - Trial = 17949/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.060 | DEBUG    | __main__:trials:29 - Trial = 17949/30000 | Total reward = 52.66
2022-01-26 14:17:53.064 | DEBUG    | __main__:trials:24 - Trial = 17950/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.066 | DEBUG    | __main__:trials:29 - Trial = 17950/30000 | Total reward = 59.05
2022-01-26 14:17:53.069 | DEBUG    | __main__:trials:24 - Trial = 17951/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.071 | DEBUG    | __main__:trials:29 - Trial = 17951/30000 | Total reward = 59.79
2022-01-26 14:17:53.074 | DEBUG    | __main__:trials:24 - Trial = 17952/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.076 | DEBUG    | __main__:trials:29 - Trial = 17952/30000 | Total reward = 52.57
2022-01-26 14:17:53.079 | DEBUG    | __main__:trials:24 - Trial = 17953/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.080 | DEBUG    | __main__:trials:29 - Trial = 17953/30000 | Total reward = 48.00
2022-01-26 14:17:53.083 | DEBUG    | __main__:trials:24 - Trial = 17954/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.085 | DEBUG    | __main__:trials:29 - Trial = 17954/30000 | Total reward = 44.21
2022-01-26 14:17:53.088 | DEBUG    | __main__:trials:24 - Trial = 17955/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.090 | DEBUG    | __main__:trials:29 - Trial = 17955/30000 | Total reward = 53.35
2022-01-26 14:17:53.093 | DEBUG    | __main__:trials:24 - Trial = 17956/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.095 | DEBUG    | __main__:trials:29 - Trial = 17956/30000 | Total reward = 49.90
2022-01-26 14:17:53.098 | DEBUG    | __main__:trials:24 - Trial = 17957/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.100 | DEBUG    | __main__:trials:29 - Trial = 17957/30000 | Total reward = 52.04
2022-01-26 14:17:53.103 | DEBUG    | __main__:trials:24 - Trial = 17958/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.105 | DEBUG    | __main__:trials:29 - Trial = 17958/30000 | Total reward = 39.85
2022-01-26 14:17:53.108 | DEBUG    | __main__:trials:24 - Trial = 17959/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.110 | DEBUG    | __main__:trials:29 - Trial = 17959/30000 | Total reward = 44.49
2022-01-26 14:17:53.113 | DEBUG    | __main__:trials:24 - Trial = 17960/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.114 | DEBUG    | __main__:trials:29 - Trial = 17960/30000 | Total reward = 40.02
2022-01-26 14:17:53.117 | DEBUG    | __main__:trials:24 - Trial = 17961/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.118 | DEBUG    | __main__:trials:29 - Trial = 17961/30000 | Total reward = 52.47
2022-01-26 14:17:53.121 | DEBUG    | __main__:trials:24 - Trial = 17962/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.123 | DEBUG    | __main__:trials:29 - Trial = 17962/30000 | Total reward = 54.52
2022-01-26 14:17:53.126 | DEBUG    | __main__:trials:24 - Trial = 17963/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.127 | DEBUG    | __main__:trials:29 - Trial = 17963/30000 | Total reward = 65.59
2022-01-26 14:17:53.131 | DEBUG    | __main__:trials:24 - Trial = 17964/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.133 | DEBUG    | __main__:trials:29 - Trial = 17964/30000 | Total reward = 57.63
2022-01-26 14:17:53.136 | DEBUG    | __main__:trials:24 - Trial = 17965/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.137 | DEBUG    | __main__:trials:29 - Trial = 17965/30000 | Total reward = 57.32
2022-01-26 14:17:53.140 | DEBUG    | __main__:trials:24 - Trial = 17966/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.141 | DEBUG    | __main__:trials:29 - Trial = 17966/30000 | Total reward = 49.44
2022-01-26 14:17:53.146 | DEBUG    | __main__:trials:24 - Trial = 17967/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.146 | DEBUG    | __main__:trials:29 - Trial = 17967/30000 | Total reward = 39.64
2022-01-26 14:17:53.151 | DEBUG    | __main__:trials:24 - Trial = 17968/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.152 | DEBUG    | __main__:trials:29 - Trial = 17968/30000 | Total reward = 65.56
2022-01-26 14:17:53.155 | DEBUG    | __main__:trials:24 - Trial = 17969/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.157 | DEBUG    | __main__:trials:29 - Trial = 17969/30000 | Total reward = 65.06
2022-01-26 14:17:53.160 | DEBUG    | __main__:trials:24 - Trial = 17970/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.162 | DEBUG    | __main__:trials:29 - Trial = 17970/30000 | Total reward = 50.84
2022-01-26 14:17:53.165 | DEBUG    | __main__:trials:24 - Trial = 17971/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.166 | DEBUG    | __main__:trials:29 - Trial = 17971/30000 | Total reward = 50.78
2022-01-26 14:17:53.169 | DEBUG    | __main__:trials:24 - Trial = 17972/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.170 | DEBUG    | __main__:trials:29 - Trial = 17972/30000 | Total reward = 48.28
2022-01-26 14:17:53.174 | DEBUG    | __main__:trials:24 - Trial = 17973/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.175 | DEBUG    | __main__:trials:29 - Trial = 17973/30000 | Total reward = 49.64
2022-01-26 14:17:53.179 | DEBUG    | __main__:trials:24 - Trial = 17974/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.179 | DEBUG    | __main__:trials:29 - Trial = 17974/30000 | Total reward = 41.06
2022-01-26 14:17:53.184 | DEBUG    | __main__:trials:24 - Trial = 17975/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.185 | DEBUG    | __main__:trials:29 - Trial = 17975/30000 | Total reward = 47.77
2022-01-26 14:17:53.189 | DEBUG    | __main__:trials:24 - Trial = 17976/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.190 | DEBUG    | __main__:trials:29 - Trial = 17976/30000 | Total reward = 36.74
2022-01-26 14:17:53.193 | DEBUG    | __main__:trials:24 - Trial = 17977/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.196 | DEBUG    | __main__:trials:29 - Trial = 17977/30000 | Total reward = 55.07
2022-01-26 14:17:53.199 | DEBUG    | __main__:trials:24 - Trial = 17978/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.200 | DEBUG    | __main__:trials:29 - Trial = 17978/30000 | Total reward = 44.40
2022-01-26 14:17:53.204 | DEBUG    | __main__:trials:24 - Trial = 17979/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.206 | DEBUG    | __main__:trials:29 - Trial = 17979/30000 | Total reward = 47.69
2022-01-26 14:17:53.210 | DEBUG    | __main__:trials:24 - Trial = 17980/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.212 | DEBUG    | __main__:trials:29 - Trial = 17980/30000 | Total reward = 57.55
2022-01-26 14:17:53.215 | DEBUG    | __main__:trials:24 - Trial = 17981/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.217 | DEBUG    | __main__:trials:29 - Trial = 17981/30000 | Total reward = 53.05
2022-01-26 14:17:53.220 | DEBUG    | __main__:trials:26 - Trial = 17982/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.222 | DEBUG    | __main__:trials:29 - Trial = 17982/30000 | Total reward = 30.28
2022-01-26 14:17:53.225 | DEBUG    | __main__:trials:24 - Trial = 17983/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.227 | DEBUG    | __main__:trials:29 - Trial = 17983/30000 | Total reward = 62.64
2022-01-26 14:17:53.231 | DEBUG    | __main__:trials:24 - Trial = 17984/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.232 | DEBUG    | __main__:trials:29 - Trial = 17984/30000 | Total reward = 46.74
2022-01-26 14:17:53.236 | DEBUG    | __main__:trials:24 - Trial = 17985/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.237 | DEBUG    | __main__:trials:29 - Trial = 17985/30000 | Total reward = 40.49
2022-01-26 14:17:53.241 | DEBUG    | __main__:trials:24 - Trial = 17986/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.241 | DEBUG    | __main__:trials:29 - Trial = 17986/30000 | Total reward = 45.72
2022-01-26 14:17:53.245 | DEBUG    | __main__:trials:24 - Trial = 17987/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.246 | DEBUG    | __main__:trials:29 - Trial = 17987/30000 | Total reward = 53.30
2022-01-26 14:17:53.250 | DEBUG    | __main__:trials:24 - Trial = 17988/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.252 | DEBUG    | __main__:trials:29 - Trial = 17988/30000 | Total reward = 47.82
2022-01-26 14:17:53.255 | DEBUG    | __main__:trials:24 - Trial = 17989/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.255 | DEBUG    | __main__:trials:29 - Trial = 17989/30000 | Total reward = 49.19
2022-01-26 14:17:53.259 | DEBUG    | __main__:trials:24 - Trial = 17990/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.261 | DEBUG    | __main__:trials:29 - Trial = 17990/30000 | Total reward = 48.09
2022-01-26 14:17:53.265 | DEBUG    | __main__:trials:24 - Trial = 17991/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.266 | DEBUG    | __main__:trials:29 - Trial = 17991/30000 | Total reward = 54.63
2022-01-26 14:17:53.269 | DEBUG    | __main__:trials:24 - Trial = 17992/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.271 | DEBUG    | __main__:trials:29 - Trial = 17992/30000 | Total reward = 37.55
2022-01-26 14:17:53.273 | DEBUG    | __main__:trials:26 - Trial = 17993/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.274 | DEBUG    | __main__:trials:29 - Trial = 17993/30000 | Total reward = 25.43
2022-01-26 14:17:53.278 | DEBUG    | __main__:trials:24 - Trial = 17994/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.279 | DEBUG    | __main__:trials:29 - Trial = 17994/30000 | Total reward = 49.40
2022-01-26 14:17:53.282 | DEBUG    | __main__:trials:24 - Trial = 17995/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.284 | DEBUG    | __main__:trials:29 - Trial = 17995/30000 | Total reward = 43.81
2022-01-26 14:17:53.287 | DEBUG    | __main__:trials:24 - Trial = 17996/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.287 | DEBUG    | __main__:trials:29 - Trial = 17996/30000 | Total reward = 34.98
2022-01-26 14:17:53.291 | DEBUG    | __main__:trials:24 - Trial = 17997/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.293 | DEBUG    | __main__:trials:29 - Trial = 17997/30000 | Total reward = 44.07
2022-01-26 14:17:53.296 | DEBUG    | __main__:trials:24 - Trial = 17998/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.296 | DEBUG    | __main__:trials:29 - Trial = 17998/30000 | Total reward = 46.48
2022-01-26 14:17:53.300 | DEBUG    | __main__:trials:24 - Trial = 17999/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.301 | DEBUG    | __main__:trials:29 - Trial = 17999/30000 | Total reward = 40.11
2022-01-26 14:17:53.304 | DEBUG    | __main__:trials:24 - Trial = 18000/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.305 | DEBUG    | __main__:trials:29 - Trial = 18000/30000 | Total reward = 43.10
2022-01-26 14:17:53.309 | DEBUG    | __main__:trials:24 - Trial = 18001/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.310 | DEBUG    | __main__:trials:29 - Trial = 18001/30000 | Total reward = 43.96
2022-01-26 14:17:53.314 | DEBUG    | __main__:trials:26 - Trial = 18002/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.314 | DEBUG    | __main__:trials:29 - Trial = 18002/30000 | Total reward = 25.61
2022-01-26 14:17:53.318 | DEBUG    | __main__:trials:24 - Trial = 18003/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.319 | DEBUG    | __main__:trials:29 - Trial = 18003/30000 | Total reward = 39.27
2022-01-26 14:17:53.322 | DEBUG    | __main__:trials:24 - Trial = 18004/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.323 | DEBUG    | __main__:trials:29 - Trial = 18004/30000 | Total reward = 49.00
2022-01-26 14:17:53.327 | DEBUG    | __main__:trials:24 - Trial = 18005/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.327 | DEBUG    | __main__:trials:29 - Trial = 18005/30000 | Total reward = 48.55
2022-01-26 14:17:53.331 | DEBUG    | __main__:trials:24 - Trial = 18006/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.333 | DEBUG    | __main__:trials:29 - Trial = 18006/30000 | Total reward = 49.10
2022-01-26 14:17:53.335 | DEBUG    | __main__:trials:24 - Trial = 18007/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.337 | DEBUG    | __main__:trials:29 - Trial = 18007/30000 | Total reward = 43.44
2022-01-26 14:17:53.340 | DEBUG    | __main__:trials:24 - Trial = 18008/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.341 | DEBUG    | __main__:trials:29 - Trial = 18008/30000 | Total reward = 35.93
2022-01-26 14:17:53.344 | DEBUG    | __main__:trials:24 - Trial = 18009/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.345 | DEBUG    | __main__:trials:29 - Trial = 18009/30000 | Total reward = 41.90
2022-01-26 14:17:53.348 | DEBUG    | __main__:trials:24 - Trial = 18010/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.349 | DEBUG    | __main__:trials:29 - Trial = 18010/30000 | Total reward = 47.91
2022-01-26 14:17:53.353 | DEBUG    | __main__:trials:24 - Trial = 18011/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.354 | DEBUG    | __main__:trials:29 - Trial = 18011/30000 | Total reward = 40.52
2022-01-26 14:17:53.357 | DEBUG    | __main__:trials:24 - Trial = 18012/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.358 | DEBUG    | __main__:trials:29 - Trial = 18012/30000 | Total reward = 59.61
2022-01-26 14:17:53.361 | DEBUG    | __main__:trials:24 - Trial = 18013/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.362 | DEBUG    | __main__:trials:29 - Trial = 18013/30000 | Total reward = 41.78
2022-01-26 14:17:53.366 | DEBUG    | __main__:trials:24 - Trial = 18014/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.368 | DEBUG    | __main__:trials:29 - Trial = 18014/30000 | Total reward = 51.65
2022-01-26 14:17:53.371 | DEBUG    | __main__:trials:24 - Trial = 18015/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.371 | DEBUG    | __main__:trials:29 - Trial = 18015/30000 | Total reward = 49.52
2022-01-26 14:17:53.374 | DEBUG    | __main__:trials:24 - Trial = 18016/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.375 | DEBUG    | __main__:trials:29 - Trial = 18016/30000 | Total reward = 55.37
2022-01-26 14:17:53.378 | DEBUG    | __main__:trials:24 - Trial = 18017/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.379 | DEBUG    | __main__:trials:29 - Trial = 18017/30000 | Total reward = 51.96
2022-01-26 14:17:53.383 | DEBUG    | __main__:trials:24 - Trial = 18018/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.383 | DEBUG    | __main__:trials:29 - Trial = 18018/30000 | Total reward = 48.62
2022-01-26 14:17:53.387 | DEBUG    | __main__:trials:24 - Trial = 18019/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.389 | DEBUG    | __main__:trials:29 - Trial = 18019/30000 | Total reward = 43.55
2022-01-26 14:17:53.392 | DEBUG    | __main__:trials:24 - Trial = 18020/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.394 | DEBUG    | __main__:trials:29 - Trial = 18020/30000 | Total reward = 43.70
2022-01-26 14:17:53.397 | DEBUG    | __main__:trials:24 - Trial = 18021/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.399 | DEBUG    | __main__:trials:29 - Trial = 18021/30000 | Total reward = 51.44
2022-01-26 14:17:53.403 | DEBUG    | __main__:trials:24 - Trial = 18022/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.404 | DEBUG    | __main__:trials:29 - Trial = 18022/30000 | Total reward = 45.67
2022-01-26 14:17:53.407 | DEBUG    | __main__:trials:24 - Trial = 18023/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.409 | DEBUG    | __main__:trials:29 - Trial = 18023/30000 | Total reward = 53.60
2022-01-26 14:17:53.412 | DEBUG    | __main__:trials:24 - Trial = 18024/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.413 | DEBUG    | __main__:trials:29 - Trial = 18024/30000 | Total reward = 49.82
2022-01-26 14:17:53.416 | DEBUG    | __main__:trials:24 - Trial = 18025/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.418 | DEBUG    | __main__:trials:29 - Trial = 18025/30000 | Total reward = 60.36
2022-01-26 14:17:53.422 | DEBUG    | __main__:trials:24 - Trial = 18026/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.423 | DEBUG    | __main__:trials:29 - Trial = 18026/30000 | Total reward = 60.51
2022-01-26 14:17:53.427 | DEBUG    | __main__:trials:24 - Trial = 18027/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.428 | DEBUG    | __main__:trials:29 - Trial = 18027/30000 | Total reward = 48.30
2022-01-26 14:17:53.432 | DEBUG    | __main__:trials:24 - Trial = 18028/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.434 | DEBUG    | __main__:trials:29 - Trial = 18028/30000 | Total reward = 47.92
2022-01-26 14:17:53.437 | DEBUG    | __main__:trials:24 - Trial = 18029/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.439 | DEBUG    | __main__:trials:29 - Trial = 18029/30000 | Total reward = 53.09
2022-01-26 14:17:53.443 | DEBUG    | __main__:trials:24 - Trial = 18030/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.444 | DEBUG    | __main__:trials:29 - Trial = 18030/30000 | Total reward = 54.58
2022-01-26 14:17:53.449 | DEBUG    | __main__:trials:24 - Trial = 18031/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.450 | DEBUG    | __main__:trials:29 - Trial = 18031/30000 | Total reward = 38.02
2022-01-26 14:17:53.454 | DEBUG    | __main__:trials:24 - Trial = 18032/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.455 | DEBUG    | __main__:trials:29 - Trial = 18032/30000 | Total reward = 68.52
2022-01-26 14:17:53.459 | DEBUG    | __main__:trials:24 - Trial = 18033/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.460 | DEBUG    | __main__:trials:29 - Trial = 18033/30000 | Total reward = 54.82
2022-01-26 14:17:53.465 | DEBUG    | __main__:trials:24 - Trial = 18034/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.465 | DEBUG    | __main__:trials:29 - Trial = 18034/30000 | Total reward = 50.19
2022-01-26 14:17:53.470 | DEBUG    | __main__:trials:24 - Trial = 18035/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.471 | DEBUG    | __main__:trials:29 - Trial = 18035/30000 | Total reward = 58.84
2022-01-26 14:17:53.475 | DEBUG    | __main__:trials:24 - Trial = 18036/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.477 | DEBUG    | __main__:trials:29 - Trial = 18036/30000 | Total reward = 47.83
2022-01-26 14:17:53.480 | DEBUG    | __main__:trials:24 - Trial = 18037/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.482 | DEBUG    | __main__:trials:29 - Trial = 18037/30000 | Total reward = 44.52
2022-01-26 14:17:53.486 | DEBUG    | __main__:trials:24 - Trial = 18038/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.486 | DEBUG    | __main__:trials:29 - Trial = 18038/30000 | Total reward = 45.20
2022-01-26 14:17:53.491 | DEBUG    | __main__:trials:24 - Trial = 18039/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.492 | DEBUG    | __main__:trials:29 - Trial = 18039/30000 | Total reward = 58.44
2022-01-26 14:17:53.496 | DEBUG    | __main__:trials:24 - Trial = 18040/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.497 | DEBUG    | __main__:trials:29 - Trial = 18040/30000 | Total reward = 46.52
2022-01-26 14:17:53.501 | DEBUG    | __main__:trials:24 - Trial = 18041/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.502 | DEBUG    | __main__:trials:29 - Trial = 18041/30000 | Total reward = 51.23
2022-01-26 14:17:53.505 | DEBUG    | __main__:trials:24 - Trial = 18042/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.507 | DEBUG    | __main__:trials:29 - Trial = 18042/30000 | Total reward = 43.01
2022-01-26 14:17:53.510 | DEBUG    | __main__:trials:24 - Trial = 18043/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.512 | DEBUG    | __main__:trials:29 - Trial = 18043/30000 | Total reward = 38.38
2022-01-26 14:17:53.516 | DEBUG    | __main__:trials:24 - Trial = 18044/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.516 | DEBUG    | __main__:trials:29 - Trial = 18044/30000 | Total reward = 43.17
2022-01-26 14:17:53.521 | DEBUG    | __main__:trials:24 - Trial = 18045/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.522 | DEBUG    | __main__:trials:29 - Trial = 18045/30000 | Total reward = 44.61
2022-01-26 14:17:53.526 | DEBUG    | __main__:trials:24 - Trial = 18046/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.527 | DEBUG    | __main__:trials:29 - Trial = 18046/30000 | Total reward = 47.74
2022-01-26 14:17:53.531 | DEBUG    | __main__:trials:24 - Trial = 18047/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.533 | DEBUG    | __main__:trials:29 - Trial = 18047/30000 | Total reward = 56.61
2022-01-26 14:17:53.536 | DEBUG    | __main__:trials:24 - Trial = 18048/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.537 | DEBUG    | __main__:trials:29 - Trial = 18048/30000 | Total reward = 63.02
2022-01-26 14:17:53.541 | DEBUG    | __main__:trials:24 - Trial = 18049/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.543 | DEBUG    | __main__:trials:29 - Trial = 18049/30000 | Total reward = 37.54
2022-01-26 14:17:53.546 | DEBUG    | __main__:trials:24 - Trial = 18050/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.548 | DEBUG    | __main__:trials:29 - Trial = 18050/30000 | Total reward = 41.25
2022-01-26 14:17:53.552 | DEBUG    | __main__:trials:24 - Trial = 18051/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.552 | DEBUG    | __main__:trials:29 - Trial = 18051/30000 | Total reward = 45.46
2022-01-26 14:17:53.556 | DEBUG    | __main__:trials:24 - Trial = 18052/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.558 | DEBUG    | __main__:trials:29 - Trial = 18052/30000 | Total reward = 49.11
2022-01-26 14:17:53.562 | DEBUG    | __main__:trials:24 - Trial = 18053/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.562 | DEBUG    | __main__:trials:29 - Trial = 18053/30000 | Total reward = 60.22
2022-01-26 14:17:53.567 | DEBUG    | __main__:trials:24 - Trial = 18054/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.568 | DEBUG    | __main__:trials:29 - Trial = 18054/30000 | Total reward = 55.96
2022-01-26 14:17:53.571 | DEBUG    | __main__:trials:24 - Trial = 18055/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.573 | DEBUG    | __main__:trials:29 - Trial = 18055/30000 | Total reward = 48.08
2022-01-26 14:17:53.576 | DEBUG    | __main__:trials:24 - Trial = 18056/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.577 | DEBUG    | __main__:trials:29 - Trial = 18056/30000 | Total reward = 45.43
2022-01-26 14:17:53.581 | DEBUG    | __main__:trials:24 - Trial = 18057/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.582 | DEBUG    | __main__:trials:29 - Trial = 18057/30000 | Total reward = 45.01
2022-01-26 14:17:53.586 | DEBUG    | __main__:trials:24 - Trial = 18058/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.587 | DEBUG    | __main__:trials:29 - Trial = 18058/30000 | Total reward = 53.14
2022-01-26 14:17:53.591 | DEBUG    | __main__:trials:24 - Trial = 18059/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.593 | DEBUG    | __main__:trials:29 - Trial = 18059/30000 | Total reward = 56.30
2022-01-26 14:17:53.596 | DEBUG    | __main__:trials:24 - Trial = 18060/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.597 | DEBUG    | __main__:trials:29 - Trial = 18060/30000 | Total reward = 48.30
2022-01-26 14:17:53.602 | DEBUG    | __main__:trials:24 - Trial = 18061/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.603 | DEBUG    | __main__:trials:29 - Trial = 18061/30000 | Total reward = 49.19
2022-01-26 14:17:53.606 | DEBUG    | __main__:trials:24 - Trial = 18062/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.608 | DEBUG    | __main__:trials:29 - Trial = 18062/30000 | Total reward = 43.19
2022-01-26 14:17:53.611 | DEBUG    | __main__:trials:24 - Trial = 18063/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.612 | DEBUG    | __main__:trials:29 - Trial = 18063/30000 | Total reward = 56.66
2022-01-26 14:17:53.616 | DEBUG    | __main__:trials:24 - Trial = 18064/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.617 | DEBUG    | __main__:trials:29 - Trial = 18064/30000 | Total reward = 53.77
2022-01-26 14:17:53.621 | DEBUG    | __main__:trials:24 - Trial = 18065/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.622 | DEBUG    | __main__:trials:29 - Trial = 18065/30000 | Total reward = 55.34
2022-01-26 14:17:53.625 | DEBUG    | __main__:trials:24 - Trial = 18066/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.626 | DEBUG    | __main__:trials:29 - Trial = 18066/30000 | Total reward = 48.10
2022-01-26 14:17:53.630 | DEBUG    | __main__:trials:24 - Trial = 18067/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.632 | DEBUG    | __main__:trials:29 - Trial = 18067/30000 | Total reward = 45.26
2022-01-26 14:17:53.635 | DEBUG    | __main__:trials:24 - Trial = 18068/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.636 | DEBUG    | __main__:trials:29 - Trial = 18068/30000 | Total reward = 46.07
2022-01-26 14:17:53.640 | DEBUG    | __main__:trials:24 - Trial = 18069/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.642 | DEBUG    | __main__:trials:29 - Trial = 18069/30000 | Total reward = 46.04
2022-01-26 14:17:53.645 | DEBUG    | __main__:trials:24 - Trial = 18070/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.647 | DEBUG    | __main__:trials:29 - Trial = 18070/30000 | Total reward = 51.16
2022-01-26 14:17:53.650 | DEBUG    | __main__:trials:24 - Trial = 18071/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.652 | DEBUG    | __main__:trials:29 - Trial = 18071/30000 | Total reward = 56.40
2022-01-26 14:17:53.656 | DEBUG    | __main__:trials:24 - Trial = 18072/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.656 | DEBUG    | __main__:trials:29 - Trial = 18072/30000 | Total reward = 48.12
2022-01-26 14:17:53.660 | DEBUG    | __main__:trials:24 - Trial = 18073/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.662 | DEBUG    | __main__:trials:29 - Trial = 18073/30000 | Total reward = 51.52
2022-01-26 14:17:53.665 | DEBUG    | __main__:trials:24 - Trial = 18074/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.666 | DEBUG    | __main__:trials:29 - Trial = 18074/30000 | Total reward = 48.14
2022-01-26 14:17:53.670 | DEBUG    | __main__:trials:24 - Trial = 18075/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.671 | DEBUG    | __main__:trials:29 - Trial = 18075/30000 | Total reward = 41.86
2022-01-26 14:17:53.675 | DEBUG    | __main__:trials:24 - Trial = 18076/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.677 | DEBUG    | __main__:trials:29 - Trial = 18076/30000 | Total reward = 49.76
2022-01-26 14:17:53.681 | DEBUG    | __main__:trials:24 - Trial = 18077/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.682 | DEBUG    | __main__:trials:29 - Trial = 18077/30000 | Total reward = 44.46
2022-01-26 14:17:53.685 | DEBUG    | __main__:trials:24 - Trial = 18078/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.686 | DEBUG    | __main__:trials:29 - Trial = 18078/30000 | Total reward = 53.17
2022-01-26 14:17:53.691 | DEBUG    | __main__:trials:24 - Trial = 18079/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.692 | DEBUG    | __main__:trials:29 - Trial = 18079/30000 | Total reward = 40.57
2022-01-26 14:17:53.695 | DEBUG    | __main__:trials:24 - Trial = 18080/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.697 | DEBUG    | __main__:trials:29 - Trial = 18080/30000 | Total reward = 49.47
2022-01-26 14:17:53.700 | DEBUG    | __main__:trials:24 - Trial = 18081/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.702 | DEBUG    | __main__:trials:29 - Trial = 18081/30000 | Total reward = 35.84
2022-01-26 14:17:53.706 | DEBUG    | __main__:trials:24 - Trial = 18082/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.706 | DEBUG    | __main__:trials:29 - Trial = 18082/30000 | Total reward = 51.16
2022-01-26 14:17:53.711 | DEBUG    | __main__:trials:24 - Trial = 18083/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.712 | DEBUG    | __main__:trials:29 - Trial = 18083/30000 | Total reward = 40.57
2022-01-26 14:17:53.715 | DEBUG    | __main__:trials:26 - Trial = 18084/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.716 | DEBUG    | __main__:trials:29 - Trial = 18084/30000 | Total reward = 19.65
2022-01-26 14:17:53.720 | DEBUG    | __main__:trials:24 - Trial = 18085/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.722 | DEBUG    | __main__:trials:29 - Trial = 18085/30000 | Total reward = 38.62
2022-01-26 14:17:53.725 | DEBUG    | __main__:trials:24 - Trial = 18086/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.727 | DEBUG    | __main__:trials:29 - Trial = 18086/30000 | Total reward = 41.59
2022-01-26 14:17:53.731 | DEBUG    | __main__:trials:24 - Trial = 18087/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.731 | DEBUG    | __main__:trials:29 - Trial = 18087/30000 | Total reward = 40.56
2022-01-26 14:17:53.736 | DEBUG    | __main__:trials:24 - Trial = 18088/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.737 | DEBUG    | __main__:trials:29 - Trial = 18088/30000 | Total reward = 53.08
2022-01-26 14:17:53.741 | DEBUG    | __main__:trials:24 - Trial = 18089/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.742 | DEBUG    | __main__:trials:29 - Trial = 18089/30000 | Total reward = 51.35
2022-01-26 14:17:53.745 | DEBUG    | __main__:trials:24 - Trial = 18090/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.746 | DEBUG    | __main__:trials:29 - Trial = 18090/30000 | Total reward = 39.77
2022-01-26 14:17:53.750 | DEBUG    | __main__:trials:24 - Trial = 18091/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.751 | DEBUG    | __main__:trials:29 - Trial = 18091/30000 | Total reward = 44.99
2022-01-26 14:17:53.755 | DEBUG    | __main__:trials:24 - Trial = 18092/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.756 | DEBUG    | __main__:trials:29 - Trial = 18092/30000 | Total reward = 49.33
2022-01-26 14:17:53.760 | DEBUG    | __main__:trials:24 - Trial = 18093/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.762 | DEBUG    | __main__:trials:29 - Trial = 18093/30000 | Total reward = 48.87
2022-01-26 14:17:53.765 | DEBUG    | __main__:trials:26 - Trial = 18094/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.767 | DEBUG    | __main__:trials:29 - Trial = 18094/30000 | Total reward = 31.33
2022-01-26 14:17:53.771 | DEBUG    | __main__:trials:24 - Trial = 18095/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.771 | DEBUG    | __main__:trials:29 - Trial = 18095/30000 | Total reward = 56.56
2022-01-26 14:17:53.776 | DEBUG    | __main__:trials:24 - Trial = 18096/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.776 | DEBUG    | __main__:trials:29 - Trial = 18096/30000 | Total reward = 52.52
2022-01-26 14:17:53.781 | DEBUG    | __main__:trials:24 - Trial = 18097/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.782 | DEBUG    | __main__:trials:29 - Trial = 18097/30000 | Total reward = 48.26
2022-01-26 14:17:53.786 | DEBUG    | __main__:trials:24 - Trial = 18098/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.788 | DEBUG    | __main__:trials:29 - Trial = 18098/30000 | Total reward = 49.23
2022-01-26 14:17:53.792 | DEBUG    | __main__:trials:24 - Trial = 18099/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.793 | DEBUG    | __main__:trials:29 - Trial = 18099/30000 | Total reward = 43.08
2022-01-26 14:17:53.797 | DEBUG    | __main__:trials:24 - Trial = 18100/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.799 | DEBUG    | __main__:trials:29 - Trial = 18100/30000 | Total reward = 30.75
2022-01-26 14:17:53.803 | DEBUG    | __main__:trials:24 - Trial = 18101/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.806 | DEBUG    | __main__:trials:29 - Trial = 18101/30000 | Total reward = 56.43
2022-01-26 14:17:53.810 | DEBUG    | __main__:trials:24 - Trial = 18102/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.811 | DEBUG    | __main__:trials:29 - Trial = 18102/30000 | Total reward = 41.93
2022-01-26 14:17:53.815 | DEBUG    | __main__:trials:24 - Trial = 18103/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.817 | DEBUG    | __main__:trials:29 - Trial = 18103/30000 | Total reward = 39.26
2022-01-26 14:17:53.820 | DEBUG    | __main__:trials:24 - Trial = 18104/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.822 | DEBUG    | __main__:trials:29 - Trial = 18104/30000 | Total reward = 44.65
2022-01-26 14:17:53.825 | DEBUG    | __main__:trials:24 - Trial = 18105/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.827 | DEBUG    | __main__:trials:29 - Trial = 18105/30000 | Total reward = 42.78
2022-01-26 14:17:53.830 | DEBUG    | __main__:trials:24 - Trial = 18106/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.832 | DEBUG    | __main__:trials:29 - Trial = 18106/30000 | Total reward = 53.87
2022-01-26 14:17:53.836 | DEBUG    | __main__:trials:24 - Trial = 18107/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.836 | DEBUG    | __main__:trials:29 - Trial = 18107/30000 | Total reward = 44.75
2022-01-26 14:17:53.840 | DEBUG    | __main__:trials:24 - Trial = 18108/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.842 | DEBUG    | __main__:trials:29 - Trial = 18108/30000 | Total reward = 52.45
2022-01-26 14:17:53.846 | DEBUG    | __main__:trials:24 - Trial = 18109/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.846 | DEBUG    | __main__:trials:29 - Trial = 18109/30000 | Total reward = 44.11
2022-01-26 14:17:53.851 | DEBUG    | __main__:trials:24 - Trial = 18110/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.852 | DEBUG    | __main__:trials:29 - Trial = 18110/30000 | Total reward = 36.68
2022-01-26 14:17:53.855 | DEBUG    | __main__:trials:24 - Trial = 18111/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.857 | DEBUG    | __main__:trials:29 - Trial = 18111/30000 | Total reward = 37.05
2022-01-26 14:17:53.860 | DEBUG    | __main__:trials:24 - Trial = 18112/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.862 | DEBUG    | __main__:trials:29 - Trial = 18112/30000 | Total reward = 35.68
2022-01-26 14:17:53.865 | DEBUG    | __main__:trials:24 - Trial = 18113/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.866 | DEBUG    | __main__:trials:29 - Trial = 18113/30000 | Total reward = 47.82
2022-01-26 14:17:53.870 | DEBUG    | __main__:trials:24 - Trial = 18114/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.870 | DEBUG    | __main__:trials:29 - Trial = 18114/30000 | Total reward = 35.84
2022-01-26 14:17:53.875 | DEBUG    | __main__:trials:24 - Trial = 18115/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.876 | DEBUG    | __main__:trials:29 - Trial = 18115/30000 | Total reward = 41.74
2022-01-26 14:17:53.879 | DEBUG    | __main__:trials:24 - Trial = 18116/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.881 | DEBUG    | __main__:trials:29 - Trial = 18116/30000 | Total reward = 53.17
2022-01-26 14:17:53.884 | DEBUG    | __main__:trials:24 - Trial = 18117/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.886 | DEBUG    | __main__:trials:29 - Trial = 18117/30000 | Total reward = 43.35
2022-01-26 14:17:53.890 | DEBUG    | __main__:trials:24 - Trial = 18118/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.890 | DEBUG    | __main__:trials:29 - Trial = 18118/30000 | Total reward = 51.89
2022-01-26 14:17:53.894 | DEBUG    | __main__:trials:24 - Trial = 18119/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.896 | DEBUG    | __main__:trials:29 - Trial = 18119/30000 | Total reward = 63.10
2022-01-26 14:17:53.899 | DEBUG    | __main__:trials:24 - Trial = 18120/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.900 | DEBUG    | __main__:trials:29 - Trial = 18120/30000 | Total reward = 43.06
2022-01-26 14:17:53.903 | DEBUG    | __main__:trials:24 - Trial = 18121/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.905 | DEBUG    | __main__:trials:29 - Trial = 18121/30000 | Total reward = 54.17
2022-01-26 14:17:53.908 | DEBUG    | __main__:trials:24 - Trial = 18122/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.910 | DEBUG    | __main__:trials:29 - Trial = 18122/30000 | Total reward = 39.82
2022-01-26 14:17:53.913 | DEBUG    | __main__:trials:24 - Trial = 18123/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.914 | DEBUG    | __main__:trials:29 - Trial = 18123/30000 | Total reward = 40.61
2022-01-26 14:17:53.918 | DEBUG    | __main__:trials:26 - Trial = 18124/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.919 | DEBUG    | __main__:trials:29 - Trial = 18124/30000 | Total reward = 11.73
2022-01-26 14:17:53.923 | DEBUG    | __main__:trials:24 - Trial = 18125/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.925 | DEBUG    | __main__:trials:29 - Trial = 18125/30000 | Total reward = 50.42
2022-01-26 14:17:53.928 | DEBUG    | __main__:trials:24 - Trial = 18126/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.929 | DEBUG    | __main__:trials:29 - Trial = 18126/30000 | Total reward = 56.49
2022-01-26 14:17:53.932 | DEBUG    | __main__:trials:24 - Trial = 18127/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.933 | DEBUG    | __main__:trials:29 - Trial = 18127/30000 | Total reward = 31.53
2022-01-26 14:17:53.937 | DEBUG    | __main__:trials:24 - Trial = 18128/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.938 | DEBUG    | __main__:trials:29 - Trial = 18128/30000 | Total reward = 43.37
2022-01-26 14:17:53.942 | DEBUG    | __main__:trials:24 - Trial = 18129/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.943 | DEBUG    | __main__:trials:29 - Trial = 18129/30000 | Total reward = 47.24
2022-01-26 14:17:53.946 | DEBUG    | __main__:trials:24 - Trial = 18130/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.948 | DEBUG    | __main__:trials:29 - Trial = 18130/30000 | Total reward = 40.99
2022-01-26 14:17:53.952 | DEBUG    | __main__:trials:24 - Trial = 18131/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.953 | DEBUG    | __main__:trials:29 - Trial = 18131/30000 | Total reward = 54.32
2022-01-26 14:17:53.957 | DEBUG    | __main__:trials:24 - Trial = 18132/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.959 | DEBUG    | __main__:trials:29 - Trial = 18132/30000 | Total reward = 46.20
2022-01-26 14:17:53.962 | DEBUG    | __main__:trials:24 - Trial = 18133/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.963 | DEBUG    | __main__:trials:29 - Trial = 18133/30000 | Total reward = 39.65
2022-01-26 14:17:53.966 | DEBUG    | __main__:trials:24 - Trial = 18134/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.968 | DEBUG    | __main__:trials:29 - Trial = 18134/30000 | Total reward = 40.21
2022-01-26 14:17:53.972 | DEBUG    | __main__:trials:24 - Trial = 18135/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.973 | DEBUG    | __main__:trials:29 - Trial = 18135/30000 | Total reward = 62.24
2022-01-26 14:17:53.977 | DEBUG    | __main__:trials:24 - Trial = 18136/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.979 | DEBUG    | __main__:trials:29 - Trial = 18136/30000 | Total reward = 36.67
2022-01-26 14:17:53.982 | DEBUG    | __main__:trials:24 - Trial = 18137/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.984 | DEBUG    | __main__:trials:29 - Trial = 18137/30000 | Total reward = 55.15
2022-01-26 14:17:53.987 | DEBUG    | __main__:trials:24 - Trial = 18138/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.988 | DEBUG    | __main__:trials:29 - Trial = 18138/30000 | Total reward = 32.45
2022-01-26 14:17:53.992 | DEBUG    | __main__:trials:24 - Trial = 18139/30000 | Max number of steps (20) reached
2022-01-26 14:17:53.993 | DEBUG    | __main__:trials:29 - Trial = 18139/30000 | Total reward = 28.93
2022-01-26 14:17:53.996 | DEBUG    | __main__:trials:26 - Trial = 18140/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:53.998 | DEBUG    | __main__:trials:29 - Trial = 18140/30000 | Total reward = 33.32
2022-01-26 14:17:54.002 | DEBUG    | __main__:trials:24 - Trial = 18141/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.003 | DEBUG    | __main__:trials:29 - Trial = 18141/30000 | Total reward = 42.06
2022-01-26 14:17:54.007 | DEBUG    | __main__:trials:24 - Trial = 18142/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.008 | DEBUG    | __main__:trials:29 - Trial = 18142/30000 | Total reward = 65.80
2022-01-26 14:17:54.012 | DEBUG    | __main__:trials:24 - Trial = 18143/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.013 | DEBUG    | __main__:trials:29 - Trial = 18143/30000 | Total reward = 56.78
2022-01-26 14:17:54.017 | DEBUG    | __main__:trials:24 - Trial = 18144/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.018 | DEBUG    | __main__:trials:29 - Trial = 18144/30000 | Total reward = 51.51
2022-01-26 14:17:54.023 | DEBUG    | __main__:trials:24 - Trial = 18145/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.024 | DEBUG    | __main__:trials:29 - Trial = 18145/30000 | Total reward = 51.81
2022-01-26 14:17:54.028 | DEBUG    | __main__:trials:24 - Trial = 18146/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.029 | DEBUG    | __main__:trials:29 - Trial = 18146/30000 | Total reward = 48.20
2022-01-26 14:17:54.033 | DEBUG    | __main__:trials:24 - Trial = 18147/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.034 | DEBUG    | __main__:trials:29 - Trial = 18147/30000 | Total reward = 54.88
2022-01-26 14:17:54.037 | DEBUG    | __main__:trials:24 - Trial = 18148/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.038 | DEBUG    | __main__:trials:29 - Trial = 18148/30000 | Total reward = 60.91
2022-01-26 14:17:54.042 | DEBUG    | __main__:trials:24 - Trial = 18149/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.043 | DEBUG    | __main__:trials:29 - Trial = 18149/30000 | Total reward = 40.80
2022-01-26 14:17:54.047 | DEBUG    | __main__:trials:26 - Trial = 18150/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.048 | DEBUG    | __main__:trials:29 - Trial = 18150/30000 | Total reward = 26.13
2022-01-26 14:17:54.052 | DEBUG    | __main__:trials:24 - Trial = 18151/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.053 | DEBUG    | __main__:trials:29 - Trial = 18151/30000 | Total reward = 42.23
2022-01-26 14:17:54.057 | DEBUG    | __main__:trials:24 - Trial = 18152/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.058 | DEBUG    | __main__:trials:29 - Trial = 18152/30000 | Total reward = 48.01
2022-01-26 14:17:54.062 | DEBUG    | __main__:trials:24 - Trial = 18153/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.063 | DEBUG    | __main__:trials:29 - Trial = 18153/30000 | Total reward = 46.89
2022-01-26 14:17:54.067 | DEBUG    | __main__:trials:24 - Trial = 18154/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.069 | DEBUG    | __main__:trials:29 - Trial = 18154/30000 | Total reward = 51.46
2022-01-26 14:17:54.072 | DEBUG    | __main__:trials:24 - Trial = 18155/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.074 | DEBUG    | __main__:trials:29 - Trial = 18155/30000 | Total reward = 29.31
2022-01-26 14:17:54.077 | DEBUG    | __main__:trials:24 - Trial = 18156/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.079 | DEBUG    | __main__:trials:29 - Trial = 18156/30000 | Total reward = 45.63
2022-01-26 14:17:54.082 | DEBUG    | __main__:trials:24 - Trial = 18157/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.082 | DEBUG    | __main__:trials:29 - Trial = 18157/30000 | Total reward = 54.19
2022-01-26 14:17:54.086 | DEBUG    | __main__:trials:24 - Trial = 18158/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.086 | DEBUG    | __main__:trials:29 - Trial = 18158/30000 | Total reward = 38.69
2022-01-26 14:17:54.090 | DEBUG    | __main__:trials:24 - Trial = 18159/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.091 | DEBUG    | __main__:trials:29 - Trial = 18159/30000 | Total reward = 48.48
2022-01-26 14:17:54.095 | DEBUG    | __main__:trials:24 - Trial = 18160/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.097 | DEBUG    | __main__:trials:29 - Trial = 18160/30000 | Total reward = 53.44
2022-01-26 14:17:54.100 | DEBUG    | __main__:trials:24 - Trial = 18161/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.101 | DEBUG    | __main__:trials:29 - Trial = 18161/30000 | Total reward = 45.06
2022-01-26 14:17:54.104 | DEBUG    | __main__:trials:24 - Trial = 18162/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.105 | DEBUG    | __main__:trials:29 - Trial = 18162/30000 | Total reward = 47.76
2022-01-26 14:17:54.108 | DEBUG    | __main__:trials:24 - Trial = 18163/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.110 | DEBUG    | __main__:trials:29 - Trial = 18163/30000 | Total reward = 37.85
2022-01-26 14:17:54.113 | DEBUG    | __main__:trials:24 - Trial = 18164/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.115 | DEBUG    | __main__:trials:29 - Trial = 18164/30000 | Total reward = 62.85
2022-01-26 14:17:54.119 | DEBUG    | __main__:trials:24 - Trial = 18165/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.119 | DEBUG    | __main__:trials:29 - Trial = 18165/30000 | Total reward = 57.04
2022-01-26 14:17:54.124 | DEBUG    | __main__:trials:24 - Trial = 18166/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.125 | DEBUG    | __main__:trials:29 - Trial = 18166/30000 | Total reward = 46.61
2022-01-26 14:17:54.128 | DEBUG    | __main__:trials:24 - Trial = 18167/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.132 | DEBUG    | __main__:trials:29 - Trial = 18167/30000 | Total reward = 40.75
2022-01-26 14:17:54.135 | DEBUG    | __main__:trials:24 - Trial = 18168/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.137 | DEBUG    | __main__:trials:29 - Trial = 18168/30000 | Total reward = 42.58
2022-01-26 14:17:54.140 | DEBUG    | __main__:trials:24 - Trial = 18169/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.142 | DEBUG    | __main__:trials:29 - Trial = 18169/30000 | Total reward = 50.53
2022-01-26 14:17:54.145 | DEBUG    | __main__:trials:24 - Trial = 18170/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.146 | DEBUG    | __main__:trials:29 - Trial = 18170/30000 | Total reward = 59.72
2022-01-26 14:17:54.150 | DEBUG    | __main__:trials:26 - Trial = 18171/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.151 | DEBUG    | __main__:trials:29 - Trial = 18171/30000 | Total reward = 25.86
2022-01-26 14:17:54.155 | DEBUG    | __main__:trials:24 - Trial = 18172/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.157 | DEBUG    | __main__:trials:29 - Trial = 18172/30000 | Total reward = 43.61
2022-01-26 14:17:54.160 | DEBUG    | __main__:trials:24 - Trial = 18173/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.162 | DEBUG    | __main__:trials:29 - Trial = 18173/30000 | Total reward = 46.44
2022-01-26 14:17:54.166 | DEBUG    | __main__:trials:24 - Trial = 18174/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.167 | DEBUG    | __main__:trials:29 - Trial = 18174/30000 | Total reward = 47.30
2022-01-26 14:17:54.170 | DEBUG    | __main__:trials:26 - Trial = 18175/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.171 | DEBUG    | __main__:trials:29 - Trial = 18175/30000 | Total reward = 10.75
2022-01-26 14:17:54.175 | DEBUG    | __main__:trials:24 - Trial = 18176/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.176 | DEBUG    | __main__:trials:29 - Trial = 18176/30000 | Total reward = 47.52
2022-01-26 14:17:54.179 | DEBUG    | __main__:trials:24 - Trial = 18177/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.181 | DEBUG    | __main__:trials:29 - Trial = 18177/30000 | Total reward = 61.62
2022-01-26 14:17:54.184 | DEBUG    | __main__:trials:24 - Trial = 18178/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.186 | DEBUG    | __main__:trials:29 - Trial = 18178/30000 | Total reward = 44.19
2022-01-26 14:17:54.190 | DEBUG    | __main__:trials:24 - Trial = 18179/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.191 | DEBUG    | __main__:trials:29 - Trial = 18179/30000 | Total reward = 40.58
2022-01-26 14:17:54.194 | DEBUG    | __main__:trials:24 - Trial = 18180/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.196 | DEBUG    | __main__:trials:29 - Trial = 18180/30000 | Total reward = 34.39
2022-01-26 14:17:54.199 | DEBUG    | __main__:trials:24 - Trial = 18181/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.201 | DEBUG    | __main__:trials:29 - Trial = 18181/30000 | Total reward = 56.37
2022-01-26 14:17:54.205 | DEBUG    | __main__:trials:24 - Trial = 18182/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.206 | DEBUG    | __main__:trials:29 - Trial = 18182/30000 | Total reward = 35.72
2022-01-26 14:17:54.210 | DEBUG    | __main__:trials:24 - Trial = 18183/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.210 | DEBUG    | __main__:trials:29 - Trial = 18183/30000 | Total reward = 47.51
2022-01-26 14:17:54.215 | DEBUG    | __main__:trials:24 - Trial = 18184/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.217 | DEBUG    | __main__:trials:29 - Trial = 18184/30000 | Total reward = 43.69
2022-01-26 14:17:54.220 | DEBUG    | __main__:trials:24 - Trial = 18185/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.222 | DEBUG    | __main__:trials:29 - Trial = 18185/30000 | Total reward = 58.30
2022-01-26 14:17:54.225 | DEBUG    | __main__:trials:24 - Trial = 18186/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.227 | DEBUG    | __main__:trials:29 - Trial = 18186/30000 | Total reward = 47.76
2022-01-26 14:17:54.230 | DEBUG    | __main__:trials:24 - Trial = 18187/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.232 | DEBUG    | __main__:trials:29 - Trial = 18187/30000 | Total reward = 48.41
2022-01-26 14:17:54.235 | DEBUG    | __main__:trials:24 - Trial = 18188/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.237 | DEBUG    | __main__:trials:29 - Trial = 18188/30000 | Total reward = 50.03
2022-01-26 14:17:54.240 | DEBUG    | __main__:trials:24 - Trial = 18189/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.242 | DEBUG    | __main__:trials:29 - Trial = 18189/30000 | Total reward = 42.63
2022-01-26 14:17:54.246 | DEBUG    | __main__:trials:24 - Trial = 18190/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.247 | DEBUG    | __main__:trials:29 - Trial = 18190/30000 | Total reward = 44.80
2022-01-26 14:17:54.251 | DEBUG    | __main__:trials:24 - Trial = 18191/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.252 | DEBUG    | __main__:trials:29 - Trial = 18191/30000 | Total reward = 48.07
2022-01-26 14:17:54.256 | DEBUG    | __main__:trials:24 - Trial = 18192/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.257 | DEBUG    | __main__:trials:29 - Trial = 18192/30000 | Total reward = 41.36
2022-01-26 14:17:54.261 | DEBUG    | __main__:trials:24 - Trial = 18193/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.262 | DEBUG    | __main__:trials:29 - Trial = 18193/30000 | Total reward = 48.06
2022-01-26 14:17:54.266 | DEBUG    | __main__:trials:24 - Trial = 18194/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.267 | DEBUG    | __main__:trials:29 - Trial = 18194/30000 | Total reward = 48.07
2022-01-26 14:17:54.271 | DEBUG    | __main__:trials:24 - Trial = 18195/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.272 | DEBUG    | __main__:trials:29 - Trial = 18195/30000 | Total reward = 57.82
2022-01-26 14:17:54.276 | DEBUG    | __main__:trials:24 - Trial = 18196/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.277 | DEBUG    | __main__:trials:29 - Trial = 18196/30000 | Total reward = 46.91
2022-01-26 14:17:54.281 | DEBUG    | __main__:trials:24 - Trial = 18197/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.282 | DEBUG    | __main__:trials:29 - Trial = 18197/30000 | Total reward = 46.84
2022-01-26 14:17:54.286 | DEBUG    | __main__:trials:24 - Trial = 18198/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.287 | DEBUG    | __main__:trials:29 - Trial = 18198/30000 | Total reward = 43.71
2022-01-26 14:17:54.290 | DEBUG    | __main__:trials:24 - Trial = 18199/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.292 | DEBUG    | __main__:trials:29 - Trial = 18199/30000 | Total reward = 42.41
2022-01-26 14:17:54.296 | DEBUG    | __main__:trials:24 - Trial = 18200/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.297 | DEBUG    | __main__:trials:29 - Trial = 18200/30000 | Total reward = 33.90
2022-01-26 14:17:54.301 | DEBUG    | __main__:trials:24 - Trial = 18201/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.302 | DEBUG    | __main__:trials:29 - Trial = 18201/30000 | Total reward = 48.42
2022-01-26 14:17:54.306 | DEBUG    | __main__:trials:24 - Trial = 18202/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.307 | DEBUG    | __main__:trials:29 - Trial = 18202/30000 | Total reward = 57.19
2022-01-26 14:17:54.311 | DEBUG    | __main__:trials:24 - Trial = 18203/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.312 | DEBUG    | __main__:trials:29 - Trial = 18203/30000 | Total reward = 51.97
2022-01-26 14:17:54.316 | DEBUG    | __main__:trials:24 - Trial = 18204/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.318 | DEBUG    | __main__:trials:29 - Trial = 18204/30000 | Total reward = 46.16
2022-01-26 14:17:54.322 | DEBUG    | __main__:trials:24 - Trial = 18205/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.323 | DEBUG    | __main__:trials:29 - Trial = 18205/30000 | Total reward = 54.08
2022-01-26 14:17:54.327 | DEBUG    | __main__:trials:24 - Trial = 18206/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.328 | DEBUG    | __main__:trials:29 - Trial = 18206/30000 | Total reward = 43.93
2022-01-26 14:17:54.332 | DEBUG    | __main__:trials:24 - Trial = 18207/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.333 | DEBUG    | __main__:trials:29 - Trial = 18207/30000 | Total reward = 52.13
2022-01-26 14:17:54.337 | DEBUG    | __main__:trials:24 - Trial = 18208/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.338 | DEBUG    | __main__:trials:29 - Trial = 18208/30000 | Total reward = 33.83
2022-01-26 14:17:54.342 | DEBUG    | __main__:trials:24 - Trial = 18209/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.344 | DEBUG    | __main__:trials:29 - Trial = 18209/30000 | Total reward = 20.07
2022-01-26 14:17:54.347 | DEBUG    | __main__:trials:24 - Trial = 18210/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.348 | DEBUG    | __main__:trials:29 - Trial = 18210/30000 | Total reward = 45.65
2022-01-26 14:17:54.351 | DEBUG    | __main__:trials:24 - Trial = 18211/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.353 | DEBUG    | __main__:trials:29 - Trial = 18211/30000 | Total reward = 38.24
2022-01-26 14:17:54.357 | DEBUG    | __main__:trials:24 - Trial = 18212/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.358 | DEBUG    | __main__:trials:29 - Trial = 18212/30000 | Total reward = 18.31
2022-01-26 14:17:54.361 | DEBUG    | __main__:trials:24 - Trial = 18213/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.363 | DEBUG    | __main__:trials:29 - Trial = 18213/30000 | Total reward = 37.07
2022-01-26 14:17:54.366 | DEBUG    | __main__:trials:24 - Trial = 18214/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.368 | DEBUG    | __main__:trials:29 - Trial = 18214/30000 | Total reward = 36.09
2022-01-26 14:17:54.371 | DEBUG    | __main__:trials:26 - Trial = 18215/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.373 | DEBUG    | __main__:trials:29 - Trial = 18215/30000 | Total reward = 22.30
2022-01-26 14:17:54.376 | DEBUG    | __main__:trials:24 - Trial = 18216/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.377 | DEBUG    | __main__:trials:29 - Trial = 18216/30000 | Total reward = 37.93
2022-01-26 14:17:54.382 | DEBUG    | __main__:trials:24 - Trial = 18217/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.382 | DEBUG    | __main__:trials:29 - Trial = 18217/30000 | Total reward = 35.14
2022-01-26 14:17:54.386 | DEBUG    | __main__:trials:24 - Trial = 18218/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.387 | DEBUG    | __main__:trials:29 - Trial = 18218/30000 | Total reward = 42.38
2022-01-26 14:17:54.391 | DEBUG    | __main__:trials:24 - Trial = 18219/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.392 | DEBUG    | __main__:trials:29 - Trial = 18219/30000 | Total reward = 32.10
2022-01-26 14:17:54.396 | DEBUG    | __main__:trials:24 - Trial = 18220/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.397 | DEBUG    | __main__:trials:29 - Trial = 18220/30000 | Total reward = 35.69
2022-01-26 14:17:54.400 | DEBUG    | __main__:trials:24 - Trial = 18221/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.401 | DEBUG    | __main__:trials:29 - Trial = 18221/30000 | Total reward = 35.80
2022-01-26 14:17:54.406 | DEBUG    | __main__:trials:24 - Trial = 18222/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.406 | DEBUG    | __main__:trials:29 - Trial = 18222/30000 | Total reward = 53.19
2022-01-26 14:17:54.411 | DEBUG    | __main__:trials:24 - Trial = 18223/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.412 | DEBUG    | __main__:trials:29 - Trial = 18223/30000 | Total reward = 27.90
2022-01-26 14:17:54.416 | DEBUG    | __main__:trials:24 - Trial = 18224/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.418 | DEBUG    | __main__:trials:29 - Trial = 18224/30000 | Total reward = 57.23
2022-01-26 14:17:54.420 | DEBUG    | __main__:trials:26 - Trial = 18225/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.421 | DEBUG    | __main__:trials:29 - Trial = 18225/30000 | Total reward = 15.34
2022-01-26 14:17:54.424 | DEBUG    | __main__:trials:24 - Trial = 18226/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.425 | DEBUG    | __main__:trials:29 - Trial = 18226/30000 | Total reward = 47.01
2022-01-26 14:17:54.429 | DEBUG    | __main__:trials:24 - Trial = 18227/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.430 | DEBUG    | __main__:trials:29 - Trial = 18227/30000 | Total reward = 50.13
2022-01-26 14:17:54.433 | DEBUG    | __main__:trials:24 - Trial = 18228/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.434 | DEBUG    | __main__:trials:29 - Trial = 18228/30000 | Total reward = 43.70
2022-01-26 14:17:54.437 | DEBUG    | __main__:trials:24 - Trial = 18229/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.439 | DEBUG    | __main__:trials:29 - Trial = 18229/30000 | Total reward = 53.23
2022-01-26 14:17:54.442 | DEBUG    | __main__:trials:24 - Trial = 18230/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.444 | DEBUG    | __main__:trials:29 - Trial = 18230/30000 | Total reward = 24.45
2022-01-26 14:17:54.447 | DEBUG    | __main__:trials:24 - Trial = 18231/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.449 | DEBUG    | __main__:trials:29 - Trial = 18231/30000 | Total reward = 37.93
2022-01-26 14:17:54.453 | DEBUG    | __main__:trials:24 - Trial = 18232/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.453 | DEBUG    | __main__:trials:29 - Trial = 18232/30000 | Total reward = 30.12
2022-01-26 14:17:54.458 | DEBUG    | __main__:trials:24 - Trial = 18233/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.458 | DEBUG    | __main__:trials:29 - Trial = 18233/30000 | Total reward = 34.71
2022-01-26 14:17:54.463 | DEBUG    | __main__:trials:24 - Trial = 18234/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.463 | DEBUG    | __main__:trials:29 - Trial = 18234/30000 | Total reward = 41.50
2022-01-26 14:17:54.467 | DEBUG    | __main__:trials:24 - Trial = 18235/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.468 | DEBUG    | __main__:trials:29 - Trial = 18235/30000 | Total reward = 38.22
2022-01-26 14:17:54.472 | DEBUG    | __main__:trials:24 - Trial = 18236/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.473 | DEBUG    | __main__:trials:29 - Trial = 18236/30000 | Total reward = 26.60
2022-01-26 14:17:54.477 | DEBUG    | __main__:trials:26 - Trial = 18237/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.478 | DEBUG    | __main__:trials:29 - Trial = 18237/30000 | Total reward = 29.04
2022-01-26 14:17:54.482 | DEBUG    | __main__:trials:24 - Trial = 18238/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.483 | DEBUG    | __main__:trials:29 - Trial = 18238/30000 | Total reward = 40.52
2022-01-26 14:17:54.487 | DEBUG    | __main__:trials:24 - Trial = 18239/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.488 | DEBUG    | __main__:trials:29 - Trial = 18239/30000 | Total reward = 50.26
2022-01-26 14:17:54.491 | DEBUG    | __main__:trials:24 - Trial = 18240/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.492 | DEBUG    | __main__:trials:29 - Trial = 18240/30000 | Total reward = 38.74
2022-01-26 14:17:54.496 | DEBUG    | __main__:trials:24 - Trial = 18241/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.497 | DEBUG    | __main__:trials:29 - Trial = 18241/30000 | Total reward = 42.42
2022-01-26 14:17:54.502 | DEBUG    | __main__:trials:24 - Trial = 18242/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.502 | DEBUG    | __main__:trials:29 - Trial = 18242/30000 | Total reward = 54.61
2022-01-26 14:17:54.507 | DEBUG    | __main__:trials:24 - Trial = 18243/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.508 | DEBUG    | __main__:trials:29 - Trial = 18243/30000 | Total reward = 37.23
2022-01-26 14:17:54.512 | DEBUG    | __main__:trials:24 - Trial = 18244/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.514 | DEBUG    | __main__:trials:29 - Trial = 18244/30000 | Total reward = 35.76
2022-01-26 14:17:54.517 | DEBUG    | __main__:trials:24 - Trial = 18245/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.519 | DEBUG    | __main__:trials:29 - Trial = 18245/30000 | Total reward = 33.34
2022-01-26 14:17:54.522 | DEBUG    | __main__:trials:26 - Trial = 18246/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.524 | DEBUG    | __main__:trials:29 - Trial = 18246/30000 | Total reward = 28.72
2022-01-26 14:17:54.528 | DEBUG    | __main__:trials:24 - Trial = 18247/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.529 | DEBUG    | __main__:trials:29 - Trial = 18247/30000 | Total reward = 37.93
2022-01-26 14:17:54.533 | DEBUG    | __main__:trials:24 - Trial = 18248/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.535 | DEBUG    | __main__:trials:29 - Trial = 18248/30000 | Total reward = 47.13
2022-01-26 14:17:54.537 | DEBUG    | __main__:trials:26 - Trial = 18249/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.538 | DEBUG    | __main__:trials:29 - Trial = 18249/30000 | Total reward = 25.98
2022-01-26 14:17:54.541 | DEBUG    | __main__:trials:24 - Trial = 18250/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.543 | DEBUG    | __main__:trials:29 - Trial = 18250/30000 | Total reward = 37.93
2022-01-26 14:17:54.545 | DEBUG    | __main__:trials:26 - Trial = 18251/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.547 | DEBUG    | __main__:trials:29 - Trial = 18251/30000 | Total reward = 12.17
2022-01-26 14:17:54.549 | DEBUG    | __main__:trials:26 - Trial = 18252/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.550 | DEBUG    | __main__:trials:29 - Trial = 18252/30000 | Total reward = 13.05
2022-01-26 14:17:54.553 | DEBUG    | __main__:trials:24 - Trial = 18253/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.554 | DEBUG    | __main__:trials:29 - Trial = 18253/30000 | Total reward = 37.31
2022-01-26 14:17:54.557 | DEBUG    | __main__:trials:24 - Trial = 18254/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.558 | DEBUG    | __main__:trials:29 - Trial = 18254/30000 | Total reward = 36.85
2022-01-26 14:17:54.560 | DEBUG    | __main__:trials:26 - Trial = 18255/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.562 | DEBUG    | __main__:trials:29 - Trial = 18255/30000 | Total reward = 17.99
2022-01-26 14:17:54.566 | DEBUG    | __main__:trials:24 - Trial = 18256/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.567 | DEBUG    | __main__:trials:29 - Trial = 18256/30000 | Total reward = 32.27
2022-01-26 14:17:54.571 | DEBUG    | __main__:trials:24 - Trial = 18257/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.573 | DEBUG    | __main__:trials:29 - Trial = 18257/30000 | Total reward = 43.06
2022-01-26 14:17:54.576 | DEBUG    | __main__:trials:24 - Trial = 18258/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.578 | DEBUG    | __main__:trials:29 - Trial = 18258/30000 | Total reward = 50.73
2022-01-26 14:17:54.581 | DEBUG    | __main__:trials:24 - Trial = 18259/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.582 | DEBUG    | __main__:trials:29 - Trial = 18259/30000 | Total reward = 53.63
2022-01-26 14:17:54.585 | DEBUG    | __main__:trials:26 - Trial = 18260/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.586 | DEBUG    | __main__:trials:29 - Trial = 18260/30000 | Total reward = 23.58
2022-01-26 14:17:54.590 | DEBUG    | __main__:trials:26 - Trial = 18261/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.592 | DEBUG    | __main__:trials:29 - Trial = 18261/30000 | Total reward = 19.69
2022-01-26 14:17:54.595 | DEBUG    | __main__:trials:24 - Trial = 18262/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.597 | DEBUG    | __main__:trials:29 - Trial = 18262/30000 | Total reward = 33.61
2022-01-26 14:17:54.600 | DEBUG    | __main__:trials:24 - Trial = 18263/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.602 | DEBUG    | __main__:trials:29 - Trial = 18263/30000 | Total reward = 33.46
2022-01-26 14:17:54.605 | DEBUG    | __main__:trials:24 - Trial = 18264/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.606 | DEBUG    | __main__:trials:29 - Trial = 18264/30000 | Total reward = 34.63
2022-01-26 14:17:54.608 | DEBUG    | __main__:trials:26 - Trial = 18265/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.609 | DEBUG    | __main__:trials:29 - Trial = 18265/30000 | Total reward = 11.53
2022-01-26 14:17:54.613 | DEBUG    | __main__:trials:24 - Trial = 18266/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.613 | DEBUG    | __main__:trials:29 - Trial = 18266/30000 | Total reward = 33.08
2022-01-26 14:17:54.616 | DEBUG    | __main__:trials:26 - Trial = 18267/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.618 | DEBUG    | __main__:trials:29 - Trial = 18267/30000 | Total reward = 24.49
2022-01-26 14:17:54.620 | DEBUG    | __main__:trials:26 - Trial = 18268/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.622 | DEBUG    | __main__:trials:29 - Trial = 18268/30000 | Total reward = 12.21
2022-01-26 14:17:54.625 | DEBUG    | __main__:trials:24 - Trial = 18269/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.626 | DEBUG    | __main__:trials:29 - Trial = 18269/30000 | Total reward = 34.41
2022-01-26 14:17:54.631 | DEBUG    | __main__:trials:24 - Trial = 18270/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.632 | DEBUG    | __main__:trials:29 - Trial = 18270/30000 | Total reward = 29.89
2022-01-26 14:17:54.636 | DEBUG    | __main__:trials:24 - Trial = 18271/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.637 | DEBUG    | __main__:trials:29 - Trial = 18271/30000 | Total reward = 32.70
2022-01-26 14:17:54.641 | DEBUG    | __main__:trials:24 - Trial = 18272/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.641 | DEBUG    | __main__:trials:29 - Trial = 18272/30000 | Total reward = 33.12
2022-01-26 14:17:54.646 | DEBUG    | __main__:trials:24 - Trial = 18273/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.647 | DEBUG    | __main__:trials:29 - Trial = 18273/30000 | Total reward = 33.08
2022-01-26 14:17:54.651 | DEBUG    | __main__:trials:24 - Trial = 18274/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.653 | DEBUG    | __main__:trials:29 - Trial = 18274/30000 | Total reward = 34.07
2022-01-26 14:17:54.656 | DEBUG    | __main__:trials:24 - Trial = 18275/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.657 | DEBUG    | __main__:trials:29 - Trial = 18275/30000 | Total reward = 35.27
2022-01-26 14:17:54.662 | DEBUG    | __main__:trials:24 - Trial = 18276/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.663 | DEBUG    | __main__:trials:29 - Trial = 18276/30000 | Total reward = 46.91
2022-01-26 14:17:54.667 | DEBUG    | __main__:trials:24 - Trial = 18277/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.668 | DEBUG    | __main__:trials:29 - Trial = 18277/30000 | Total reward = 33.17
2022-01-26 14:17:54.672 | DEBUG    | __main__:trials:24 - Trial = 18278/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.673 | DEBUG    | __main__:trials:29 - Trial = 18278/30000 | Total reward = 39.19
2022-01-26 14:17:54.677 | DEBUG    | __main__:trials:24 - Trial = 18279/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.678 | DEBUG    | __main__:trials:29 - Trial = 18279/30000 | Total reward = 40.95
2022-01-26 14:17:54.682 | DEBUG    | __main__:trials:24 - Trial = 18280/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.684 | DEBUG    | __main__:trials:29 - Trial = 18280/30000 | Total reward = 52.03
2022-01-26 14:17:54.688 | DEBUG    | __main__:trials:24 - Trial = 18281/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.689 | DEBUG    | __main__:trials:29 - Trial = 18281/30000 | Total reward = 39.23
2022-01-26 14:17:54.693 | DEBUG    | __main__:trials:24 - Trial = 18282/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.694 | DEBUG    | __main__:trials:29 - Trial = 18282/30000 | Total reward = 36.63
2022-01-26 14:17:54.697 | DEBUG    | __main__:trials:24 - Trial = 18283/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.698 | DEBUG    | __main__:trials:29 - Trial = 18283/30000 | Total reward = 38.65
2022-01-26 14:17:54.701 | DEBUG    | __main__:trials:24 - Trial = 18284/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.702 | DEBUG    | __main__:trials:29 - Trial = 18284/30000 | Total reward = 55.34
2022-01-26 14:17:54.705 | DEBUG    | __main__:trials:26 - Trial = 18285/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.706 | DEBUG    | __main__:trials:29 - Trial = 18285/30000 | Total reward = 19.69
2022-01-26 14:17:54.709 | DEBUG    | __main__:trials:24 - Trial = 18286/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.711 | DEBUG    | __main__:trials:29 - Trial = 18286/30000 | Total reward = 33.00
2022-01-26 14:17:54.714 | DEBUG    | __main__:trials:24 - Trial = 18287/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.715 | DEBUG    | __main__:trials:29 - Trial = 18287/30000 | Total reward = 18.18
2022-01-26 14:17:54.719 | DEBUG    | __main__:trials:24 - Trial = 18288/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.720 | DEBUG    | __main__:trials:29 - Trial = 18288/30000 | Total reward = 34.29
2022-01-26 14:17:54.724 | DEBUG    | __main__:trials:24 - Trial = 18289/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.725 | DEBUG    | __main__:trials:29 - Trial = 18289/30000 | Total reward = 34.40
2022-01-26 14:17:54.728 | DEBUG    | __main__:trials:26 - Trial = 18290/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.730 | DEBUG    | __main__:trials:29 - Trial = 18290/30000 | Total reward = 8.99
2022-01-26 14:17:54.733 | DEBUG    | __main__:trials:24 - Trial = 18291/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.735 | DEBUG    | __main__:trials:29 - Trial = 18291/30000 | Total reward = 27.73
2022-01-26 14:17:54.738 | DEBUG    | __main__:trials:24 - Trial = 18292/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.740 | DEBUG    | __main__:trials:29 - Trial = 18292/30000 | Total reward = 32.58
2022-01-26 14:17:54.743 | DEBUG    | __main__:trials:24 - Trial = 18293/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.745 | DEBUG    | __main__:trials:29 - Trial = 18293/30000 | Total reward = 45.73
2022-01-26 14:17:54.747 | DEBUG    | __main__:trials:26 - Trial = 18294/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.748 | DEBUG    | __main__:trials:29 - Trial = 18294/30000 | Total reward = 9.99
2022-01-26 14:17:54.751 | DEBUG    | __main__:trials:26 - Trial = 18295/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.752 | DEBUG    | __main__:trials:29 - Trial = 18295/30000 | Total reward = 19.78
2022-01-26 14:17:54.755 | DEBUG    | __main__:trials:24 - Trial = 18296/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.757 | DEBUG    | __main__:trials:29 - Trial = 18296/30000 | Total reward = 40.32
2022-01-26 14:17:54.760 | DEBUG    | __main__:trials:24 - Trial = 18297/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.762 | DEBUG    | __main__:trials:29 - Trial = 18297/30000 | Total reward = 47.79
2022-01-26 14:17:54.766 | DEBUG    | __main__:trials:24 - Trial = 18298/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.766 | DEBUG    | __main__:trials:29 - Trial = 18298/30000 | Total reward = 39.16
2022-01-26 14:17:54.770 | DEBUG    | __main__:trials:26 - Trial = 18299/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.772 | DEBUG    | __main__:trials:29 - Trial = 18299/30000 | Total reward = 30.95
2022-01-26 14:17:54.775 | DEBUG    | __main__:trials:24 - Trial = 18300/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.776 | DEBUG    | __main__:trials:29 - Trial = 18300/30000 | Total reward = 54.30
2022-01-26 14:17:54.781 | DEBUG    | __main__:trials:24 - Trial = 18301/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.781 | DEBUG    | __main__:trials:29 - Trial = 18301/30000 | Total reward = 57.83
2022-01-26 14:17:54.784 | DEBUG    | __main__:trials:26 - Trial = 18302/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.784 | DEBUG    | __main__:trials:29 - Trial = 18302/30000 | Total reward = 19.69
2022-01-26 14:17:54.788 | DEBUG    | __main__:trials:24 - Trial = 18303/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.789 | DEBUG    | __main__:trials:29 - Trial = 18303/30000 | Total reward = 38.19
2022-01-26 14:17:54.792 | DEBUG    | __main__:trials:26 - Trial = 18304/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.794 | DEBUG    | __main__:trials:29 - Trial = 18304/30000 | Total reward = 15.26
2022-01-26 14:17:54.798 | DEBUG    | __main__:trials:24 - Trial = 18305/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.798 | DEBUG    | __main__:trials:29 - Trial = 18305/30000 | Total reward = 31.06
2022-01-26 14:17:54.802 | DEBUG    | __main__:trials:24 - Trial = 18306/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.804 | DEBUG    | __main__:trials:29 - Trial = 18306/30000 | Total reward = 31.91
2022-01-26 14:17:54.807 | DEBUG    | __main__:trials:24 - Trial = 18307/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.808 | DEBUG    | __main__:trials:29 - Trial = 18307/30000 | Total reward = 36.71
2022-01-26 14:17:54.812 | DEBUG    | __main__:trials:24 - Trial = 18308/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.814 | DEBUG    | __main__:trials:29 - Trial = 18308/30000 | Total reward = 35.47
2022-01-26 14:17:54.819 | DEBUG    | __main__:trials:24 - Trial = 18309/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.820 | DEBUG    | __main__:trials:29 - Trial = 18309/30000 | Total reward = 35.27
2022-01-26 14:17:54.824 | DEBUG    | __main__:trials:24 - Trial = 18310/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.826 | DEBUG    | __main__:trials:29 - Trial = 18310/30000 | Total reward = 33.53
2022-01-26 14:17:54.830 | DEBUG    | __main__:trials:24 - Trial = 18311/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.831 | DEBUG    | __main__:trials:29 - Trial = 18311/30000 | Total reward = 39.38
2022-01-26 14:17:54.835 | DEBUG    | __main__:trials:24 - Trial = 18312/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.836 | DEBUG    | __main__:trials:29 - Trial = 18312/30000 | Total reward = 33.40
2022-01-26 14:17:54.840 | DEBUG    | __main__:trials:24 - Trial = 18313/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.841 | DEBUG    | __main__:trials:29 - Trial = 18313/30000 | Total reward = 40.29
2022-01-26 14:17:54.845 | DEBUG    | __main__:trials:24 - Trial = 18314/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.846 | DEBUG    | __main__:trials:29 - Trial = 18314/30000 | Total reward = 37.24
2022-01-26 14:17:54.850 | DEBUG    | __main__:trials:24 - Trial = 18315/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.852 | DEBUG    | __main__:trials:29 - Trial = 18315/30000 | Total reward = 41.77
2022-01-26 14:17:54.854 | DEBUG    | __main__:trials:26 - Trial = 18316/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:54.856 | DEBUG    | __main__:trials:29 - Trial = 18316/30000 | Total reward = 17.33
2022-01-26 14:17:54.859 | DEBUG    | __main__:trials:24 - Trial = 18317/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.861 | DEBUG    | __main__:trials:29 - Trial = 18317/30000 | Total reward = 24.31
2022-01-26 14:17:54.864 | DEBUG    | __main__:trials:24 - Trial = 18318/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.866 | DEBUG    | __main__:trials:29 - Trial = 18318/30000 | Total reward = 37.51
2022-01-26 14:17:54.870 | DEBUG    | __main__:trials:24 - Trial = 18319/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.870 | DEBUG    | __main__:trials:29 - Trial = 18319/30000 | Total reward = 41.99
2022-01-26 14:17:54.874 | DEBUG    | __main__:trials:24 - Trial = 18320/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.875 | DEBUG    | __main__:trials:29 - Trial = 18320/30000 | Total reward = 36.53
2022-01-26 14:17:54.880 | DEBUG    | __main__:trials:24 - Trial = 18321/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.881 | DEBUG    | __main__:trials:29 - Trial = 18321/30000 | Total reward = 44.87
2022-01-26 14:17:54.885 | DEBUG    | __main__:trials:24 - Trial = 18322/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.887 | DEBUG    | __main__:trials:29 - Trial = 18322/30000 | Total reward = 37.56
2022-01-26 14:17:54.890 | DEBUG    | __main__:trials:24 - Trial = 18323/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.892 | DEBUG    | __main__:trials:29 - Trial = 18323/30000 | Total reward = 56.91
2022-01-26 14:17:54.896 | DEBUG    | __main__:trials:24 - Trial = 18324/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.897 | DEBUG    | __main__:trials:29 - Trial = 18324/30000 | Total reward = 40.25
2022-01-26 14:17:54.901 | DEBUG    | __main__:trials:24 - Trial = 18325/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.902 | DEBUG    | __main__:trials:29 - Trial = 18325/30000 | Total reward = 38.07
2022-01-26 14:17:54.906 | DEBUG    | __main__:trials:24 - Trial = 18326/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.908 | DEBUG    | __main__:trials:29 - Trial = 18326/30000 | Total reward = 36.16
2022-01-26 14:17:54.912 | DEBUG    | __main__:trials:24 - Trial = 18327/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.913 | DEBUG    | __main__:trials:29 - Trial = 18327/30000 | Total reward = 49.89
2022-01-26 14:17:54.916 | DEBUG    | __main__:trials:24 - Trial = 18328/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.918 | DEBUG    | __main__:trials:29 - Trial = 18328/30000 | Total reward = 41.02
2022-01-26 14:17:54.922 | DEBUG    | __main__:trials:24 - Trial = 18329/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.923 | DEBUG    | __main__:trials:29 - Trial = 18329/30000 | Total reward = 35.13
2022-01-26 14:17:54.927 | DEBUG    | __main__:trials:24 - Trial = 18330/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.928 | DEBUG    | __main__:trials:29 - Trial = 18330/30000 | Total reward = 41.64
2022-01-26 14:17:54.932 | DEBUG    | __main__:trials:24 - Trial = 18331/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.933 | DEBUG    | __main__:trials:29 - Trial = 18331/30000 | Total reward = 40.25
2022-01-26 14:17:54.937 | DEBUG    | __main__:trials:24 - Trial = 18332/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.939 | DEBUG    | __main__:trials:29 - Trial = 18332/30000 | Total reward = 39.58
2022-01-26 14:17:54.942 | DEBUG    | __main__:trials:24 - Trial = 18333/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.943 | DEBUG    | __main__:trials:29 - Trial = 18333/30000 | Total reward = 43.85
2022-01-26 14:17:54.947 | DEBUG    | __main__:trials:24 - Trial = 18334/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.949 | DEBUG    | __main__:trials:29 - Trial = 18334/30000 | Total reward = 33.29
2022-01-26 14:17:54.952 | DEBUG    | __main__:trials:24 - Trial = 18335/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.953 | DEBUG    | __main__:trials:29 - Trial = 18335/30000 | Total reward = 40.25
2022-01-26 14:17:54.958 | DEBUG    | __main__:trials:24 - Trial = 18336/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.959 | DEBUG    | __main__:trials:29 - Trial = 18336/30000 | Total reward = 40.77
2022-01-26 14:17:54.962 | DEBUG    | __main__:trials:24 - Trial = 18337/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.964 | DEBUG    | __main__:trials:29 - Trial = 18337/30000 | Total reward = 32.70
2022-01-26 14:17:54.967 | DEBUG    | __main__:trials:24 - Trial = 18338/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.969 | DEBUG    | __main__:trials:29 - Trial = 18338/30000 | Total reward = 44.51
2022-01-26 14:17:54.972 | DEBUG    | __main__:trials:24 - Trial = 18339/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.974 | DEBUG    | __main__:trials:29 - Trial = 18339/30000 | Total reward = 36.21
2022-01-26 14:17:54.978 | DEBUG    | __main__:trials:24 - Trial = 18340/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.978 | DEBUG    | __main__:trials:29 - Trial = 18340/30000 | Total reward = 34.44
2022-01-26 14:17:54.983 | DEBUG    | __main__:trials:24 - Trial = 18341/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.984 | DEBUG    | __main__:trials:29 - Trial = 18341/30000 | Total reward = 46.20
2022-01-26 14:17:54.988 | DEBUG    | __main__:trials:24 - Trial = 18342/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.989 | DEBUG    | __main__:trials:29 - Trial = 18342/30000 | Total reward = 43.18
2022-01-26 14:17:54.993 | DEBUG    | __main__:trials:24 - Trial = 18343/30000 | Max number of steps (20) reached
2022-01-26 14:17:54.995 | DEBUG    | __main__:trials:29 - Trial = 18343/30000 | Total reward = 37.75
2022-01-26 14:17:54.999 | DEBUG    | __main__:trials:24 - Trial = 18344/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.000 | DEBUG    | __main__:trials:29 - Trial = 18344/30000 | Total reward = 34.98
2022-01-26 14:17:55.004 | DEBUG    | __main__:trials:24 - Trial = 18345/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.005 | DEBUG    | __main__:trials:29 - Trial = 18345/30000 | Total reward = 55.17
2022-01-26 14:17:55.009 | DEBUG    | __main__:trials:24 - Trial = 18346/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.011 | DEBUG    | __main__:trials:29 - Trial = 18346/30000 | Total reward = 37.46
2022-01-26 14:17:55.014 | DEBUG    | __main__:trials:24 - Trial = 18347/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.016 | DEBUG    | __main__:trials:29 - Trial = 18347/30000 | Total reward = 45.85
2022-01-26 14:17:55.019 | DEBUG    | __main__:trials:24 - Trial = 18348/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.021 | DEBUG    | __main__:trials:29 - Trial = 18348/30000 | Total reward = 43.18
2022-01-26 14:17:55.024 | DEBUG    | __main__:trials:24 - Trial = 18349/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.026 | DEBUG    | __main__:trials:29 - Trial = 18349/30000 | Total reward = 37.87
2022-01-26 14:17:55.030 | DEBUG    | __main__:trials:24 - Trial = 18350/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.031 | DEBUG    | __main__:trials:29 - Trial = 18350/30000 | Total reward = 38.55
2022-01-26 14:17:55.035 | DEBUG    | __main__:trials:24 - Trial = 18351/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.037 | DEBUG    | __main__:trials:29 - Trial = 18351/30000 | Total reward = 37.73
2022-01-26 14:17:55.040 | DEBUG    | __main__:trials:26 - Trial = 18352/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.041 | DEBUG    | __main__:trials:29 - Trial = 18352/30000 | Total reward = 24.10
2022-01-26 14:17:55.045 | DEBUG    | __main__:trials:24 - Trial = 18353/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.046 | DEBUG    | __main__:trials:29 - Trial = 18353/30000 | Total reward = 33.20
2022-01-26 14:17:55.050 | DEBUG    | __main__:trials:24 - Trial = 18354/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.052 | DEBUG    | __main__:trials:29 - Trial = 18354/30000 | Total reward = 34.29
2022-01-26 14:17:55.055 | DEBUG    | __main__:trials:24 - Trial = 18355/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.056 | DEBUG    | __main__:trials:29 - Trial = 18355/30000 | Total reward = 39.86
2022-01-26 14:17:55.060 | DEBUG    | __main__:trials:26 - Trial = 18356/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.061 | DEBUG    | __main__:trials:29 - Trial = 18356/30000 | Total reward = 26.47
2022-01-26 14:17:55.065 | DEBUG    | __main__:trials:24 - Trial = 18357/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.066 | DEBUG    | __main__:trials:29 - Trial = 18357/30000 | Total reward = 32.04
2022-01-26 14:17:55.070 | DEBUG    | __main__:trials:24 - Trial = 18358/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.070 | DEBUG    | __main__:trials:29 - Trial = 18358/30000 | Total reward = 41.34
2022-01-26 14:17:55.075 | DEBUG    | __main__:trials:24 - Trial = 18359/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.077 | DEBUG    | __main__:trials:29 - Trial = 18359/30000 | Total reward = 30.11
2022-01-26 14:17:55.080 | DEBUG    | __main__:trials:24 - Trial = 18360/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.082 | DEBUG    | __main__:trials:29 - Trial = 18360/30000 | Total reward = 37.50
2022-01-26 14:17:55.086 | DEBUG    | __main__:trials:24 - Trial = 18361/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.086 | DEBUG    | __main__:trials:29 - Trial = 18361/30000 | Total reward = 63.51
2022-01-26 14:17:55.090 | DEBUG    | __main__:trials:26 - Trial = 18362/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.091 | DEBUG    | __main__:trials:29 - Trial = 18362/30000 | Total reward = 25.12
2022-01-26 14:17:55.096 | DEBUG    | __main__:trials:24 - Trial = 18363/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.096 | DEBUG    | __main__:trials:29 - Trial = 18363/30000 | Total reward = 37.67
2022-01-26 14:17:55.100 | DEBUG    | __main__:trials:24 - Trial = 18364/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.102 | DEBUG    | __main__:trials:29 - Trial = 18364/30000 | Total reward = 39.04
2022-01-26 14:17:55.106 | DEBUG    | __main__:trials:24 - Trial = 18365/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.106 | DEBUG    | __main__:trials:29 - Trial = 18365/30000 | Total reward = 41.21
2022-01-26 14:17:55.111 | DEBUG    | __main__:trials:24 - Trial = 18366/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.112 | DEBUG    | __main__:trials:29 - Trial = 18366/30000 | Total reward = 42.19
2022-01-26 14:17:55.115 | DEBUG    | __main__:trials:26 - Trial = 18367/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.117 | DEBUG    | __main__:trials:29 - Trial = 18367/30000 | Total reward = 19.73
2022-01-26 14:17:55.120 | DEBUG    | __main__:trials:24 - Trial = 18368/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.122 | DEBUG    | __main__:trials:29 - Trial = 18368/30000 | Total reward = 41.69
2022-01-26 14:17:55.125 | DEBUG    | __main__:trials:24 - Trial = 18369/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.126 | DEBUG    | __main__:trials:29 - Trial = 18369/30000 | Total reward = 36.83
2022-01-26 14:17:55.129 | DEBUG    | __main__:trials:24 - Trial = 18370/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.131 | DEBUG    | __main__:trials:29 - Trial = 18370/30000 | Total reward = 40.93
2022-01-26 14:17:55.134 | DEBUG    | __main__:trials:24 - Trial = 18371/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.135 | DEBUG    | __main__:trials:29 - Trial = 18371/30000 | Total reward = 43.78
2022-01-26 14:17:55.139 | DEBUG    | __main__:trials:24 - Trial = 18372/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.140 | DEBUG    | __main__:trials:29 - Trial = 18372/30000 | Total reward = 36.89
2022-01-26 14:17:55.144 | DEBUG    | __main__:trials:24 - Trial = 18373/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.146 | DEBUG    | __main__:trials:29 - Trial = 18373/30000 | Total reward = 38.15
2022-01-26 14:17:55.150 | DEBUG    | __main__:trials:24 - Trial = 18374/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.151 | DEBUG    | __main__:trials:29 - Trial = 18374/30000 | Total reward = 42.45
2022-01-26 14:17:55.155 | DEBUG    | __main__:trials:24 - Trial = 18375/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.156 | DEBUG    | __main__:trials:29 - Trial = 18375/30000 | Total reward = 40.15
2022-01-26 14:17:55.160 | DEBUG    | __main__:trials:24 - Trial = 18376/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.161 | DEBUG    | __main__:trials:29 - Trial = 18376/30000 | Total reward = 34.94
2022-01-26 14:17:55.165 | DEBUG    | __main__:trials:24 - Trial = 18377/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.166 | DEBUG    | __main__:trials:29 - Trial = 18377/30000 | Total reward = 43.03
2022-01-26 14:17:55.170 | DEBUG    | __main__:trials:24 - Trial = 18378/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.172 | DEBUG    | __main__:trials:29 - Trial = 18378/30000 | Total reward = 47.80
2022-01-26 14:17:55.175 | DEBUG    | __main__:trials:24 - Trial = 18379/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.176 | DEBUG    | __main__:trials:29 - Trial = 18379/30000 | Total reward = 48.76
2022-01-26 14:17:55.180 | DEBUG    | __main__:trials:24 - Trial = 18380/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.181 | DEBUG    | __main__:trials:29 - Trial = 18380/30000 | Total reward = 41.96
2022-01-26 14:17:55.186 | DEBUG    | __main__:trials:24 - Trial = 18381/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.187 | DEBUG    | __main__:trials:29 - Trial = 18381/30000 | Total reward = 32.07
2022-01-26 14:17:55.191 | DEBUG    | __main__:trials:24 - Trial = 18382/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.192 | DEBUG    | __main__:trials:29 - Trial = 18382/30000 | Total reward = 43.11
2022-01-26 14:17:55.196 | DEBUG    | __main__:trials:24 - Trial = 18383/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.197 | DEBUG    | __main__:trials:29 - Trial = 18383/30000 | Total reward = 44.39
2022-01-26 14:17:55.201 | DEBUG    | __main__:trials:24 - Trial = 18384/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.203 | DEBUG    | __main__:trials:29 - Trial = 18384/30000 | Total reward = 47.15
2022-01-26 14:17:55.205 | DEBUG    | __main__:trials:24 - Trial = 18385/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.207 | DEBUG    | __main__:trials:29 - Trial = 18385/30000 | Total reward = 43.32
2022-01-26 14:17:55.211 | DEBUG    | __main__:trials:24 - Trial = 18386/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.213 | DEBUG    | __main__:trials:29 - Trial = 18386/30000 | Total reward = 46.93
2022-01-26 14:17:55.216 | DEBUG    | __main__:trials:24 - Trial = 18387/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.218 | DEBUG    | __main__:trials:29 - Trial = 18387/30000 | Total reward = 54.50
2022-01-26 14:17:55.222 | DEBUG    | __main__:trials:24 - Trial = 18388/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.223 | DEBUG    | __main__:trials:29 - Trial = 18388/30000 | Total reward = 39.25
2022-01-26 14:17:55.227 | DEBUG    | __main__:trials:24 - Trial = 18389/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.228 | DEBUG    | __main__:trials:29 - Trial = 18389/30000 | Total reward = 59.70
2022-01-26 14:17:55.232 | DEBUG    | __main__:trials:24 - Trial = 18390/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.234 | DEBUG    | __main__:trials:29 - Trial = 18390/30000 | Total reward = 33.24
2022-01-26 14:17:55.238 | DEBUG    | __main__:trials:24 - Trial = 18391/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.239 | DEBUG    | __main__:trials:29 - Trial = 18391/30000 | Total reward = 28.74
2022-01-26 14:17:55.242 | DEBUG    | __main__:trials:24 - Trial = 18392/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.244 | DEBUG    | __main__:trials:29 - Trial = 18392/30000 | Total reward = 23.61
2022-01-26 14:17:55.246 | DEBUG    | __main__:trials:26 - Trial = 18393/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.248 | DEBUG    | __main__:trials:29 - Trial = 18393/30000 | Total reward = 19.69
2022-01-26 14:17:55.252 | DEBUG    | __main__:trials:24 - Trial = 18394/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.253 | DEBUG    | __main__:trials:29 - Trial = 18394/30000 | Total reward = 37.61
2022-01-26 14:17:55.255 | DEBUG    | __main__:trials:26 - Trial = 18395/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.257 | DEBUG    | __main__:trials:29 - Trial = 18395/30000 | Total reward = 22.62
2022-01-26 14:17:55.261 | DEBUG    | __main__:trials:24 - Trial = 18396/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.262 | DEBUG    | __main__:trials:29 - Trial = 18396/30000 | Total reward = 33.03
2022-01-26 14:17:55.266 | DEBUG    | __main__:trials:26 - Trial = 18397/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.267 | DEBUG    | __main__:trials:29 - Trial = 18397/30000 | Total reward = 30.53
2022-01-26 14:17:55.270 | DEBUG    | __main__:trials:24 - Trial = 18398/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.272 | DEBUG    | __main__:trials:29 - Trial = 18398/30000 | Total reward = 51.04
2022-01-26 14:17:55.275 | DEBUG    | __main__:trials:24 - Trial = 18399/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.277 | DEBUG    | __main__:trials:29 - Trial = 18399/30000 | Total reward = 30.02
2022-01-26 14:17:55.280 | DEBUG    | __main__:trials:26 - Trial = 18400/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.282 | DEBUG    | __main__:trials:29 - Trial = 18400/30000 | Total reward = 21.24
2022-01-26 14:17:55.286 | DEBUG    | __main__:trials:24 - Trial = 18401/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.287 | DEBUG    | __main__:trials:29 - Trial = 18401/30000 | Total reward = 32.28
2022-01-26 14:17:55.291 | DEBUG    | __main__:trials:26 - Trial = 18402/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.292 | DEBUG    | __main__:trials:29 - Trial = 18402/30000 | Total reward = 15.17
2022-01-26 14:17:55.296 | DEBUG    | __main__:trials:26 - Trial = 18403/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.297 | DEBUG    | __main__:trials:29 - Trial = 18403/30000 | Total reward = 22.36
2022-01-26 14:17:55.301 | DEBUG    | __main__:trials:24 - Trial = 18404/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.302 | DEBUG    | __main__:trials:29 - Trial = 18404/30000 | Total reward = 27.31
2022-01-26 14:17:55.305 | DEBUG    | __main__:trials:24 - Trial = 18405/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.306 | DEBUG    | __main__:trials:29 - Trial = 18405/30000 | Total reward = 27.86
2022-01-26 14:17:55.309 | DEBUG    | __main__:trials:26 - Trial = 18406/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.310 | DEBUG    | __main__:trials:29 - Trial = 18406/30000 | Total reward = 24.36
2022-01-26 14:17:55.313 | DEBUG    | __main__:trials:24 - Trial = 18407/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.314 | DEBUG    | __main__:trials:29 - Trial = 18407/30000 | Total reward = 38.07
2022-01-26 14:17:55.317 | DEBUG    | __main__:trials:24 - Trial = 18408/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.319 | DEBUG    | __main__:trials:29 - Trial = 18408/30000 | Total reward = 37.75
2022-01-26 14:17:55.323 | DEBUG    | __main__:trials:24 - Trial = 18409/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.325 | DEBUG    | __main__:trials:29 - Trial = 18409/30000 | Total reward = 40.26
2022-01-26 14:17:55.329 | DEBUG    | __main__:trials:24 - Trial = 18410/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.330 | DEBUG    | __main__:trials:29 - Trial = 18410/30000 | Total reward = 44.32
2022-01-26 14:17:55.334 | DEBUG    | __main__:trials:24 - Trial = 18411/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.336 | DEBUG    | __main__:trials:29 - Trial = 18411/30000 | Total reward = 34.34
2022-01-26 14:17:55.340 | DEBUG    | __main__:trials:24 - Trial = 18412/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.340 | DEBUG    | __main__:trials:29 - Trial = 18412/30000 | Total reward = 27.47
2022-01-26 14:17:55.344 | DEBUG    | __main__:trials:24 - Trial = 18413/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.345 | DEBUG    | __main__:trials:29 - Trial = 18413/30000 | Total reward = 39.54
2022-01-26 14:17:55.349 | DEBUG    | __main__:trials:26 - Trial = 18414/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.350 | DEBUG    | __main__:trials:29 - Trial = 18414/30000 | Total reward = 6.73
2022-01-26 14:17:55.355 | DEBUG    | __main__:trials:24 - Trial = 18415/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.356 | DEBUG    | __main__:trials:29 - Trial = 18415/30000 | Total reward = 30.70
2022-01-26 14:17:55.360 | DEBUG    | __main__:trials:24 - Trial = 18416/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.361 | DEBUG    | __main__:trials:29 - Trial = 18416/30000 | Total reward = 33.88
2022-01-26 14:17:55.366 | DEBUG    | __main__:trials:24 - Trial = 18417/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.366 | DEBUG    | __main__:trials:29 - Trial = 18417/30000 | Total reward = 33.70
2022-01-26 14:17:55.371 | DEBUG    | __main__:trials:26 - Trial = 18418/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.372 | DEBUG    | __main__:trials:29 - Trial = 18418/30000 | Total reward = 16.70
2022-01-26 14:17:55.376 | DEBUG    | __main__:trials:24 - Trial = 18419/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.377 | DEBUG    | __main__:trials:29 - Trial = 18419/30000 | Total reward = 40.02
2022-01-26 14:17:55.381 | DEBUG    | __main__:trials:24 - Trial = 18420/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.382 | DEBUG    | __main__:trials:29 - Trial = 18420/30000 | Total reward = 44.20
2022-01-26 14:17:55.386 | DEBUG    | __main__:trials:24 - Trial = 18421/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.387 | DEBUG    | __main__:trials:29 - Trial = 18421/30000 | Total reward = 34.99
2022-01-26 14:17:55.391 | DEBUG    | __main__:trials:24 - Trial = 18422/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.392 | DEBUG    | __main__:trials:29 - Trial = 18422/30000 | Total reward = 47.95
2022-01-26 14:17:55.395 | DEBUG    | __main__:trials:26 - Trial = 18423/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.397 | DEBUG    | __main__:trials:29 - Trial = 18423/30000 | Total reward = 17.99
2022-01-26 14:17:55.401 | DEBUG    | __main__:trials:26 - Trial = 18424/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.402 | DEBUG    | __main__:trials:29 - Trial = 18424/30000 | Total reward = 16.65
2022-01-26 14:17:55.406 | DEBUG    | __main__:trials:24 - Trial = 18425/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.407 | DEBUG    | __main__:trials:29 - Trial = 18425/30000 | Total reward = 49.49
2022-01-26 14:17:55.411 | DEBUG    | __main__:trials:24 - Trial = 18426/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.412 | DEBUG    | __main__:trials:29 - Trial = 18426/30000 | Total reward = 35.87
2022-01-26 14:17:55.415 | DEBUG    | __main__:trials:26 - Trial = 18427/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.416 | DEBUG    | __main__:trials:29 - Trial = 18427/30000 | Total reward = 12.21
2022-01-26 14:17:55.421 | DEBUG    | __main__:trials:24 - Trial = 18428/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.421 | DEBUG    | __main__:trials:29 - Trial = 18428/30000 | Total reward = 36.60
2022-01-26 14:17:55.425 | DEBUG    | __main__:trials:24 - Trial = 18429/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.428 | DEBUG    | __main__:trials:29 - Trial = 18429/30000 | Total reward = 33.51
2022-01-26 14:17:55.431 | DEBUG    | __main__:trials:24 - Trial = 18430/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.433 | DEBUG    | __main__:trials:29 - Trial = 18430/30000 | Total reward = 37.35
2022-01-26 14:17:55.436 | DEBUG    | __main__:trials:24 - Trial = 18431/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.438 | DEBUG    | __main__:trials:29 - Trial = 18431/30000 | Total reward = 52.19
2022-01-26 14:17:55.442 | DEBUG    | __main__:trials:24 - Trial = 18432/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.442 | DEBUG    | __main__:trials:29 - Trial = 18432/30000 | Total reward = 52.92
2022-01-26 14:17:55.446 | DEBUG    | __main__:trials:24 - Trial = 18433/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.448 | DEBUG    | __main__:trials:29 - Trial = 18433/30000 | Total reward = 31.76
2022-01-26 14:17:55.450 | DEBUG    | __main__:trials:26 - Trial = 18434/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.451 | DEBUG    | __main__:trials:29 - Trial = 18434/30000 | Total reward = 14.85
2022-01-26 14:17:55.454 | DEBUG    | __main__:trials:24 - Trial = 18435/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.456 | DEBUG    | __main__:trials:29 - Trial = 18435/30000 | Total reward = 35.08
2022-01-26 14:17:55.459 | DEBUG    | __main__:trials:24 - Trial = 18436/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.461 | DEBUG    | __main__:trials:29 - Trial = 18436/30000 | Total reward = 37.93
2022-01-26 14:17:55.463 | DEBUG    | __main__:trials:26 - Trial = 18437/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.465 | DEBUG    | __main__:trials:29 - Trial = 18437/30000 | Total reward = 19.38
2022-01-26 14:17:55.468 | DEBUG    | __main__:trials:24 - Trial = 18438/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.469 | DEBUG    | __main__:trials:29 - Trial = 18438/30000 | Total reward = 31.88
2022-01-26 14:17:55.473 | DEBUG    | __main__:trials:24 - Trial = 18439/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.474 | DEBUG    | __main__:trials:29 - Trial = 18439/30000 | Total reward = 38.49
2022-01-26 14:17:55.478 | DEBUG    | __main__:trials:26 - Trial = 18440/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.479 | DEBUG    | __main__:trials:29 - Trial = 18440/30000 | Total reward = 27.50
2022-01-26 14:17:55.483 | DEBUG    | __main__:trials:24 - Trial = 18441/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.484 | DEBUG    | __main__:trials:29 - Trial = 18441/30000 | Total reward = 50.23
2022-01-26 14:17:55.488 | DEBUG    | __main__:trials:24 - Trial = 18442/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.490 | DEBUG    | __main__:trials:29 - Trial = 18442/30000 | Total reward = 36.93
2022-01-26 14:17:55.493 | DEBUG    | __main__:trials:24 - Trial = 18443/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.494 | DEBUG    | __main__:trials:29 - Trial = 18443/30000 | Total reward = 34.79
2022-01-26 14:17:55.498 | DEBUG    | __main__:trials:24 - Trial = 18444/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.500 | DEBUG    | __main__:trials:29 - Trial = 18444/30000 | Total reward = 37.45
2022-01-26 14:17:55.503 | DEBUG    | __main__:trials:24 - Trial = 18445/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.505 | DEBUG    | __main__:trials:29 - Trial = 18445/30000 | Total reward = 32.67
2022-01-26 14:17:55.509 | DEBUG    | __main__:trials:24 - Trial = 18446/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.510 | DEBUG    | __main__:trials:29 - Trial = 18446/30000 | Total reward = 35.49
2022-01-26 14:17:55.514 | DEBUG    | __main__:trials:24 - Trial = 18447/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.516 | DEBUG    | __main__:trials:29 - Trial = 18447/30000 | Total reward = 11.95
2022-01-26 14:17:55.520 | DEBUG    | __main__:trials:24 - Trial = 18448/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.520 | DEBUG    | __main__:trials:29 - Trial = 18448/30000 | Total reward = 37.26
2022-01-26 14:17:55.524 | DEBUG    | __main__:trials:26 - Trial = 18449/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.525 | DEBUG    | __main__:trials:29 - Trial = 18449/30000 | Total reward = 16.86
2022-01-26 14:17:55.530 | DEBUG    | __main__:trials:24 - Trial = 18450/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.531 | DEBUG    | __main__:trials:29 - Trial = 18450/30000 | Total reward = 34.29
2022-01-26 14:17:55.536 | DEBUG    | __main__:trials:26 - Trial = 18451/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.537 | DEBUG    | __main__:trials:29 - Trial = 18451/30000 | Total reward = 30.91
2022-01-26 14:17:55.540 | DEBUG    | __main__:trials:26 - Trial = 18452/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.541 | DEBUG    | __main__:trials:29 - Trial = 18452/30000 | Total reward = 17.99
2022-01-26 14:17:55.546 | DEBUG    | __main__:trials:24 - Trial = 18453/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.546 | DEBUG    | __main__:trials:29 - Trial = 18453/30000 | Total reward = 39.80
2022-01-26 14:17:55.550 | DEBUG    | __main__:trials:24 - Trial = 18454/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.552 | DEBUG    | __main__:trials:29 - Trial = 18454/30000 | Total reward = 40.07
2022-01-26 14:17:55.556 | DEBUG    | __main__:trials:24 - Trial = 18455/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.556 | DEBUG    | __main__:trials:29 - Trial = 18455/30000 | Total reward = 34.79
2022-01-26 14:17:55.560 | DEBUG    | __main__:trials:26 - Trial = 18456/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.560 | DEBUG    | __main__:trials:29 - Trial = 18456/30000 | Total reward = 20.97
2022-01-26 14:17:55.564 | DEBUG    | __main__:trials:24 - Trial = 18457/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.565 | DEBUG    | __main__:trials:29 - Trial = 18457/30000 | Total reward = 30.29
2022-01-26 14:17:55.568 | DEBUG    | __main__:trials:24 - Trial = 18458/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.570 | DEBUG    | __main__:trials:29 - Trial = 18458/30000 | Total reward = 48.04
2022-01-26 14:17:55.574 | DEBUG    | __main__:trials:24 - Trial = 18459/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.574 | DEBUG    | __main__:trials:29 - Trial = 18459/30000 | Total reward = 30.09
2022-01-26 14:17:55.579 | DEBUG    | __main__:trials:24 - Trial = 18460/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.579 | DEBUG    | __main__:trials:29 - Trial = 18460/30000 | Total reward = 40.66
2022-01-26 14:17:55.584 | DEBUG    | __main__:trials:24 - Trial = 18461/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.585 | DEBUG    | __main__:trials:29 - Trial = 18461/30000 | Total reward = 39.87
2022-01-26 14:17:55.589 | DEBUG    | __main__:trials:24 - Trial = 18462/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.589 | DEBUG    | __main__:trials:29 - Trial = 18462/30000 | Total reward = 35.26
2022-01-26 14:17:55.593 | DEBUG    | __main__:trials:24 - Trial = 18463/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.594 | DEBUG    | __main__:trials:29 - Trial = 18463/30000 | Total reward = 46.82
2022-01-26 14:17:55.597 | DEBUG    | __main__:trials:26 - Trial = 18464/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.598 | DEBUG    | __main__:trials:29 - Trial = 18464/30000 | Total reward = 24.14
2022-01-26 14:17:55.602 | DEBUG    | __main__:trials:24 - Trial = 18465/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.603 | DEBUG    | __main__:trials:29 - Trial = 18465/30000 | Total reward = 47.92
2022-01-26 14:17:55.606 | DEBUG    | __main__:trials:26 - Trial = 18466/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.607 | DEBUG    | __main__:trials:29 - Trial = 18466/30000 | Total reward = 23.01
2022-01-26 14:17:55.611 | DEBUG    | __main__:trials:24 - Trial = 18467/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.613 | DEBUG    | __main__:trials:29 - Trial = 18467/30000 | Total reward = 27.44
2022-01-26 14:17:55.616 | DEBUG    | __main__:trials:24 - Trial = 18468/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.618 | DEBUG    | __main__:trials:29 - Trial = 18468/30000 | Total reward = 35.95
2022-01-26 14:17:55.621 | DEBUG    | __main__:trials:24 - Trial = 18469/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.622 | DEBUG    | __main__:trials:29 - Trial = 18469/30000 | Total reward = 40.85
2022-01-26 14:17:55.627 | DEBUG    | __main__:trials:24 - Trial = 18470/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.628 | DEBUG    | __main__:trials:29 - Trial = 18470/30000 | Total reward = 33.64
2022-01-26 14:17:55.632 | DEBUG    | __main__:trials:24 - Trial = 18471/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.633 | DEBUG    | __main__:trials:29 - Trial = 18471/30000 | Total reward = 37.25
2022-01-26 14:17:55.637 | DEBUG    | __main__:trials:24 - Trial = 18472/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.639 | DEBUG    | __main__:trials:29 - Trial = 18472/30000 | Total reward = 34.03
2022-01-26 14:17:55.642 | DEBUG    | __main__:trials:24 - Trial = 18473/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.644 | DEBUG    | __main__:trials:29 - Trial = 18473/30000 | Total reward = 34.65
2022-01-26 14:17:55.646 | DEBUG    | __main__:trials:26 - Trial = 18474/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.648 | DEBUG    | __main__:trials:29 - Trial = 18474/30000 | Total reward = 16.53
2022-01-26 14:17:55.652 | DEBUG    | __main__:trials:24 - Trial = 18475/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.653 | DEBUG    | __main__:trials:29 - Trial = 18475/30000 | Total reward = 27.23
2022-01-26 14:17:55.656 | DEBUG    | __main__:trials:26 - Trial = 18476/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.658 | DEBUG    | __main__:trials:29 - Trial = 18476/30000 | Total reward = 20.39
2022-01-26 14:17:55.661 | DEBUG    | __main__:trials:26 - Trial = 18477/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.662 | DEBUG    | __main__:trials:29 - Trial = 18477/30000 | Total reward = 15.04
2022-01-26 14:17:55.667 | DEBUG    | __main__:trials:24 - Trial = 18478/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.668 | DEBUG    | __main__:trials:29 - Trial = 18478/30000 | Total reward = 46.58
2022-01-26 14:17:55.672 | DEBUG    | __main__:trials:24 - Trial = 18479/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.673 | DEBUG    | __main__:trials:29 - Trial = 18479/30000 | Total reward = 50.57
2022-01-26 14:17:55.677 | DEBUG    | __main__:trials:24 - Trial = 18480/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.678 | DEBUG    | __main__:trials:29 - Trial = 18480/30000 | Total reward = 35.02
2022-01-26 14:17:55.681 | DEBUG    | __main__:trials:24 - Trial = 18481/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.683 | DEBUG    | __main__:trials:29 - Trial = 18481/30000 | Total reward = 34.34
2022-01-26 14:17:55.685 | DEBUG    | __main__:trials:24 - Trial = 18482/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.686 | DEBUG    | __main__:trials:29 - Trial = 18482/30000 | Total reward = 28.01
2022-01-26 14:17:55.689 | DEBUG    | __main__:trials:24 - Trial = 18483/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.691 | DEBUG    | __main__:trials:29 - Trial = 18483/30000 | Total reward = 34.60
2022-01-26 14:17:55.695 | DEBUG    | __main__:trials:24 - Trial = 18484/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.697 | DEBUG    | __main__:trials:29 - Trial = 18484/30000 | Total reward = 35.11
2022-01-26 14:17:55.700 | DEBUG    | __main__:trials:24 - Trial = 18485/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.702 | DEBUG    | __main__:trials:29 - Trial = 18485/30000 | Total reward = 51.57
2022-01-26 14:17:55.706 | DEBUG    | __main__:trials:24 - Trial = 18486/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.706 | DEBUG    | __main__:trials:29 - Trial = 18486/30000 | Total reward = 27.73
2022-01-26 14:17:55.711 | DEBUG    | __main__:trials:24 - Trial = 18487/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.713 | DEBUG    | __main__:trials:29 - Trial = 18487/30000 | Total reward = 40.18
2022-01-26 14:17:55.716 | DEBUG    | __main__:trials:26 - Trial = 18488/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.718 | DEBUG    | __main__:trials:29 - Trial = 18488/30000 | Total reward = 12.78
2022-01-26 14:17:55.721 | DEBUG    | __main__:trials:24 - Trial = 18489/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.721 | DEBUG    | __main__:trials:29 - Trial = 18489/30000 | Total reward = 28.48
2022-01-26 14:17:55.726 | DEBUG    | __main__:trials:24 - Trial = 18490/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.727 | DEBUG    | __main__:trials:29 - Trial = 18490/30000 | Total reward = 40.93
2022-01-26 14:17:55.731 | DEBUG    | __main__:trials:24 - Trial = 18491/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.732 | DEBUG    | __main__:trials:29 - Trial = 18491/30000 | Total reward = 37.48
2022-01-26 14:17:55.736 | DEBUG    | __main__:trials:24 - Trial = 18492/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.737 | DEBUG    | __main__:trials:29 - Trial = 18492/30000 | Total reward = 47.19
2022-01-26 14:17:55.741 | DEBUG    | __main__:trials:24 - Trial = 18493/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.743 | DEBUG    | __main__:trials:29 - Trial = 18493/30000 | Total reward = 33.30
2022-01-26 14:17:55.747 | DEBUG    | __main__:trials:24 - Trial = 18494/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.748 | DEBUG    | __main__:trials:29 - Trial = 18494/30000 | Total reward = 52.01
2022-01-26 14:17:55.752 | DEBUG    | __main__:trials:24 - Trial = 18495/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.754 | DEBUG    | __main__:trials:29 - Trial = 18495/30000 | Total reward = 39.12
2022-01-26 14:17:55.757 | DEBUG    | __main__:trials:24 - Trial = 18496/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.758 | DEBUG    | __main__:trials:29 - Trial = 18496/30000 | Total reward = 41.78
2022-01-26 14:17:55.762 | DEBUG    | __main__:trials:24 - Trial = 18497/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.764 | DEBUG    | __main__:trials:29 - Trial = 18497/30000 | Total reward = 42.20
2022-01-26 14:17:55.767 | DEBUG    | __main__:trials:24 - Trial = 18498/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.768 | DEBUG    | __main__:trials:29 - Trial = 18498/30000 | Total reward = 35.34
2022-01-26 14:17:55.773 | DEBUG    | __main__:trials:24 - Trial = 18499/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.774 | DEBUG    | __main__:trials:29 - Trial = 18499/30000 | Total reward = 32.94
2022-01-26 14:17:55.778 | DEBUG    | __main__:trials:24 - Trial = 18500/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.778 | DEBUG    | __main__:trials:29 - Trial = 18500/30000 | Total reward = 34.75
2022-01-26 14:17:55.782 | DEBUG    | __main__:trials:26 - Trial = 18501/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.784 | DEBUG    | __main__:trials:29 - Trial = 18501/30000 | Total reward = 18.11
2022-01-26 14:17:55.787 | DEBUG    | __main__:trials:24 - Trial = 18502/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.789 | DEBUG    | __main__:trials:29 - Trial = 18502/30000 | Total reward = 50.04
2022-01-26 14:17:55.791 | DEBUG    | __main__:trials:26 - Trial = 18503/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.793 | DEBUG    | __main__:trials:29 - Trial = 18503/30000 | Total reward = 23.86
2022-01-26 14:17:55.797 | DEBUG    | __main__:trials:24 - Trial = 18504/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.799 | DEBUG    | __main__:trials:29 - Trial = 18504/30000 | Total reward = 36.25
2022-01-26 14:17:55.802 | DEBUG    | __main__:trials:26 - Trial = 18505/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.803 | DEBUG    | __main__:trials:29 - Trial = 18505/30000 | Total reward = 31.59
2022-01-26 14:17:55.807 | DEBUG    | __main__:trials:24 - Trial = 18506/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.808 | DEBUG    | __main__:trials:29 - Trial = 18506/30000 | Total reward = 38.94
2022-01-26 14:17:55.812 | DEBUG    | __main__:trials:26 - Trial = 18507/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.813 | DEBUG    | __main__:trials:29 - Trial = 18507/30000 | Total reward = 23.03
2022-01-26 14:17:55.816 | DEBUG    | __main__:trials:26 - Trial = 18508/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:55.818 | DEBUG    | __main__:trials:29 - Trial = 18508/30000 | Total reward = 20.90
2022-01-26 14:17:55.821 | DEBUG    | __main__:trials:24 - Trial = 18509/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.823 | DEBUG    | __main__:trials:29 - Trial = 18509/30000 | Total reward = 33.21
2022-01-26 14:17:55.827 | DEBUG    | __main__:trials:24 - Trial = 18510/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.827 | DEBUG    | __main__:trials:29 - Trial = 18510/30000 | Total reward = 38.64
2022-01-26 14:17:55.832 | DEBUG    | __main__:trials:24 - Trial = 18511/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.834 | DEBUG    | __main__:trials:29 - Trial = 18511/30000 | Total reward = 41.00
2022-01-26 14:17:55.837 | DEBUG    | __main__:trials:24 - Trial = 18512/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.838 | DEBUG    | __main__:trials:29 - Trial = 18512/30000 | Total reward = 33.13
2022-01-26 14:17:55.843 | DEBUG    | __main__:trials:24 - Trial = 18513/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.843 | DEBUG    | __main__:trials:29 - Trial = 18513/30000 | Total reward = 36.72
2022-01-26 14:17:55.848 | DEBUG    | __main__:trials:24 - Trial = 18514/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.849 | DEBUG    | __main__:trials:29 - Trial = 18514/30000 | Total reward = 30.17
2022-01-26 14:17:55.853 | DEBUG    | __main__:trials:24 - Trial = 18515/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.854 | DEBUG    | __main__:trials:29 - Trial = 18515/30000 | Total reward = 35.37
2022-01-26 14:17:55.858 | DEBUG    | __main__:trials:24 - Trial = 18516/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.859 | DEBUG    | __main__:trials:29 - Trial = 18516/30000 | Total reward = 31.37
2022-01-26 14:17:55.863 | DEBUG    | __main__:trials:24 - Trial = 18517/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.865 | DEBUG    | __main__:trials:29 - Trial = 18517/30000 | Total reward = 23.45
2022-01-26 14:17:55.868 | DEBUG    | __main__:trials:24 - Trial = 18518/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.870 | DEBUG    | __main__:trials:29 - Trial = 18518/30000 | Total reward = 36.66
2022-01-26 14:17:55.873 | DEBUG    | __main__:trials:24 - Trial = 18519/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.875 | DEBUG    | __main__:trials:29 - Trial = 18519/30000 | Total reward = 53.34
2022-01-26 14:17:55.879 | DEBUG    | __main__:trials:24 - Trial = 18520/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.879 | DEBUG    | __main__:trials:29 - Trial = 18520/30000 | Total reward = 42.72
2022-01-26 14:17:55.884 | DEBUG    | __main__:trials:24 - Trial = 18521/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.886 | DEBUG    | __main__:trials:29 - Trial = 18521/30000 | Total reward = 33.44
2022-01-26 14:17:55.890 | DEBUG    | __main__:trials:24 - Trial = 18522/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.891 | DEBUG    | __main__:trials:29 - Trial = 18522/30000 | Total reward = 38.57
2022-01-26 14:17:55.895 | DEBUG    | __main__:trials:24 - Trial = 18523/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.896 | DEBUG    | __main__:trials:29 - Trial = 18523/30000 | Total reward = 32.57
2022-01-26 14:17:55.900 | DEBUG    | __main__:trials:24 - Trial = 18524/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.901 | DEBUG    | __main__:trials:29 - Trial = 18524/30000 | Total reward = 30.73
2022-01-26 14:17:55.905 | DEBUG    | __main__:trials:24 - Trial = 18525/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.906 | DEBUG    | __main__:trials:29 - Trial = 18525/30000 | Total reward = 38.36
2022-01-26 14:17:55.910 | DEBUG    | __main__:trials:24 - Trial = 18526/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.912 | DEBUG    | __main__:trials:29 - Trial = 18526/30000 | Total reward = 37.95
2022-01-26 14:17:55.915 | DEBUG    | __main__:trials:24 - Trial = 18527/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.917 | DEBUG    | __main__:trials:29 - Trial = 18527/30000 | Total reward = 37.96
2022-01-26 14:17:55.920 | DEBUG    | __main__:trials:24 - Trial = 18528/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.921 | DEBUG    | __main__:trials:29 - Trial = 18528/30000 | Total reward = 35.35
2022-01-26 14:17:55.925 | DEBUG    | __main__:trials:24 - Trial = 18529/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.925 | DEBUG    | __main__:trials:29 - Trial = 18529/30000 | Total reward = 40.25
2022-01-26 14:17:55.929 | DEBUG    | __main__:trials:24 - Trial = 18530/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.930 | DEBUG    | __main__:trials:29 - Trial = 18530/30000 | Total reward = 40.14
2022-01-26 14:17:55.935 | DEBUG    | __main__:trials:24 - Trial = 18531/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.935 | DEBUG    | __main__:trials:29 - Trial = 18531/30000 | Total reward = 43.58
2022-01-26 14:17:55.940 | DEBUG    | __main__:trials:24 - Trial = 18532/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.940 | DEBUG    | __main__:trials:29 - Trial = 18532/30000 | Total reward = 48.70
2022-01-26 14:17:55.944 | DEBUG    | __main__:trials:24 - Trial = 18533/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.945 | DEBUG    | __main__:trials:29 - Trial = 18533/30000 | Total reward = 25.98
2022-01-26 14:17:55.949 | DEBUG    | __main__:trials:24 - Trial = 18534/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.949 | DEBUG    | __main__:trials:29 - Trial = 18534/30000 | Total reward = 45.69
2022-01-26 14:17:55.954 | DEBUG    | __main__:trials:24 - Trial = 18535/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.955 | DEBUG    | __main__:trials:29 - Trial = 18535/30000 | Total reward = 51.28
2022-01-26 14:17:55.959 | DEBUG    | __main__:trials:24 - Trial = 18536/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.960 | DEBUG    | __main__:trials:29 - Trial = 18536/30000 | Total reward = 48.55
2022-01-26 14:17:55.964 | DEBUG    | __main__:trials:24 - Trial = 18537/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.966 | DEBUG    | __main__:trials:29 - Trial = 18537/30000 | Total reward = 41.95
2022-01-26 14:17:55.970 | DEBUG    | __main__:trials:24 - Trial = 18538/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.971 | DEBUG    | __main__:trials:29 - Trial = 18538/30000 | Total reward = 35.76
2022-01-26 14:17:55.975 | DEBUG    | __main__:trials:24 - Trial = 18539/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.977 | DEBUG    | __main__:trials:29 - Trial = 18539/30000 | Total reward = 36.69
2022-01-26 14:17:55.981 | DEBUG    | __main__:trials:24 - Trial = 18540/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.982 | DEBUG    | __main__:trials:29 - Trial = 18540/30000 | Total reward = 35.91
2022-01-26 14:17:55.985 | DEBUG    | __main__:trials:24 - Trial = 18541/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.986 | DEBUG    | __main__:trials:29 - Trial = 18541/30000 | Total reward = 41.41
2022-01-26 14:17:55.989 | DEBUG    | __main__:trials:24 - Trial = 18542/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.990 | DEBUG    | __main__:trials:29 - Trial = 18542/30000 | Total reward = 53.78
2022-01-26 14:17:55.994 | DEBUG    | __main__:trials:24 - Trial = 18543/30000 | Max number of steps (20) reached
2022-01-26 14:17:55.995 | DEBUG    | __main__:trials:29 - Trial = 18543/30000 | Total reward = 40.79
2022-01-26 14:17:55.998 | DEBUG    | __main__:trials:24 - Trial = 18544/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.000 | DEBUG    | __main__:trials:29 - Trial = 18544/30000 | Total reward = 35.39
2022-01-26 14:17:56.003 | DEBUG    | __main__:trials:24 - Trial = 18545/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.005 | DEBUG    | __main__:trials:29 - Trial = 18545/30000 | Total reward = 38.08
2022-01-26 14:17:56.009 | DEBUG    | __main__:trials:24 - Trial = 18546/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.010 | DEBUG    | __main__:trials:29 - Trial = 18546/30000 | Total reward = 46.03
2022-01-26 14:17:56.014 | DEBUG    | __main__:trials:24 - Trial = 18547/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.016 | DEBUG    | __main__:trials:29 - Trial = 18547/30000 | Total reward = 43.32
2022-01-26 14:17:56.019 | DEBUG    | __main__:trials:24 - Trial = 18548/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.021 | DEBUG    | __main__:trials:29 - Trial = 18548/30000 | Total reward = 49.60
2022-01-26 14:17:56.025 | DEBUG    | __main__:trials:24 - Trial = 18549/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.026 | DEBUG    | __main__:trials:29 - Trial = 18549/30000 | Total reward = 38.03
2022-01-26 14:17:56.029 | DEBUG    | __main__:trials:24 - Trial = 18550/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.031 | DEBUG    | __main__:trials:29 - Trial = 18550/30000 | Total reward = 37.66
2022-01-26 14:17:56.033 | DEBUG    | __main__:trials:24 - Trial = 18551/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.034 | DEBUG    | __main__:trials:29 - Trial = 18551/30000 | Total reward = 42.49
2022-01-26 14:17:56.038 | DEBUG    | __main__:trials:24 - Trial = 18552/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.038 | DEBUG    | __main__:trials:29 - Trial = 18552/30000 | Total reward = 41.39
2022-01-26 14:17:56.042 | DEBUG    | __main__:trials:24 - Trial = 18553/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.043 | DEBUG    | __main__:trials:29 - Trial = 18553/30000 | Total reward = 42.18
2022-01-26 14:17:56.046 | DEBUG    | __main__:trials:24 - Trial = 18554/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.047 | DEBUG    | __main__:trials:29 - Trial = 18554/30000 | Total reward = 45.97
2022-01-26 14:17:56.050 | DEBUG    | __main__:trials:24 - Trial = 18555/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.053 | DEBUG    | __main__:trials:29 - Trial = 18555/30000 | Total reward = 37.55
2022-01-26 14:17:56.055 | DEBUG    | __main__:trials:26 - Trial = 18556/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.056 | DEBUG    | __main__:trials:29 - Trial = 18556/30000 | Total reward = 17.99
2022-01-26 14:17:56.060 | DEBUG    | __main__:trials:24 - Trial = 18557/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.061 | DEBUG    | __main__:trials:29 - Trial = 18557/30000 | Total reward = 32.19
2022-01-26 14:17:56.065 | DEBUG    | __main__:trials:24 - Trial = 18558/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.066 | DEBUG    | __main__:trials:29 - Trial = 18558/30000 | Total reward = 32.67
2022-01-26 14:17:56.069 | DEBUG    | __main__:trials:24 - Trial = 18559/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.071 | DEBUG    | __main__:trials:29 - Trial = 18559/30000 | Total reward = 35.58
2022-01-26 14:17:56.073 | DEBUG    | __main__:trials:24 - Trial = 18560/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.074 | DEBUG    | __main__:trials:29 - Trial = 18560/30000 | Total reward = 37.33
2022-01-26 14:17:56.078 | DEBUG    | __main__:trials:24 - Trial = 18561/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.078 | DEBUG    | __main__:trials:29 - Trial = 18561/30000 | Total reward = 35.03
2022-01-26 14:17:56.081 | DEBUG    | __main__:trials:24 - Trial = 18562/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.082 | DEBUG    | __main__:trials:29 - Trial = 18562/30000 | Total reward = 20.08
2022-01-26 14:17:56.086 | DEBUG    | __main__:trials:24 - Trial = 18563/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.088 | DEBUG    | __main__:trials:29 - Trial = 18563/30000 | Total reward = 46.75
2022-01-26 14:17:56.091 | DEBUG    | __main__:trials:24 - Trial = 18564/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.093 | DEBUG    | __main__:trials:29 - Trial = 18564/30000 | Total reward = 33.24
2022-01-26 14:17:56.096 | DEBUG    | __main__:trials:24 - Trial = 18565/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.098 | DEBUG    | __main__:trials:29 - Trial = 18565/30000 | Total reward = 38.01
2022-01-26 14:17:56.101 | DEBUG    | __main__:trials:24 - Trial = 18566/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.102 | DEBUG    | __main__:trials:29 - Trial = 18566/30000 | Total reward = 49.75
2022-01-26 14:17:56.106 | DEBUG    | __main__:trials:24 - Trial = 18567/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.107 | DEBUG    | __main__:trials:29 - Trial = 18567/30000 | Total reward = 24.29
2022-01-26 14:17:56.111 | DEBUG    | __main__:trials:24 - Trial = 18568/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.112 | DEBUG    | __main__:trials:29 - Trial = 18568/30000 | Total reward = 39.16
2022-01-26 14:17:56.115 | DEBUG    | __main__:trials:24 - Trial = 18569/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.117 | DEBUG    | __main__:trials:29 - Trial = 18569/30000 | Total reward = 56.93
2022-01-26 14:17:56.121 | DEBUG    | __main__:trials:24 - Trial = 18570/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.122 | DEBUG    | __main__:trials:29 - Trial = 18570/30000 | Total reward = 31.37
2022-01-26 14:17:56.126 | DEBUG    | __main__:trials:24 - Trial = 18571/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.127 | DEBUG    | __main__:trials:29 - Trial = 18571/30000 | Total reward = 24.50
2022-01-26 14:17:56.130 | DEBUG    | __main__:trials:26 - Trial = 18572/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.132 | DEBUG    | __main__:trials:29 - Trial = 18572/30000 | Total reward = 17.84
2022-01-26 14:17:56.136 | DEBUG    | __main__:trials:24 - Trial = 18573/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.137 | DEBUG    | __main__:trials:29 - Trial = 18573/30000 | Total reward = 48.01
2022-01-26 14:17:56.141 | DEBUG    | __main__:trials:24 - Trial = 18574/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.142 | DEBUG    | __main__:trials:29 - Trial = 18574/30000 | Total reward = 61.46
2022-01-26 14:17:56.147 | DEBUG    | __main__:trials:24 - Trial = 18575/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.148 | DEBUG    | __main__:trials:29 - Trial = 18575/30000 | Total reward = 30.17
2022-01-26 14:17:56.151 | DEBUG    | __main__:trials:24 - Trial = 18576/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.153 | DEBUG    | __main__:trials:29 - Trial = 18576/30000 | Total reward = 39.39
2022-01-26 14:17:56.156 | DEBUG    | __main__:trials:26 - Trial = 18577/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.158 | DEBUG    | __main__:trials:29 - Trial = 18577/30000 | Total reward = 26.14
2022-01-26 14:17:56.162 | DEBUG    | __main__:trials:24 - Trial = 18578/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.163 | DEBUG    | __main__:trials:29 - Trial = 18578/30000 | Total reward = 46.41
2022-01-26 14:17:56.166 | DEBUG    | __main__:trials:24 - Trial = 18579/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.168 | DEBUG    | __main__:trials:29 - Trial = 18579/30000 | Total reward = 46.41
2022-01-26 14:17:56.171 | DEBUG    | __main__:trials:24 - Trial = 18580/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.173 | DEBUG    | __main__:trials:29 - Trial = 18580/30000 | Total reward = 44.86
2022-01-26 14:17:56.176 | DEBUG    | __main__:trials:24 - Trial = 18581/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.178 | DEBUG    | __main__:trials:29 - Trial = 18581/30000 | Total reward = 32.39
2022-01-26 14:17:56.182 | DEBUG    | __main__:trials:24 - Trial = 18582/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.183 | DEBUG    | __main__:trials:29 - Trial = 18582/30000 | Total reward = 52.56
2022-01-26 14:17:56.186 | DEBUG    | __main__:trials:26 - Trial = 18583/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.188 | DEBUG    | __main__:trials:29 - Trial = 18583/30000 | Total reward = 21.17
2022-01-26 14:17:56.191 | DEBUG    | __main__:trials:24 - Trial = 18584/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.192 | DEBUG    | __main__:trials:29 - Trial = 18584/30000 | Total reward = 46.45
2022-01-26 14:17:56.196 | DEBUG    | __main__:trials:24 - Trial = 18585/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.197 | DEBUG    | __main__:trials:29 - Trial = 18585/30000 | Total reward = 43.76
2022-01-26 14:17:56.200 | DEBUG    | __main__:trials:24 - Trial = 18586/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.202 | DEBUG    | __main__:trials:29 - Trial = 18586/30000 | Total reward = 51.54
2022-01-26 14:17:56.205 | DEBUG    | __main__:trials:24 - Trial = 18587/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.206 | DEBUG    | __main__:trials:29 - Trial = 18587/30000 | Total reward = 34.34
2022-01-26 14:17:56.209 | DEBUG    | __main__:trials:24 - Trial = 18588/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.211 | DEBUG    | __main__:trials:29 - Trial = 18588/30000 | Total reward = 36.08
2022-01-26 14:17:56.214 | DEBUG    | __main__:trials:24 - Trial = 18589/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.215 | DEBUG    | __main__:trials:29 - Trial = 18589/30000 | Total reward = 30.48
2022-01-26 14:17:56.218 | DEBUG    | __main__:trials:26 - Trial = 18590/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.220 | DEBUG    | __main__:trials:29 - Trial = 18590/30000 | Total reward = 27.55
2022-01-26 14:17:56.225 | DEBUG    | __main__:trials:24 - Trial = 18591/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.226 | DEBUG    | __main__:trials:29 - Trial = 18591/30000 | Total reward = 29.50
2022-01-26 14:17:56.230 | DEBUG    | __main__:trials:24 - Trial = 18592/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.231 | DEBUG    | __main__:trials:29 - Trial = 18592/30000 | Total reward = 34.69
2022-01-26 14:17:56.235 | DEBUG    | __main__:trials:24 - Trial = 18593/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.237 | DEBUG    | __main__:trials:29 - Trial = 18593/30000 | Total reward = 35.94
2022-01-26 14:17:56.241 | DEBUG    | __main__:trials:24 - Trial = 18594/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.242 | DEBUG    | __main__:trials:29 - Trial = 18594/30000 | Total reward = 33.37
2022-01-26 14:17:56.245 | DEBUG    | __main__:trials:24 - Trial = 18595/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.246 | DEBUG    | __main__:trials:29 - Trial = 18595/30000 | Total reward = 44.95
2022-01-26 14:17:56.250 | DEBUG    | __main__:trials:24 - Trial = 18596/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.252 | DEBUG    | __main__:trials:29 - Trial = 18596/30000 | Total reward = 45.72
2022-01-26 14:17:56.253 | DEBUG    | __main__:trials:26 - Trial = 18597/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.255 | DEBUG    | __main__:trials:29 - Trial = 18597/30000 | Total reward = 10.62
2022-01-26 14:17:56.257 | DEBUG    | __main__:trials:26 - Trial = 18598/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.258 | DEBUG    | __main__:trials:29 - Trial = 18598/30000 | Total reward = 10.92
2022-01-26 14:17:56.261 | DEBUG    | __main__:trials:24 - Trial = 18599/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.262 | DEBUG    | __main__:trials:29 - Trial = 18599/30000 | Total reward = 49.25
2022-01-26 14:17:56.265 | DEBUG    | __main__:trials:26 - Trial = 18600/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.266 | DEBUG    | __main__:trials:29 - Trial = 18600/30000 | Total reward = 20.46
2022-01-26 14:17:56.270 | DEBUG    | __main__:trials:24 - Trial = 18601/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.271 | DEBUG    | __main__:trials:29 - Trial = 18601/30000 | Total reward = 27.17
2022-01-26 14:17:56.275 | DEBUG    | __main__:trials:24 - Trial = 18602/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.277 | DEBUG    | __main__:trials:29 - Trial = 18602/30000 | Total reward = 51.61
2022-01-26 14:17:56.280 | DEBUG    | __main__:trials:24 - Trial = 18603/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.282 | DEBUG    | __main__:trials:29 - Trial = 18603/30000 | Total reward = 36.46
2022-01-26 14:17:56.285 | DEBUG    | __main__:trials:26 - Trial = 18604/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.286 | DEBUG    | __main__:trials:29 - Trial = 18604/30000 | Total reward = 13.83
2022-01-26 14:17:56.290 | DEBUG    | __main__:trials:24 - Trial = 18605/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.291 | DEBUG    | __main__:trials:29 - Trial = 18605/30000 | Total reward = 52.28
2022-01-26 14:17:56.295 | DEBUG    | __main__:trials:24 - Trial = 18606/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.297 | DEBUG    | __main__:trials:29 - Trial = 18606/30000 | Total reward = 45.71
2022-01-26 14:17:56.300 | DEBUG    | __main__:trials:26 - Trial = 18607/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.300 | DEBUG    | __main__:trials:29 - Trial = 18607/30000 | Total reward = 11.75
2022-01-26 14:17:56.304 | DEBUG    | __main__:trials:26 - Trial = 18608/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.305 | DEBUG    | __main__:trials:29 - Trial = 18608/30000 | Total reward = 13.83
2022-01-26 14:17:56.308 | DEBUG    | __main__:trials:24 - Trial = 18609/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.310 | DEBUG    | __main__:trials:29 - Trial = 18609/30000 | Total reward = 50.88
2022-01-26 14:17:56.314 | DEBUG    | __main__:trials:24 - Trial = 18610/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.315 | DEBUG    | __main__:trials:29 - Trial = 18610/30000 | Total reward = 44.22
2022-01-26 14:17:56.318 | DEBUG    | __main__:trials:26 - Trial = 18611/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.320 | DEBUG    | __main__:trials:29 - Trial = 18611/30000 | Total reward = 14.83
2022-01-26 14:17:56.323 | DEBUG    | __main__:trials:26 - Trial = 18612/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.325 | DEBUG    | __main__:trials:29 - Trial = 18612/30000 | Total reward = 29.34
2022-01-26 14:17:56.327 | DEBUG    | __main__:trials:24 - Trial = 18613/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.329 | DEBUG    | __main__:trials:29 - Trial = 18613/30000 | Total reward = 52.22
2022-01-26 14:17:56.332 | DEBUG    | __main__:trials:26 - Trial = 18614/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.334 | DEBUG    | __main__:trials:29 - Trial = 18614/30000 | Total reward = 14.85
2022-01-26 14:17:56.337 | DEBUG    | __main__:trials:26 - Trial = 18615/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.339 | DEBUG    | __main__:trials:29 - Trial = 18615/30000 | Total reward = 25.90
2022-01-26 14:17:56.343 | DEBUG    | __main__:trials:24 - Trial = 18616/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.344 | DEBUG    | __main__:trials:29 - Trial = 18616/30000 | Total reward = 51.82
2022-01-26 14:17:56.348 | DEBUG    | __main__:trials:24 - Trial = 18617/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.349 | DEBUG    | __main__:trials:29 - Trial = 18617/30000 | Total reward = 46.76
2022-01-26 14:17:56.352 | DEBUG    | __main__:trials:26 - Trial = 18618/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.354 | DEBUG    | __main__:trials:29 - Trial = 18618/30000 | Total reward = 12.34
2022-01-26 14:17:56.357 | DEBUG    | __main__:trials:26 - Trial = 18619/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.357 | DEBUG    | __main__:trials:29 - Trial = 18619/30000 | Total reward = 14.85
2022-01-26 14:17:56.361 | DEBUG    | __main__:trials:26 - Trial = 18620/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.361 | DEBUG    | __main__:trials:29 - Trial = 18620/30000 | Total reward = 15.29
2022-01-26 14:17:56.364 | DEBUG    | __main__:trials:26 - Trial = 18621/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.366 | DEBUG    | __main__:trials:29 - Trial = 18621/30000 | Total reward = 17.79
2022-01-26 14:17:56.369 | DEBUG    | __main__:trials:24 - Trial = 18622/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.369 | DEBUG    | __main__:trials:29 - Trial = 18622/30000 | Total reward = 43.75
2022-01-26 14:17:56.373 | DEBUG    | __main__:trials:24 - Trial = 18623/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.374 | DEBUG    | __main__:trials:29 - Trial = 18623/30000 | Total reward = 46.98
2022-01-26 14:17:56.378 | DEBUG    | __main__:trials:24 - Trial = 18624/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.379 | DEBUG    | __main__:trials:29 - Trial = 18624/30000 | Total reward = 51.77
2022-01-26 14:17:56.382 | DEBUG    | __main__:trials:26 - Trial = 18625/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.384 | DEBUG    | __main__:trials:29 - Trial = 18625/30000 | Total reward = 13.83
2022-01-26 14:17:56.386 | DEBUG    | __main__:trials:26 - Trial = 18626/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.388 | DEBUG    | __main__:trials:29 - Trial = 18626/30000 | Total reward = 10.77
2022-01-26 14:17:56.391 | DEBUG    | __main__:trials:26 - Trial = 18627/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.391 | DEBUG    | __main__:trials:29 - Trial = 18627/30000 | Total reward = 10.45
2022-01-26 14:17:56.396 | DEBUG    | __main__:trials:24 - Trial = 18628/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.397 | DEBUG    | __main__:trials:29 - Trial = 18628/30000 | Total reward = 59.81
2022-01-26 14:17:56.400 | DEBUG    | __main__:trials:26 - Trial = 18629/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.401 | DEBUG    | __main__:trials:29 - Trial = 18629/30000 | Total reward = 15.06
2022-01-26 14:17:56.405 | DEBUG    | __main__:trials:26 - Trial = 18630/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.405 | DEBUG    | __main__:trials:29 - Trial = 18630/30000 | Total reward = 16.31
2022-01-26 14:17:56.410 | DEBUG    | __main__:trials:24 - Trial = 18631/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.412 | DEBUG    | __main__:trials:29 - Trial = 18631/30000 | Total reward = 38.35
2022-01-26 14:17:56.416 | DEBUG    | __main__:trials:24 - Trial = 18632/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.417 | DEBUG    | __main__:trials:29 - Trial = 18632/30000 | Total reward = 44.99
2022-01-26 14:17:56.421 | DEBUG    | __main__:trials:24 - Trial = 18633/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.423 | DEBUG    | __main__:trials:29 - Trial = 18633/30000 | Total reward = 43.15
2022-01-26 14:17:56.426 | DEBUG    | __main__:trials:24 - Trial = 18634/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.428 | DEBUG    | __main__:trials:29 - Trial = 18634/30000 | Total reward = 43.73
2022-01-26 14:17:56.431 | DEBUG    | __main__:trials:24 - Trial = 18635/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.433 | DEBUG    | __main__:trials:29 - Trial = 18635/30000 | Total reward = 48.54
2022-01-26 14:17:56.436 | DEBUG    | __main__:trials:24 - Trial = 18636/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.438 | DEBUG    | __main__:trials:29 - Trial = 18636/30000 | Total reward = 39.05
2022-01-26 14:17:56.441 | DEBUG    | __main__:trials:24 - Trial = 18637/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.443 | DEBUG    | __main__:trials:29 - Trial = 18637/30000 | Total reward = 32.95
2022-01-26 14:17:56.446 | DEBUG    | __main__:trials:24 - Trial = 18638/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.448 | DEBUG    | __main__:trials:29 - Trial = 18638/30000 | Total reward = 37.73
2022-01-26 14:17:56.452 | DEBUG    | __main__:trials:24 - Trial = 18639/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.453 | DEBUG    | __main__:trials:29 - Trial = 18639/30000 | Total reward = 39.37
2022-01-26 14:17:56.456 | DEBUG    | __main__:trials:24 - Trial = 18640/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.458 | DEBUG    | __main__:trials:29 - Trial = 18640/30000 | Total reward = 33.51
2022-01-26 14:17:56.462 | DEBUG    | __main__:trials:24 - Trial = 18641/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.463 | DEBUG    | __main__:trials:29 - Trial = 18641/30000 | Total reward = 31.74
2022-01-26 14:17:56.467 | DEBUG    | __main__:trials:24 - Trial = 18642/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.469 | DEBUG    | __main__:trials:29 - Trial = 18642/30000 | Total reward = 40.62
2022-01-26 14:17:56.472 | DEBUG    | __main__:trials:26 - Trial = 18643/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.474 | DEBUG    | __main__:trials:29 - Trial = 18643/30000 | Total reward = 23.52
2022-01-26 14:17:56.478 | DEBUG    | __main__:trials:24 - Trial = 18644/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.479 | DEBUG    | __main__:trials:29 - Trial = 18644/30000 | Total reward = 39.00
2022-01-26 14:17:56.483 | DEBUG    | __main__:trials:24 - Trial = 18645/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.485 | DEBUG    | __main__:trials:29 - Trial = 18645/30000 | Total reward = 36.96
2022-01-26 14:17:56.488 | DEBUG    | __main__:trials:24 - Trial = 18646/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.490 | DEBUG    | __main__:trials:29 - Trial = 18646/30000 | Total reward = 55.06
2022-01-26 14:17:56.494 | DEBUG    | __main__:trials:24 - Trial = 18647/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.495 | DEBUG    | __main__:trials:29 - Trial = 18647/30000 | Total reward = 34.28
2022-01-26 14:17:56.499 | DEBUG    | __main__:trials:26 - Trial = 18648/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.500 | DEBUG    | __main__:trials:29 - Trial = 18648/30000 | Total reward = 27.03
2022-01-26 14:17:56.504 | DEBUG    | __main__:trials:24 - Trial = 18649/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.505 | DEBUG    | __main__:trials:29 - Trial = 18649/30000 | Total reward = 39.81
2022-01-26 14:17:56.509 | DEBUG    | __main__:trials:24 - Trial = 18650/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.511 | DEBUG    | __main__:trials:29 - Trial = 18650/30000 | Total reward = 35.76
2022-01-26 14:17:56.514 | DEBUG    | __main__:trials:24 - Trial = 18651/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.516 | DEBUG    | __main__:trials:29 - Trial = 18651/30000 | Total reward = 36.46
2022-01-26 14:17:56.519 | DEBUG    | __main__:trials:24 - Trial = 18652/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.520 | DEBUG    | __main__:trials:29 - Trial = 18652/30000 | Total reward = 43.13
2022-01-26 14:17:56.524 | DEBUG    | __main__:trials:24 - Trial = 18653/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.525 | DEBUG    | __main__:trials:29 - Trial = 18653/30000 | Total reward = 40.97
2022-01-26 14:17:56.529 | DEBUG    | __main__:trials:24 - Trial = 18654/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.531 | DEBUG    | __main__:trials:29 - Trial = 18654/30000 | Total reward = 44.56
2022-01-26 14:17:56.534 | DEBUG    | __main__:trials:24 - Trial = 18655/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.536 | DEBUG    | __main__:trials:29 - Trial = 18655/30000 | Total reward = 42.94
2022-01-26 14:17:56.540 | DEBUG    | __main__:trials:24 - Trial = 18656/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.541 | DEBUG    | __main__:trials:29 - Trial = 18656/30000 | Total reward = 59.59
2022-01-26 14:17:56.545 | DEBUG    | __main__:trials:24 - Trial = 18657/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.547 | DEBUG    | __main__:trials:29 - Trial = 18657/30000 | Total reward = 42.91
2022-01-26 14:17:56.550 | DEBUG    | __main__:trials:24 - Trial = 18658/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.552 | DEBUG    | __main__:trials:29 - Trial = 18658/30000 | Total reward = 43.81
2022-01-26 14:17:56.555 | DEBUG    | __main__:trials:24 - Trial = 18659/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.556 | DEBUG    | __main__:trials:29 - Trial = 18659/30000 | Total reward = 35.95
2022-01-26 14:17:56.560 | DEBUG    | __main__:trials:24 - Trial = 18660/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.562 | DEBUG    | __main__:trials:29 - Trial = 18660/30000 | Total reward = 46.45
2022-01-26 14:17:56.566 | DEBUG    | __main__:trials:24 - Trial = 18661/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.567 | DEBUG    | __main__:trials:29 - Trial = 18661/30000 | Total reward = 47.60
2022-01-26 14:17:56.570 | DEBUG    | __main__:trials:26 - Trial = 18662/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.572 | DEBUG    | __main__:trials:29 - Trial = 18662/30000 | Total reward = 20.39
2022-01-26 14:17:56.576 | DEBUG    | __main__:trials:24 - Trial = 18663/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.577 | DEBUG    | __main__:trials:29 - Trial = 18663/30000 | Total reward = 41.94
2022-01-26 14:17:56.581 | DEBUG    | __main__:trials:24 - Trial = 18664/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.583 | DEBUG    | __main__:trials:29 - Trial = 18664/30000 | Total reward = 46.47
2022-01-26 14:17:56.587 | DEBUG    | __main__:trials:24 - Trial = 18665/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.588 | DEBUG    | __main__:trials:29 - Trial = 18665/30000 | Total reward = 41.55
2022-01-26 14:17:56.592 | DEBUG    | __main__:trials:24 - Trial = 18666/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.593 | DEBUG    | __main__:trials:29 - Trial = 18666/30000 | Total reward = 43.61
2022-01-26 14:17:56.597 | DEBUG    | __main__:trials:24 - Trial = 18667/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.598 | DEBUG    | __main__:trials:29 - Trial = 18667/30000 | Total reward = 36.58
2022-01-26 14:17:56.601 | DEBUG    | __main__:trials:24 - Trial = 18668/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.602 | DEBUG    | __main__:trials:29 - Trial = 18668/30000 | Total reward = 49.25
2022-01-26 14:17:56.605 | DEBUG    | __main__:trials:24 - Trial = 18669/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.606 | DEBUG    | __main__:trials:29 - Trial = 18669/30000 | Total reward = 58.54
2022-01-26 14:17:56.609 | DEBUG    | __main__:trials:24 - Trial = 18670/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.611 | DEBUG    | __main__:trials:29 - Trial = 18670/30000 | Total reward = 48.37
2022-01-26 14:17:56.615 | DEBUG    | __main__:trials:24 - Trial = 18671/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.617 | DEBUG    | __main__:trials:29 - Trial = 18671/30000 | Total reward = 42.85
2022-01-26 14:17:56.620 | DEBUG    | __main__:trials:24 - Trial = 18672/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.622 | DEBUG    | __main__:trials:29 - Trial = 18672/30000 | Total reward = 53.60
2022-01-26 14:17:56.625 | DEBUG    | __main__:trials:26 - Trial = 18673/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.627 | DEBUG    | __main__:trials:29 - Trial = 18673/30000 | Total reward = 38.34
2022-01-26 14:17:56.631 | DEBUG    | __main__:trials:24 - Trial = 18674/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.632 | DEBUG    | __main__:trials:29 - Trial = 18674/30000 | Total reward = 37.10
2022-01-26 14:17:56.636 | DEBUG    | __main__:trials:24 - Trial = 18675/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.637 | DEBUG    | __main__:trials:29 - Trial = 18675/30000 | Total reward = 38.10
2022-01-26 14:17:56.641 | DEBUG    | __main__:trials:24 - Trial = 18676/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.642 | DEBUG    | __main__:trials:29 - Trial = 18676/30000 | Total reward = 42.31
2022-01-26 14:17:56.644 | DEBUG    | __main__:trials:26 - Trial = 18677/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.646 | DEBUG    | __main__:trials:29 - Trial = 18677/30000 | Total reward = 14.84
2022-01-26 14:17:56.649 | DEBUG    | __main__:trials:24 - Trial = 18678/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.650 | DEBUG    | __main__:trials:29 - Trial = 18678/30000 | Total reward = 40.63
2022-01-26 14:17:56.653 | DEBUG    | __main__:trials:24 - Trial = 18679/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.655 | DEBUG    | __main__:trials:29 - Trial = 18679/30000 | Total reward = 40.25
2022-01-26 14:17:56.659 | DEBUG    | __main__:trials:24 - Trial = 18680/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.661 | DEBUG    | __main__:trials:29 - Trial = 18680/30000 | Total reward = 40.49
2022-01-26 14:17:56.664 | DEBUG    | __main__:trials:24 - Trial = 18681/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.666 | DEBUG    | __main__:trials:29 - Trial = 18681/30000 | Total reward = 43.87
2022-01-26 14:17:56.670 | DEBUG    | __main__:trials:24 - Trial = 18682/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.671 | DEBUG    | __main__:trials:29 - Trial = 18682/30000 | Total reward = 29.81
2022-01-26 14:17:56.675 | DEBUG    | __main__:trials:26 - Trial = 18683/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.677 | DEBUG    | __main__:trials:29 - Trial = 18683/30000 | Total reward = 27.89
2022-01-26 14:17:56.680 | DEBUG    | __main__:trials:24 - Trial = 18684/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.682 | DEBUG    | __main__:trials:29 - Trial = 18684/30000 | Total reward = 34.43
2022-01-26 14:17:56.685 | DEBUG    | __main__:trials:24 - Trial = 18685/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.686 | DEBUG    | __main__:trials:29 - Trial = 18685/30000 | Total reward = 59.02
2022-01-26 14:17:56.689 | DEBUG    | __main__:trials:24 - Trial = 18686/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.690 | DEBUG    | __main__:trials:29 - Trial = 18686/30000 | Total reward = 40.25
2022-01-26 14:17:56.694 | DEBUG    | __main__:trials:24 - Trial = 18687/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.695 | DEBUG    | __main__:trials:29 - Trial = 18687/30000 | Total reward = 45.49
2022-01-26 14:17:56.699 | DEBUG    | __main__:trials:24 - Trial = 18688/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.701 | DEBUG    | __main__:trials:29 - Trial = 18688/30000 | Total reward = 35.86
2022-01-26 14:17:56.704 | DEBUG    | __main__:trials:24 - Trial = 18689/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.705 | DEBUG    | __main__:trials:29 - Trial = 18689/30000 | Total reward = 38.02
2022-01-26 14:17:56.709 | DEBUG    | __main__:trials:24 - Trial = 18690/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.710 | DEBUG    | __main__:trials:29 - Trial = 18690/30000 | Total reward = 44.66
2022-01-26 14:17:56.713 | DEBUG    | __main__:trials:24 - Trial = 18691/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.714 | DEBUG    | __main__:trials:29 - Trial = 18691/30000 | Total reward = 35.71
2022-01-26 14:17:56.717 | DEBUG    | __main__:trials:24 - Trial = 18692/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.719 | DEBUG    | __main__:trials:29 - Trial = 18692/30000 | Total reward = 40.25
2022-01-26 14:17:56.722 | DEBUG    | __main__:trials:26 - Trial = 18693/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.724 | DEBUG    | __main__:trials:29 - Trial = 18693/30000 | Total reward = 19.21
2022-01-26 14:17:56.727 | DEBUG    | __main__:trials:24 - Trial = 18694/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.729 | DEBUG    | __main__:trials:29 - Trial = 18694/30000 | Total reward = 37.79
2022-01-26 14:17:56.732 | DEBUG    | __main__:trials:24 - Trial = 18695/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.734 | DEBUG    | __main__:trials:29 - Trial = 18695/30000 | Total reward = 35.64
2022-01-26 14:17:56.737 | DEBUG    | __main__:trials:26 - Trial = 18696/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.739 | DEBUG    | __main__:trials:29 - Trial = 18696/30000 | Total reward = 23.35
2022-01-26 14:17:56.742 | DEBUG    | __main__:trials:26 - Trial = 18697/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.744 | DEBUG    | __main__:trials:29 - Trial = 18697/30000 | Total reward = 19.66
2022-01-26 14:17:56.747 | DEBUG    | __main__:trials:26 - Trial = 18698/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.749 | DEBUG    | __main__:trials:29 - Trial = 18698/30000 | Total reward = 24.77
2022-01-26 14:17:56.751 | DEBUG    | __main__:trials:26 - Trial = 18699/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.753 | DEBUG    | __main__:trials:29 - Trial = 18699/30000 | Total reward = 8.99
2022-01-26 14:17:56.756 | DEBUG    | __main__:trials:26 - Trial = 18700/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.756 | DEBUG    | __main__:trials:29 - Trial = 18700/30000 | Total reward = 13.83
2022-01-26 14:17:56.759 | DEBUG    | __main__:trials:26 - Trial = 18701/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.761 | DEBUG    | __main__:trials:29 - Trial = 18701/30000 | Total reward = 12.83
2022-01-26 14:17:56.765 | DEBUG    | __main__:trials:24 - Trial = 18702/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.767 | DEBUG    | __main__:trials:29 - Trial = 18702/30000 | Total reward = 43.68
2022-01-26 14:17:56.770 | DEBUG    | __main__:trials:26 - Trial = 18703/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.772 | DEBUG    | __main__:trials:29 - Trial = 18703/30000 | Total reward = 23.20
2022-01-26 14:17:56.775 | DEBUG    | __main__:trials:26 - Trial = 18704/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.777 | DEBUG    | __main__:trials:29 - Trial = 18704/30000 | Total reward = 24.23
2022-01-26 14:17:56.780 | DEBUG    | __main__:trials:26 - Trial = 18705/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.781 | DEBUG    | __main__:trials:29 - Trial = 18705/30000 | Total reward = 17.53
2022-01-26 14:17:56.785 | DEBUG    | __main__:trials:24 - Trial = 18706/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.787 | DEBUG    | __main__:trials:29 - Trial = 18706/30000 | Total reward = 32.57
2022-01-26 14:17:56.791 | DEBUG    | __main__:trials:26 - Trial = 18707/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.791 | DEBUG    | __main__:trials:29 - Trial = 18707/30000 | Total reward = 28.66
2022-01-26 14:17:56.795 | DEBUG    | __main__:trials:24 - Trial = 18708/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.797 | DEBUG    | __main__:trials:29 - Trial = 18708/30000 | Total reward = 37.93
2022-01-26 14:17:56.800 | DEBUG    | __main__:trials:24 - Trial = 18709/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.802 | DEBUG    | __main__:trials:29 - Trial = 18709/30000 | Total reward = 50.62
2022-01-26 14:17:56.805 | DEBUG    | __main__:trials:26 - Trial = 18710/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.807 | DEBUG    | __main__:trials:29 - Trial = 18710/30000 | Total reward = 20.58
2022-01-26 14:17:56.811 | DEBUG    | __main__:trials:24 - Trial = 18711/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.812 | DEBUG    | __main__:trials:29 - Trial = 18711/30000 | Total reward = 24.19
2022-01-26 14:17:56.815 | DEBUG    | __main__:trials:26 - Trial = 18712/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.816 | DEBUG    | __main__:trials:29 - Trial = 18712/30000 | Total reward = 11.46
2022-01-26 14:17:56.818 | DEBUG    | __main__:trials:26 - Trial = 18713/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.820 | DEBUG    | __main__:trials:29 - Trial = 18713/30000 | Total reward = 11.46
2022-01-26 14:17:56.824 | DEBUG    | __main__:trials:24 - Trial = 18714/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.825 | DEBUG    | __main__:trials:29 - Trial = 18714/30000 | Total reward = 48.69
2022-01-26 14:17:56.829 | DEBUG    | __main__:trials:24 - Trial = 18715/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.831 | DEBUG    | __main__:trials:29 - Trial = 18715/30000 | Total reward = 44.49
2022-01-26 14:17:56.835 | DEBUG    | __main__:trials:24 - Trial = 18716/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.836 | DEBUG    | __main__:trials:29 - Trial = 18716/30000 | Total reward = 35.45
2022-01-26 14:17:56.840 | DEBUG    | __main__:trials:24 - Trial = 18717/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.841 | DEBUG    | __main__:trials:29 - Trial = 18717/30000 | Total reward = 37.34
2022-01-26 14:17:56.845 | DEBUG    | __main__:trials:24 - Trial = 18718/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.847 | DEBUG    | __main__:trials:29 - Trial = 18718/30000 | Total reward = 37.49
2022-01-26 14:17:56.850 | DEBUG    | __main__:trials:24 - Trial = 18719/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.851 | DEBUG    | __main__:trials:29 - Trial = 18719/30000 | Total reward = 39.41
2022-01-26 14:17:56.855 | DEBUG    | __main__:trials:24 - Trial = 18720/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.857 | DEBUG    | __main__:trials:29 - Trial = 18720/30000 | Total reward = 53.60
2022-01-26 14:17:56.860 | DEBUG    | __main__:trials:24 - Trial = 18721/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.862 | DEBUG    | __main__:trials:29 - Trial = 18721/30000 | Total reward = 37.80
2022-01-26 14:17:56.865 | DEBUG    | __main__:trials:26 - Trial = 18722/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:56.867 | DEBUG    | __main__:trials:29 - Trial = 18722/30000 | Total reward = 24.04
2022-01-26 14:17:56.870 | DEBUG    | __main__:trials:24 - Trial = 18723/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.872 | DEBUG    | __main__:trials:29 - Trial = 18723/30000 | Total reward = 39.00
2022-01-26 14:17:56.875 | DEBUG    | __main__:trials:24 - Trial = 18724/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.877 | DEBUG    | __main__:trials:29 - Trial = 18724/30000 | Total reward = 47.60
2022-01-26 14:17:56.880 | DEBUG    | __main__:trials:24 - Trial = 18725/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.881 | DEBUG    | __main__:trials:29 - Trial = 18725/30000 | Total reward = 42.87
2022-01-26 14:17:56.885 | DEBUG    | __main__:trials:24 - Trial = 18726/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.885 | DEBUG    | __main__:trials:29 - Trial = 18726/30000 | Total reward = 50.22
2022-01-26 14:17:56.889 | DEBUG    | __main__:trials:24 - Trial = 18727/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.889 | DEBUG    | __main__:trials:29 - Trial = 18727/30000 | Total reward = 38.13
2022-01-26 14:17:56.894 | DEBUG    | __main__:trials:24 - Trial = 18728/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.896 | DEBUG    | __main__:trials:29 - Trial = 18728/30000 | Total reward = 36.76
2022-01-26 14:17:56.899 | DEBUG    | __main__:trials:24 - Trial = 18729/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.901 | DEBUG    | __main__:trials:29 - Trial = 18729/30000 | Total reward = 37.17
2022-01-26 14:17:56.905 | DEBUG    | __main__:trials:24 - Trial = 18730/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.907 | DEBUG    | __main__:trials:29 - Trial = 18730/30000 | Total reward = 44.91
2022-01-26 14:17:56.910 | DEBUG    | __main__:trials:24 - Trial = 18731/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.912 | DEBUG    | __main__:trials:29 - Trial = 18731/30000 | Total reward = 40.25
2022-01-26 14:17:56.916 | DEBUG    | __main__:trials:24 - Trial = 18732/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.917 | DEBUG    | __main__:trials:29 - Trial = 18732/30000 | Total reward = 39.94
2022-01-26 14:17:56.921 | DEBUG    | __main__:trials:24 - Trial = 18733/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.923 | DEBUG    | __main__:trials:29 - Trial = 18733/30000 | Total reward = 44.90
2022-01-26 14:17:56.927 | DEBUG    | __main__:trials:24 - Trial = 18734/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.929 | DEBUG    | __main__:trials:29 - Trial = 18734/30000 | Total reward = 31.65
2022-01-26 14:17:56.932 | DEBUG    | __main__:trials:24 - Trial = 18735/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.933 | DEBUG    | __main__:trials:29 - Trial = 18735/30000 | Total reward = 42.67
2022-01-26 14:17:56.936 | DEBUG    | __main__:trials:24 - Trial = 18736/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.938 | DEBUG    | __main__:trials:29 - Trial = 18736/30000 | Total reward = 35.50
2022-01-26 14:17:56.942 | DEBUG    | __main__:trials:24 - Trial = 18737/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.944 | DEBUG    | __main__:trials:29 - Trial = 18737/30000 | Total reward = 44.76
2022-01-26 14:17:56.948 | DEBUG    | __main__:trials:24 - Trial = 18738/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.949 | DEBUG    | __main__:trials:29 - Trial = 18738/30000 | Total reward = 45.23
2022-01-26 14:17:56.952 | DEBUG    | __main__:trials:24 - Trial = 18739/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.953 | DEBUG    | __main__:trials:29 - Trial = 18739/30000 | Total reward = 35.86
2022-01-26 14:17:56.957 | DEBUG    | __main__:trials:24 - Trial = 18740/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.958 | DEBUG    | __main__:trials:29 - Trial = 18740/30000 | Total reward = 49.19
2022-01-26 14:17:56.962 | DEBUG    | __main__:trials:24 - Trial = 18741/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.964 | DEBUG    | __main__:trials:29 - Trial = 18741/30000 | Total reward = 28.40
2022-01-26 14:17:56.967 | DEBUG    | __main__:trials:24 - Trial = 18742/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.969 | DEBUG    | __main__:trials:29 - Trial = 18742/30000 | Total reward = 50.51
2022-01-26 14:17:56.972 | DEBUG    | __main__:trials:24 - Trial = 18743/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.974 | DEBUG    | __main__:trials:29 - Trial = 18743/30000 | Total reward = 43.22
2022-01-26 14:17:56.977 | DEBUG    | __main__:trials:24 - Trial = 18744/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.978 | DEBUG    | __main__:trials:29 - Trial = 18744/30000 | Total reward = 49.05
2022-01-26 14:17:56.981 | DEBUG    | __main__:trials:24 - Trial = 18745/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.982 | DEBUG    | __main__:trials:29 - Trial = 18745/30000 | Total reward = 48.47
2022-01-26 14:17:56.985 | DEBUG    | __main__:trials:24 - Trial = 18746/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.986 | DEBUG    | __main__:trials:29 - Trial = 18746/30000 | Total reward = 40.25
2022-01-26 14:17:56.990 | DEBUG    | __main__:trials:24 - Trial = 18747/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.991 | DEBUG    | __main__:trials:29 - Trial = 18747/30000 | Total reward = 35.02
2022-01-26 14:17:56.994 | DEBUG    | __main__:trials:24 - Trial = 18748/30000 | Max number of steps (20) reached
2022-01-26 14:17:56.996 | DEBUG    | __main__:trials:29 - Trial = 18748/30000 | Total reward = 48.19
2022-01-26 14:17:56.999 | DEBUG    | __main__:trials:24 - Trial = 18749/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.001 | DEBUG    | __main__:trials:29 - Trial = 18749/30000 | Total reward = 42.65
2022-01-26 14:17:57.004 | DEBUG    | __main__:trials:24 - Trial = 18750/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.006 | DEBUG    | __main__:trials:29 - Trial = 18750/30000 | Total reward = 37.11
2022-01-26 14:17:57.009 | DEBUG    | __main__:trials:24 - Trial = 18751/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.010 | DEBUG    | __main__:trials:29 - Trial = 18751/30000 | Total reward = 48.47
2022-01-26 14:17:57.013 | DEBUG    | __main__:trials:24 - Trial = 18752/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.015 | DEBUG    | __main__:trials:29 - Trial = 18752/30000 | Total reward = 46.10
2022-01-26 14:17:57.018 | DEBUG    | __main__:trials:24 - Trial = 18753/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.020 | DEBUG    | __main__:trials:29 - Trial = 18753/30000 | Total reward = 46.97
2022-01-26 14:17:57.023 | DEBUG    | __main__:trials:24 - Trial = 18754/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.025 | DEBUG    | __main__:trials:29 - Trial = 18754/30000 | Total reward = 46.13
2022-01-26 14:17:57.028 | DEBUG    | __main__:trials:24 - Trial = 18755/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.030 | DEBUG    | __main__:trials:29 - Trial = 18755/30000 | Total reward = 40.33
2022-01-26 14:17:57.034 | DEBUG    | __main__:trials:24 - Trial = 18756/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.035 | DEBUG    | __main__:trials:29 - Trial = 18756/30000 | Total reward = 37.58
2022-01-26 14:17:57.039 | DEBUG    | __main__:trials:26 - Trial = 18757/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.039 | DEBUG    | __main__:trials:29 - Trial = 18757/30000 | Total reward = 11.71
2022-01-26 14:17:57.043 | DEBUG    | __main__:trials:24 - Trial = 18758/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.045 | DEBUG    | __main__:trials:29 - Trial = 18758/30000 | Total reward = 39.42
2022-01-26 14:17:57.048 | DEBUG    | __main__:trials:24 - Trial = 18759/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.050 | DEBUG    | __main__:trials:29 - Trial = 18759/30000 | Total reward = 37.20
2022-01-26 14:17:57.054 | DEBUG    | __main__:trials:24 - Trial = 18760/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.056 | DEBUG    | __main__:trials:29 - Trial = 18760/30000 | Total reward = 53.37
2022-01-26 14:17:57.059 | DEBUG    | __main__:trials:24 - Trial = 18761/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.061 | DEBUG    | __main__:trials:29 - Trial = 18761/30000 | Total reward = 46.20
2022-01-26 14:17:57.064 | DEBUG    | __main__:trials:26 - Trial = 18762/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.066 | DEBUG    | __main__:trials:29 - Trial = 18762/30000 | Total reward = 12.71
2022-01-26 14:17:57.069 | DEBUG    | __main__:trials:26 - Trial = 18763/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.070 | DEBUG    | __main__:trials:29 - Trial = 18763/30000 | Total reward = 10.23
2022-01-26 14:17:57.074 | DEBUG    | __main__:trials:24 - Trial = 18764/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.076 | DEBUG    | __main__:trials:29 - Trial = 18764/30000 | Total reward = 37.94
2022-01-26 14:17:57.079 | DEBUG    | __main__:trials:24 - Trial = 18765/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.081 | DEBUG    | __main__:trials:29 - Trial = 18765/30000 | Total reward = 46.17
2022-01-26 14:17:57.084 | DEBUG    | __main__:trials:24 - Trial = 18766/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.086 | DEBUG    | __main__:trials:29 - Trial = 18766/30000 | Total reward = 42.66
2022-01-26 14:17:57.090 | DEBUG    | __main__:trials:24 - Trial = 18767/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.091 | DEBUG    | __main__:trials:29 - Trial = 18767/30000 | Total reward = 37.07
2022-01-26 14:17:57.095 | DEBUG    | __main__:trials:24 - Trial = 18768/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.096 | DEBUG    | __main__:trials:29 - Trial = 18768/30000 | Total reward = 33.03
2022-01-26 14:17:57.099 | DEBUG    | __main__:trials:26 - Trial = 18769/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.101 | DEBUG    | __main__:trials:29 - Trial = 18769/30000 | Total reward = 20.37
2022-01-26 14:17:57.104 | DEBUG    | __main__:trials:24 - Trial = 18770/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.106 | DEBUG    | __main__:trials:29 - Trial = 18770/30000 | Total reward = 43.00
2022-01-26 14:17:57.110 | DEBUG    | __main__:trials:24 - Trial = 18771/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.111 | DEBUG    | __main__:trials:29 - Trial = 18771/30000 | Total reward = 33.47
2022-01-26 14:17:57.114 | DEBUG    | __main__:trials:26 - Trial = 18772/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.115 | DEBUG    | __main__:trials:29 - Trial = 18772/30000 | Total reward = 9.91
2022-01-26 14:17:57.119 | DEBUG    | __main__:trials:24 - Trial = 18773/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.121 | DEBUG    | __main__:trials:29 - Trial = 18773/30000 | Total reward = 38.12
2022-01-26 14:17:57.125 | DEBUG    | __main__:trials:24 - Trial = 18774/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.126 | DEBUG    | __main__:trials:29 - Trial = 18774/30000 | Total reward = 37.16
2022-01-26 14:17:57.130 | DEBUG    | __main__:trials:24 - Trial = 18775/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.132 | DEBUG    | __main__:trials:29 - Trial = 18775/30000 | Total reward = 38.95
2022-01-26 14:17:57.135 | DEBUG    | __main__:trials:26 - Trial = 18776/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.137 | DEBUG    | __main__:trials:29 - Trial = 18776/30000 | Total reward = 18.21
2022-01-26 14:17:57.140 | DEBUG    | __main__:trials:24 - Trial = 18777/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.142 | DEBUG    | __main__:trials:29 - Trial = 18777/30000 | Total reward = 37.93
2022-01-26 14:17:57.146 | DEBUG    | __main__:trials:24 - Trial = 18778/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.147 | DEBUG    | __main__:trials:29 - Trial = 18778/30000 | Total reward = 38.89
2022-01-26 14:17:57.150 | DEBUG    | __main__:trials:24 - Trial = 18779/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.153 | DEBUG    | __main__:trials:29 - Trial = 18779/30000 | Total reward = 36.16
2022-01-26 14:17:57.156 | DEBUG    | __main__:trials:24 - Trial = 18780/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.158 | DEBUG    | __main__:trials:29 - Trial = 18780/30000 | Total reward = 23.88
2022-01-26 14:17:57.162 | DEBUG    | __main__:trials:24 - Trial = 18781/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.163 | DEBUG    | __main__:trials:29 - Trial = 18781/30000 | Total reward = 24.08
2022-01-26 14:17:57.167 | DEBUG    | __main__:trials:24 - Trial = 18782/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.168 | DEBUG    | __main__:trials:29 - Trial = 18782/30000 | Total reward = 37.65
2022-01-26 14:17:57.172 | DEBUG    | __main__:trials:24 - Trial = 18783/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.174 | DEBUG    | __main__:trials:29 - Trial = 18783/30000 | Total reward = 48.43
2022-01-26 14:17:57.177 | DEBUG    | __main__:trials:24 - Trial = 18784/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.179 | DEBUG    | __main__:trials:29 - Trial = 18784/30000 | Total reward = 37.93
2022-01-26 14:17:57.183 | DEBUG    | __main__:trials:24 - Trial = 18785/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.184 | DEBUG    | __main__:trials:29 - Trial = 18785/30000 | Total reward = 32.64
2022-01-26 14:17:57.188 | DEBUG    | __main__:trials:24 - Trial = 18786/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.190 | DEBUG    | __main__:trials:29 - Trial = 18786/30000 | Total reward = 52.09
2022-01-26 14:17:57.194 | DEBUG    | __main__:trials:24 - Trial = 18787/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.195 | DEBUG    | __main__:trials:29 - Trial = 18787/30000 | Total reward = 39.56
2022-01-26 14:17:57.198 | DEBUG    | __main__:trials:26 - Trial = 18788/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.199 | DEBUG    | __main__:trials:29 - Trial = 18788/30000 | Total reward = 13.05
2022-01-26 14:17:57.203 | DEBUG    | __main__:trials:24 - Trial = 18789/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.205 | DEBUG    | __main__:trials:29 - Trial = 18789/30000 | Total reward = 45.57
2022-01-26 14:17:57.208 | DEBUG    | __main__:trials:24 - Trial = 18790/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.210 | DEBUG    | __main__:trials:29 - Trial = 18790/30000 | Total reward = 38.80
2022-01-26 14:17:57.213 | DEBUG    | __main__:trials:24 - Trial = 18791/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.215 | DEBUG    | __main__:trials:29 - Trial = 18791/30000 | Total reward = 37.93
2022-01-26 14:17:57.218 | DEBUG    | __main__:trials:24 - Trial = 18792/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.220 | DEBUG    | __main__:trials:29 - Trial = 18792/30000 | Total reward = 39.93
2022-01-26 14:17:57.224 | DEBUG    | __main__:trials:24 - Trial = 18793/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.224 | DEBUG    | __main__:trials:29 - Trial = 18793/30000 | Total reward = 24.88
2022-01-26 14:17:57.228 | DEBUG    | __main__:trials:24 - Trial = 18794/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.230 | DEBUG    | __main__:trials:29 - Trial = 18794/30000 | Total reward = 51.77
2022-01-26 14:17:57.234 | DEBUG    | __main__:trials:24 - Trial = 18795/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.234 | DEBUG    | __main__:trials:29 - Trial = 18795/30000 | Total reward = 41.99
2022-01-26 14:17:57.238 | DEBUG    | __main__:trials:26 - Trial = 18796/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.240 | DEBUG    | __main__:trials:29 - Trial = 18796/30000 | Total reward = 30.01
2022-01-26 14:17:57.244 | DEBUG    | __main__:trials:24 - Trial = 18797/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.245 | DEBUG    | __main__:trials:29 - Trial = 18797/30000 | Total reward = 61.36
2022-01-26 14:17:57.249 | DEBUG    | __main__:trials:24 - Trial = 18798/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.251 | DEBUG    | __main__:trials:29 - Trial = 18798/30000 | Total reward = 53.29
2022-01-26 14:17:57.253 | DEBUG    | __main__:trials:26 - Trial = 18799/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.254 | DEBUG    | __main__:trials:29 - Trial = 18799/30000 | Total reward = 11.46
2022-01-26 14:17:57.258 | DEBUG    | __main__:trials:26 - Trial = 18800/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.259 | DEBUG    | __main__:trials:29 - Trial = 18800/30000 | Total reward = 27.81
2022-01-26 14:17:57.263 | DEBUG    | __main__:trials:24 - Trial = 18801/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.265 | DEBUG    | __main__:trials:29 - Trial = 18801/30000 | Total reward = 27.77
2022-01-26 14:17:57.268 | DEBUG    | __main__:trials:24 - Trial = 18802/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.270 | DEBUG    | __main__:trials:29 - Trial = 18802/30000 | Total reward = 64.08
2022-01-26 14:17:57.273 | DEBUG    | __main__:trials:24 - Trial = 18803/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.274 | DEBUG    | __main__:trials:29 - Trial = 18803/30000 | Total reward = 40.87
2022-01-26 14:17:57.278 | DEBUG    | __main__:trials:24 - Trial = 18804/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.280 | DEBUG    | __main__:trials:29 - Trial = 18804/30000 | Total reward = 39.19
2022-01-26 14:17:57.284 | DEBUG    | __main__:trials:24 - Trial = 18805/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.286 | DEBUG    | __main__:trials:29 - Trial = 18805/30000 | Total reward = 41.72
2022-01-26 14:17:57.289 | DEBUG    | __main__:trials:24 - Trial = 18806/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.291 | DEBUG    | __main__:trials:29 - Trial = 18806/30000 | Total reward = 43.41
2022-01-26 14:17:57.294 | DEBUG    | __main__:trials:24 - Trial = 18807/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.296 | DEBUG    | __main__:trials:29 - Trial = 18807/30000 | Total reward = 50.05
2022-01-26 14:17:57.300 | DEBUG    | __main__:trials:24 - Trial = 18808/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.301 | DEBUG    | __main__:trials:29 - Trial = 18808/30000 | Total reward = 40.87
2022-01-26 14:17:57.305 | DEBUG    | __main__:trials:24 - Trial = 18809/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.306 | DEBUG    | __main__:trials:29 - Trial = 18809/30000 | Total reward = 38.74
2022-01-26 14:17:57.310 | DEBUG    | __main__:trials:24 - Trial = 18810/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.312 | DEBUG    | __main__:trials:29 - Trial = 18810/30000 | Total reward = 38.17
2022-01-26 14:17:57.314 | DEBUG    | __main__:trials:26 - Trial = 18811/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.316 | DEBUG    | __main__:trials:29 - Trial = 18811/30000 | Total reward = 11.46
2022-01-26 14:17:57.320 | DEBUG    | __main__:trials:24 - Trial = 18812/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.320 | DEBUG    | __main__:trials:29 - Trial = 18812/30000 | Total reward = 37.40
2022-01-26 14:17:57.324 | DEBUG    | __main__:trials:24 - Trial = 18813/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.326 | DEBUG    | __main__:trials:29 - Trial = 18813/30000 | Total reward = 43.52
2022-01-26 14:17:57.330 | DEBUG    | __main__:trials:26 - Trial = 18814/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.331 | DEBUG    | __main__:trials:29 - Trial = 18814/30000 | Total reward = 24.26
2022-01-26 14:17:57.335 | DEBUG    | __main__:trials:26 - Trial = 18815/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.336 | DEBUG    | __main__:trials:29 - Trial = 18815/30000 | Total reward = 27.49
2022-01-26 14:17:57.339 | DEBUG    | __main__:trials:26 - Trial = 18816/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.341 | DEBUG    | __main__:trials:29 - Trial = 18816/30000 | Total reward = 16.71
2022-01-26 14:17:57.343 | DEBUG    | __main__:trials:26 - Trial = 18817/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.345 | DEBUG    | __main__:trials:29 - Trial = 18817/30000 | Total reward = 13.05
2022-01-26 14:17:57.348 | DEBUG    | __main__:trials:24 - Trial = 18818/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.350 | DEBUG    | __main__:trials:29 - Trial = 18818/30000 | Total reward = 46.45
2022-01-26 14:17:57.354 | DEBUG    | __main__:trials:24 - Trial = 18819/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.354 | DEBUG    | __main__:trials:29 - Trial = 18819/30000 | Total reward = 38.17
2022-01-26 14:17:57.358 | DEBUG    | __main__:trials:24 - Trial = 18820/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.360 | DEBUG    | __main__:trials:29 - Trial = 18820/30000 | Total reward = 42.33
2022-01-26 14:17:57.364 | DEBUG    | __main__:trials:24 - Trial = 18821/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.364 | DEBUG    | __main__:trials:29 - Trial = 18821/30000 | Total reward = 43.22
2022-01-26 14:17:57.368 | DEBUG    | __main__:trials:24 - Trial = 18822/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.370 | DEBUG    | __main__:trials:29 - Trial = 18822/30000 | Total reward = 39.88
2022-01-26 14:17:57.373 | DEBUG    | __main__:trials:24 - Trial = 18823/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.375 | DEBUG    | __main__:trials:29 - Trial = 18823/30000 | Total reward = 38.25
2022-01-26 14:17:57.379 | DEBUG    | __main__:trials:24 - Trial = 18824/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.380 | DEBUG    | __main__:trials:29 - Trial = 18824/30000 | Total reward = 39.88
2022-01-26 14:17:57.384 | DEBUG    | __main__:trials:24 - Trial = 18825/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.385 | DEBUG    | __main__:trials:29 - Trial = 18825/30000 | Total reward = 42.19
2022-01-26 14:17:57.389 | DEBUG    | __main__:trials:26 - Trial = 18826/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.390 | DEBUG    | __main__:trials:29 - Trial = 18826/30000 | Total reward = 25.85
2022-01-26 14:17:57.394 | DEBUG    | __main__:trials:24 - Trial = 18827/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.395 | DEBUG    | __main__:trials:29 - Trial = 18827/30000 | Total reward = 37.93
2022-01-26 14:17:57.398 | DEBUG    | __main__:trials:26 - Trial = 18828/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.399 | DEBUG    | __main__:trials:29 - Trial = 18828/30000 | Total reward = 11.46
2022-01-26 14:17:57.402 | DEBUG    | __main__:trials:24 - Trial = 18829/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.404 | DEBUG    | __main__:trials:29 - Trial = 18829/30000 | Total reward = 38.88
2022-01-26 14:17:57.408 | DEBUG    | __main__:trials:26 - Trial = 18830/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.409 | DEBUG    | __main__:trials:29 - Trial = 18830/30000 | Total reward = 31.73
2022-01-26 14:17:57.413 | DEBUG    | __main__:trials:24 - Trial = 18831/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.414 | DEBUG    | __main__:trials:29 - Trial = 18831/30000 | Total reward = 35.60
2022-01-26 14:17:57.418 | DEBUG    | __main__:trials:24 - Trial = 18832/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.419 | DEBUG    | __main__:trials:29 - Trial = 18832/30000 | Total reward = 42.92
2022-01-26 14:17:57.423 | DEBUG    | __main__:trials:24 - Trial = 18833/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.425 | DEBUG    | __main__:trials:29 - Trial = 18833/30000 | Total reward = 47.07
2022-01-26 14:17:57.429 | DEBUG    | __main__:trials:24 - Trial = 18834/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.430 | DEBUG    | __main__:trials:29 - Trial = 18834/30000 | Total reward = 42.11
2022-01-26 14:17:57.434 | DEBUG    | __main__:trials:24 - Trial = 18835/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.435 | DEBUG    | __main__:trials:29 - Trial = 18835/30000 | Total reward = 48.74
2022-01-26 14:17:57.437 | DEBUG    | __main__:trials:26 - Trial = 18836/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.438 | DEBUG    | __main__:trials:29 - Trial = 18836/30000 | Total reward = 9.40
2022-01-26 14:17:57.441 | DEBUG    | __main__:trials:24 - Trial = 18837/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.442 | DEBUG    | __main__:trials:29 - Trial = 18837/30000 | Total reward = 35.86
2022-01-26 14:17:57.445 | DEBUG    | __main__:trials:24 - Trial = 18838/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.447 | DEBUG    | __main__:trials:29 - Trial = 18838/30000 | Total reward = 35.81
2022-01-26 14:17:57.451 | DEBUG    | __main__:trials:24 - Trial = 18839/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.451 | DEBUG    | __main__:trials:29 - Trial = 18839/30000 | Total reward = 48.32
2022-01-26 14:17:57.454 | DEBUG    | __main__:trials:26 - Trial = 18840/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.456 | DEBUG    | __main__:trials:29 - Trial = 18840/30000 | Total reward = 12.58
2022-01-26 14:17:57.460 | DEBUG    | __main__:trials:24 - Trial = 18841/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.462 | DEBUG    | __main__:trials:29 - Trial = 18841/30000 | Total reward = 63.47
2022-01-26 14:17:57.465 | DEBUG    | __main__:trials:24 - Trial = 18842/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.467 | DEBUG    | __main__:trials:29 - Trial = 18842/30000 | Total reward = 34.94
2022-01-26 14:17:57.470 | DEBUG    | __main__:trials:24 - Trial = 18843/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.472 | DEBUG    | __main__:trials:29 - Trial = 18843/30000 | Total reward = 49.50
2022-01-26 14:17:57.476 | DEBUG    | __main__:trials:24 - Trial = 18844/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.477 | DEBUG    | __main__:trials:29 - Trial = 18844/30000 | Total reward = 49.19
2022-01-26 14:17:57.481 | DEBUG    | __main__:trials:24 - Trial = 18845/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.482 | DEBUG    | __main__:trials:29 - Trial = 18845/30000 | Total reward = 37.75
2022-01-26 14:17:57.486 | DEBUG    | __main__:trials:24 - Trial = 18846/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.487 | DEBUG    | __main__:trials:29 - Trial = 18846/30000 | Total reward = 35.74
2022-01-26 14:17:57.490 | DEBUG    | __main__:trials:26 - Trial = 18847/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.492 | DEBUG    | __main__:trials:29 - Trial = 18847/30000 | Total reward = 14.96
2022-01-26 14:17:57.495 | DEBUG    | __main__:trials:24 - Trial = 18848/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.497 | DEBUG    | __main__:trials:29 - Trial = 18848/30000 | Total reward = 37.98
2022-01-26 14:17:57.499 | DEBUG    | __main__:trials:26 - Trial = 18849/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.501 | DEBUG    | __main__:trials:29 - Trial = 18849/30000 | Total reward = 14.71
2022-01-26 14:17:57.504 | DEBUG    | __main__:trials:24 - Trial = 18850/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.506 | DEBUG    | __main__:trials:29 - Trial = 18850/30000 | Total reward = 51.59
2022-01-26 14:17:57.510 | DEBUG    | __main__:trials:24 - Trial = 18851/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.511 | DEBUG    | __main__:trials:29 - Trial = 18851/30000 | Total reward = 37.03
2022-01-26 14:17:57.515 | DEBUG    | __main__:trials:24 - Trial = 18852/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.516 | DEBUG    | __main__:trials:29 - Trial = 18852/30000 | Total reward = 55.16
2022-01-26 14:17:57.519 | DEBUG    | __main__:trials:26 - Trial = 18853/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.520 | DEBUG    | __main__:trials:29 - Trial = 18853/30000 | Total reward = 13.12
2022-01-26 14:17:57.524 | DEBUG    | __main__:trials:24 - Trial = 18854/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.526 | DEBUG    | __main__:trials:29 - Trial = 18854/30000 | Total reward = 27.38
2022-01-26 14:17:57.529 | DEBUG    | __main__:trials:24 - Trial = 18855/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.531 | DEBUG    | __main__:trials:29 - Trial = 18855/30000 | Total reward = 45.76
2022-01-26 14:17:57.534 | DEBUG    | __main__:trials:26 - Trial = 18856/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.535 | DEBUG    | __main__:trials:29 - Trial = 18856/30000 | Total reward = 17.84
2022-01-26 14:17:57.538 | DEBUG    | __main__:trials:26 - Trial = 18857/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.540 | DEBUG    | __main__:trials:29 - Trial = 18857/30000 | Total reward = 10.56
2022-01-26 14:17:57.543 | DEBUG    | __main__:trials:24 - Trial = 18858/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.545 | DEBUG    | __main__:trials:29 - Trial = 18858/30000 | Total reward = 52.94
2022-01-26 14:17:57.548 | DEBUG    | __main__:trials:24 - Trial = 18859/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.550 | DEBUG    | __main__:trials:29 - Trial = 18859/30000 | Total reward = 37.55
2022-01-26 14:17:57.553 | DEBUG    | __main__:trials:24 - Trial = 18860/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.555 | DEBUG    | __main__:trials:29 - Trial = 18860/30000 | Total reward = 37.55
2022-01-26 14:17:57.559 | DEBUG    | __main__:trials:24 - Trial = 18861/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.560 | DEBUG    | __main__:trials:29 - Trial = 18861/30000 | Total reward = 38.25
2022-01-26 14:17:57.564 | DEBUG    | __main__:trials:24 - Trial = 18862/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.566 | DEBUG    | __main__:trials:29 - Trial = 18862/30000 | Total reward = 39.61
2022-01-26 14:17:57.569 | DEBUG    | __main__:trials:24 - Trial = 18863/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.570 | DEBUG    | __main__:trials:29 - Trial = 18863/30000 | Total reward = 50.73
2022-01-26 14:17:57.574 | DEBUG    | __main__:trials:24 - Trial = 18864/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.575 | DEBUG    | __main__:trials:29 - Trial = 18864/30000 | Total reward = 37.41
2022-01-26 14:17:57.579 | DEBUG    | __main__:trials:24 - Trial = 18865/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.580 | DEBUG    | __main__:trials:29 - Trial = 18865/30000 | Total reward = 33.99
2022-01-26 14:17:57.584 | DEBUG    | __main__:trials:24 - Trial = 18866/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.585 | DEBUG    | __main__:trials:29 - Trial = 18866/30000 | Total reward = 37.00
2022-01-26 14:17:57.589 | DEBUG    | __main__:trials:24 - Trial = 18867/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.590 | DEBUG    | __main__:trials:29 - Trial = 18867/30000 | Total reward = 34.94
2022-01-26 14:17:57.594 | DEBUG    | __main__:trials:24 - Trial = 18868/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.595 | DEBUG    | __main__:trials:29 - Trial = 18868/30000 | Total reward = 38.76
2022-01-26 14:17:57.599 | DEBUG    | __main__:trials:24 - Trial = 18869/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.601 | DEBUG    | __main__:trials:29 - Trial = 18869/30000 | Total reward = 48.80
2022-01-26 14:17:57.604 | DEBUG    | __main__:trials:24 - Trial = 18870/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.606 | DEBUG    | __main__:trials:29 - Trial = 18870/30000 | Total reward = 51.19
2022-01-26 14:17:57.610 | DEBUG    | __main__:trials:24 - Trial = 18871/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.611 | DEBUG    | __main__:trials:29 - Trial = 18871/30000 | Total reward = 37.19
2022-01-26 14:17:57.615 | DEBUG    | __main__:trials:24 - Trial = 18872/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.617 | DEBUG    | __main__:trials:29 - Trial = 18872/30000 | Total reward = 29.59
2022-01-26 14:17:57.620 | DEBUG    | __main__:trials:24 - Trial = 18873/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.622 | DEBUG    | __main__:trials:29 - Trial = 18873/30000 | Total reward = 22.70
2022-01-26 14:17:57.625 | DEBUG    | __main__:trials:24 - Trial = 18874/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.627 | DEBUG    | __main__:trials:29 - Trial = 18874/30000 | Total reward = 29.43
2022-01-26 14:17:57.630 | DEBUG    | __main__:trials:24 - Trial = 18875/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.632 | DEBUG    | __main__:trials:29 - Trial = 18875/30000 | Total reward = 39.21
2022-01-26 14:17:57.635 | DEBUG    | __main__:trials:24 - Trial = 18876/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.637 | DEBUG    | __main__:trials:29 - Trial = 18876/30000 | Total reward = 44.22
2022-01-26 14:17:57.641 | DEBUG    | __main__:trials:24 - Trial = 18877/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.642 | DEBUG    | __main__:trials:29 - Trial = 18877/30000 | Total reward = 46.02
2022-01-26 14:17:57.646 | DEBUG    | __main__:trials:24 - Trial = 18878/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.648 | DEBUG    | __main__:trials:29 - Trial = 18878/30000 | Total reward = 52.04
2022-01-26 14:17:57.651 | DEBUG    | __main__:trials:24 - Trial = 18879/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.653 | DEBUG    | __main__:trials:29 - Trial = 18879/30000 | Total reward = 38.64
2022-01-26 14:17:57.657 | DEBUG    | __main__:trials:24 - Trial = 18880/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.658 | DEBUG    | __main__:trials:29 - Trial = 18880/30000 | Total reward = 37.83
2022-01-26 14:17:57.661 | DEBUG    | __main__:trials:24 - Trial = 18881/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.663 | DEBUG    | __main__:trials:29 - Trial = 18881/30000 | Total reward = 39.12
2022-01-26 14:17:57.668 | DEBUG    | __main__:trials:24 - Trial = 18882/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.669 | DEBUG    | __main__:trials:29 - Trial = 18882/30000 | Total reward = 41.05
2022-01-26 14:17:57.673 | DEBUG    | __main__:trials:24 - Trial = 18883/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.675 | DEBUG    | __main__:trials:29 - Trial = 18883/30000 | Total reward = 43.29
2022-01-26 14:17:57.679 | DEBUG    | __main__:trials:24 - Trial = 18884/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.680 | DEBUG    | __main__:trials:29 - Trial = 18884/30000 | Total reward = 45.73
2022-01-26 14:17:57.684 | DEBUG    | __main__:trials:24 - Trial = 18885/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.686 | DEBUG    | __main__:trials:29 - Trial = 18885/30000 | Total reward = 49.72
2022-01-26 14:17:57.689 | DEBUG    | __main__:trials:24 - Trial = 18886/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.691 | DEBUG    | __main__:trials:29 - Trial = 18886/30000 | Total reward = 49.72
2022-01-26 14:17:57.695 | DEBUG    | __main__:trials:24 - Trial = 18887/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.696 | DEBUG    | __main__:trials:29 - Trial = 18887/30000 | Total reward = 52.45
2022-01-26 14:17:57.700 | DEBUG    | __main__:trials:24 - Trial = 18888/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.701 | DEBUG    | __main__:trials:29 - Trial = 18888/30000 | Total reward = 28.43
2022-01-26 14:17:57.705 | DEBUG    | __main__:trials:24 - Trial = 18889/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.706 | DEBUG    | __main__:trials:29 - Trial = 18889/30000 | Total reward = 37.11
2022-01-26 14:17:57.710 | DEBUG    | __main__:trials:24 - Trial = 18890/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.710 | DEBUG    | __main__:trials:29 - Trial = 18890/30000 | Total reward = 40.08
2022-01-26 14:17:57.714 | DEBUG    | __main__:trials:24 - Trial = 18891/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.715 | DEBUG    | __main__:trials:29 - Trial = 18891/30000 | Total reward = 39.63
2022-01-26 14:17:57.719 | DEBUG    | __main__:trials:24 - Trial = 18892/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.721 | DEBUG    | __main__:trials:29 - Trial = 18892/30000 | Total reward = 47.23
2022-01-26 14:17:57.724 | DEBUG    | __main__:trials:24 - Trial = 18893/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.726 | DEBUG    | __main__:trials:29 - Trial = 18893/30000 | Total reward = 58.36
2022-01-26 14:17:57.730 | DEBUG    | __main__:trials:24 - Trial = 18894/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.731 | DEBUG    | __main__:trials:29 - Trial = 18894/30000 | Total reward = 59.03
2022-01-26 14:17:57.735 | DEBUG    | __main__:trials:24 - Trial = 18895/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.737 | DEBUG    | __main__:trials:29 - Trial = 18895/30000 | Total reward = 40.78
2022-01-26 14:17:57.740 | DEBUG    | __main__:trials:24 - Trial = 18896/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.742 | DEBUG    | __main__:trials:29 - Trial = 18896/30000 | Total reward = 48.56
2022-01-26 14:17:57.746 | DEBUG    | __main__:trials:24 - Trial = 18897/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.747 | DEBUG    | __main__:trials:29 - Trial = 18897/30000 | Total reward = 40.42
2022-01-26 14:17:57.751 | DEBUG    | __main__:trials:24 - Trial = 18898/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.753 | DEBUG    | __main__:trials:29 - Trial = 18898/30000 | Total reward = 38.99
2022-01-26 14:17:57.756 | DEBUG    | __main__:trials:24 - Trial = 18899/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.758 | DEBUG    | __main__:trials:29 - Trial = 18899/30000 | Total reward = 53.58
2022-01-26 14:17:57.762 | DEBUG    | __main__:trials:24 - Trial = 18900/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.763 | DEBUG    | __main__:trials:29 - Trial = 18900/30000 | Total reward = 52.90
2022-01-26 14:17:57.767 | DEBUG    | __main__:trials:24 - Trial = 18901/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.769 | DEBUG    | __main__:trials:29 - Trial = 18901/30000 | Total reward = 50.24
2022-01-26 14:17:57.773 | DEBUG    | __main__:trials:24 - Trial = 18902/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.774 | DEBUG    | __main__:trials:29 - Trial = 18902/30000 | Total reward = 59.99
2022-01-26 14:17:57.778 | DEBUG    | __main__:trials:24 - Trial = 18903/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.780 | DEBUG    | __main__:trials:29 - Trial = 18903/30000 | Total reward = 53.56
2022-01-26 14:17:57.783 | DEBUG    | __main__:trials:24 - Trial = 18904/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.785 | DEBUG    | __main__:trials:29 - Trial = 18904/30000 | Total reward = 49.72
2022-01-26 14:17:57.789 | DEBUG    | __main__:trials:24 - Trial = 18905/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.790 | DEBUG    | __main__:trials:29 - Trial = 18905/30000 | Total reward = 52.71
2022-01-26 14:17:57.794 | DEBUG    | __main__:trials:24 - Trial = 18906/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.795 | DEBUG    | __main__:trials:29 - Trial = 18906/30000 | Total reward = 47.68
2022-01-26 14:17:57.799 | DEBUG    | __main__:trials:24 - Trial = 18907/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.801 | DEBUG    | __main__:trials:29 - Trial = 18907/30000 | Total reward = 49.26
2022-01-26 14:17:57.805 | DEBUG    | __main__:trials:24 - Trial = 18908/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.806 | DEBUG    | __main__:trials:29 - Trial = 18908/30000 | Total reward = 28.14
2022-01-26 14:17:57.809 | DEBUG    | __main__:trials:24 - Trial = 18909/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.810 | DEBUG    | __main__:trials:29 - Trial = 18909/30000 | Total reward = 48.55
2022-01-26 14:17:57.813 | DEBUG    | __main__:trials:24 - Trial = 18910/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.815 | DEBUG    | __main__:trials:29 - Trial = 18910/30000 | Total reward = 55.86
2022-01-26 14:17:57.818 | DEBUG    | __main__:trials:24 - Trial = 18911/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.820 | DEBUG    | __main__:trials:29 - Trial = 18911/30000 | Total reward = 54.22
2022-01-26 14:17:57.823 | DEBUG    | __main__:trials:24 - Trial = 18912/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.825 | DEBUG    | __main__:trials:29 - Trial = 18912/30000 | Total reward = 49.72
2022-01-26 14:17:57.828 | DEBUG    | __main__:trials:24 - Trial = 18913/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.830 | DEBUG    | __main__:trials:29 - Trial = 18913/30000 | Total reward = 49.37
2022-01-26 14:17:57.834 | DEBUG    | __main__:trials:24 - Trial = 18914/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.836 | DEBUG    | __main__:trials:29 - Trial = 18914/30000 | Total reward = 49.98
2022-01-26 14:17:57.839 | DEBUG    | __main__:trials:24 - Trial = 18915/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.841 | DEBUG    | __main__:trials:29 - Trial = 18915/30000 | Total reward = 43.83
2022-01-26 14:17:57.845 | DEBUG    | __main__:trials:24 - Trial = 18916/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.846 | DEBUG    | __main__:trials:29 - Trial = 18916/30000 | Total reward = 39.78
2022-01-26 14:17:57.851 | DEBUG    | __main__:trials:24 - Trial = 18917/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.851 | DEBUG    | __main__:trials:29 - Trial = 18917/30000 | Total reward = 49.57
2022-01-26 14:17:57.856 | DEBUG    | __main__:trials:24 - Trial = 18918/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.857 | DEBUG    | __main__:trials:29 - Trial = 18918/30000 | Total reward = 49.05
2022-01-26 14:17:57.861 | DEBUG    | __main__:trials:24 - Trial = 18919/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.863 | DEBUG    | __main__:trials:29 - Trial = 18919/30000 | Total reward = 57.28
2022-01-26 14:17:57.866 | DEBUG    | __main__:trials:24 - Trial = 18920/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.868 | DEBUG    | __main__:trials:29 - Trial = 18920/30000 | Total reward = 65.60
2022-01-26 14:17:57.871 | DEBUG    | __main__:trials:24 - Trial = 18921/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.873 | DEBUG    | __main__:trials:29 - Trial = 18921/30000 | Total reward = 43.17
2022-01-26 14:17:57.876 | DEBUG    | __main__:trials:24 - Trial = 18922/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.878 | DEBUG    | __main__:trials:29 - Trial = 18922/30000 | Total reward = 41.07
2022-01-26 14:17:57.881 | DEBUG    | __main__:trials:24 - Trial = 18923/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.883 | DEBUG    | __main__:trials:29 - Trial = 18923/30000 | Total reward = 44.75
2022-01-26 14:17:57.887 | DEBUG    | __main__:trials:24 - Trial = 18924/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.889 | DEBUG    | __main__:trials:29 - Trial = 18924/30000 | Total reward = 48.49
2022-01-26 14:17:57.892 | DEBUG    | __main__:trials:24 - Trial = 18925/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.893 | DEBUG    | __main__:trials:29 - Trial = 18925/30000 | Total reward = 50.24
2022-01-26 14:17:57.898 | DEBUG    | __main__:trials:24 - Trial = 18926/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.899 | DEBUG    | __main__:trials:29 - Trial = 18926/30000 | Total reward = 48.47
2022-01-26 14:17:57.903 | DEBUG    | __main__:trials:24 - Trial = 18927/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.905 | DEBUG    | __main__:trials:29 - Trial = 18927/30000 | Total reward = 37.79
2022-01-26 14:17:57.908 | DEBUG    | __main__:trials:24 - Trial = 18928/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.910 | DEBUG    | __main__:trials:29 - Trial = 18928/30000 | Total reward = 50.90
2022-01-26 14:17:57.914 | DEBUG    | __main__:trials:24 - Trial = 18929/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.915 | DEBUG    | __main__:trials:29 - Trial = 18929/30000 | Total reward = 33.13
2022-01-26 14:17:57.919 | DEBUG    | __main__:trials:24 - Trial = 18930/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.920 | DEBUG    | __main__:trials:29 - Trial = 18930/30000 | Total reward = 37.43
2022-01-26 14:17:57.923 | DEBUG    | __main__:trials:26 - Trial = 18931/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.924 | DEBUG    | __main__:trials:29 - Trial = 18931/30000 | Total reward = 13.05
2022-01-26 14:17:57.928 | DEBUG    | __main__:trials:24 - Trial = 18932/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.929 | DEBUG    | __main__:trials:29 - Trial = 18932/30000 | Total reward = 49.44
2022-01-26 14:17:57.932 | DEBUG    | __main__:trials:24 - Trial = 18933/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.933 | DEBUG    | __main__:trials:29 - Trial = 18933/30000 | Total reward = 40.41
2022-01-26 14:17:57.936 | DEBUG    | __main__:trials:24 - Trial = 18934/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.937 | DEBUG    | __main__:trials:29 - Trial = 18934/30000 | Total reward = 39.75
2022-01-26 14:17:57.941 | DEBUG    | __main__:trials:24 - Trial = 18935/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.941 | DEBUG    | __main__:trials:29 - Trial = 18935/30000 | Total reward = 49.20
2022-01-26 14:17:57.944 | DEBUG    | __main__:trials:26 - Trial = 18936/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.946 | DEBUG    | __main__:trials:29 - Trial = 18936/30000 | Total reward = 9.81
2022-01-26 14:17:57.950 | DEBUG    | __main__:trials:24 - Trial = 18937/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.951 | DEBUG    | __main__:trials:29 - Trial = 18937/30000 | Total reward = 49.31
2022-01-26 14:17:57.954 | DEBUG    | __main__:trials:24 - Trial = 18938/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.956 | DEBUG    | __main__:trials:29 - Trial = 18938/30000 | Total reward = 45.90
2022-01-26 14:17:57.960 | DEBUG    | __main__:trials:24 - Trial = 18939/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.961 | DEBUG    | __main__:trials:29 - Trial = 18939/30000 | Total reward = 22.71
2022-01-26 14:17:57.965 | DEBUG    | __main__:trials:24 - Trial = 18940/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.965 | DEBUG    | __main__:trials:29 - Trial = 18940/30000 | Total reward = 42.64
2022-01-26 14:17:57.969 | DEBUG    | __main__:trials:24 - Trial = 18941/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.970 | DEBUG    | __main__:trials:29 - Trial = 18941/30000 | Total reward = 37.93
2022-01-26 14:17:57.974 | DEBUG    | __main__:trials:24 - Trial = 18942/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.976 | DEBUG    | __main__:trials:29 - Trial = 18942/30000 | Total reward = 37.93
2022-01-26 14:17:57.978 | DEBUG    | __main__:trials:26 - Trial = 18943/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.979 | DEBUG    | __main__:trials:29 - Trial = 18943/30000 | Total reward = 15.74
2022-01-26 14:17:57.983 | DEBUG    | __main__:trials:24 - Trial = 18944/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.984 | DEBUG    | __main__:trials:29 - Trial = 18944/30000 | Total reward = 33.52
2022-01-26 14:17:57.987 | DEBUG    | __main__:trials:26 - Trial = 18945/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:57.989 | DEBUG    | __main__:trials:29 - Trial = 18945/30000 | Total reward = 16.10
2022-01-26 14:17:57.992 | DEBUG    | __main__:trials:24 - Trial = 18946/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.994 | DEBUG    | __main__:trials:29 - Trial = 18946/30000 | Total reward = 57.25
2022-01-26 14:17:57.997 | DEBUG    | __main__:trials:24 - Trial = 18947/30000 | Max number of steps (20) reached
2022-01-26 14:17:57.999 | DEBUG    | __main__:trials:29 - Trial = 18947/30000 | Total reward = 48.75
2022-01-26 14:17:58.002 | DEBUG    | __main__:trials:24 - Trial = 18948/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.004 | DEBUG    | __main__:trials:29 - Trial = 18948/30000 | Total reward = 33.28
2022-01-26 14:17:58.008 | DEBUG    | __main__:trials:24 - Trial = 18949/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.009 | DEBUG    | __main__:trials:29 - Trial = 18949/30000 | Total reward = 37.20
2022-01-26 14:17:58.012 | DEBUG    | __main__:trials:24 - Trial = 18950/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.014 | DEBUG    | __main__:trials:29 - Trial = 18950/30000 | Total reward = 39.33
2022-01-26 14:17:58.017 | DEBUG    | __main__:trials:24 - Trial = 18951/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.019 | DEBUG    | __main__:trials:29 - Trial = 18951/30000 | Total reward = 49.41
2022-01-26 14:17:58.022 | DEBUG    | __main__:trials:24 - Trial = 18952/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.022 | DEBUG    | __main__:trials:29 - Trial = 18952/30000 | Total reward = 37.93
2022-01-26 14:17:58.026 | DEBUG    | __main__:trials:24 - Trial = 18953/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.028 | DEBUG    | __main__:trials:29 - Trial = 18953/30000 | Total reward = 35.23
2022-01-26 14:17:58.029 | DEBUG    | __main__:trials:26 - Trial = 18954/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.030 | DEBUG    | __main__:trials:29 - Trial = 18954/30000 | Total reward = 13.05
2022-01-26 14:17:58.033 | DEBUG    | __main__:trials:24 - Trial = 18955/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.034 | DEBUG    | __main__:trials:29 - Trial = 18955/30000 | Total reward = 33.53
2022-01-26 14:17:58.037 | DEBUG    | __main__:trials:24 - Trial = 18956/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.039 | DEBUG    | __main__:trials:29 - Trial = 18956/30000 | Total reward = 37.89
2022-01-26 14:17:58.042 | DEBUG    | __main__:trials:24 - Trial = 18957/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.044 | DEBUG    | __main__:trials:29 - Trial = 18957/30000 | Total reward = 39.25
2022-01-26 14:17:58.047 | DEBUG    | __main__:trials:24 - Trial = 18958/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.049 | DEBUG    | __main__:trials:29 - Trial = 18958/30000 | Total reward = 46.17
2022-01-26 14:17:58.052 | DEBUG    | __main__:trials:24 - Trial = 18959/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.053 | DEBUG    | __main__:trials:29 - Trial = 18959/30000 | Total reward = 27.36
2022-01-26 14:17:58.057 | DEBUG    | __main__:trials:24 - Trial = 18960/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.059 | DEBUG    | __main__:trials:29 - Trial = 18960/30000 | Total reward = 37.55
2022-01-26 14:17:58.062 | DEBUG    | __main__:trials:24 - Trial = 18961/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.064 | DEBUG    | __main__:trials:29 - Trial = 18961/30000 | Total reward = 48.63
2022-01-26 14:17:58.068 | DEBUG    | __main__:trials:24 - Trial = 18962/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.069 | DEBUG    | __main__:trials:29 - Trial = 18962/30000 | Total reward = 54.15
2022-01-26 14:17:58.073 | DEBUG    | __main__:trials:24 - Trial = 18963/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.074 | DEBUG    | __main__:trials:29 - Trial = 18963/30000 | Total reward = 32.89
2022-01-26 14:17:58.079 | DEBUG    | __main__:trials:24 - Trial = 18964/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.080 | DEBUG    | __main__:trials:29 - Trial = 18964/30000 | Total reward = 36.47
2022-01-26 14:17:58.084 | DEBUG    | __main__:trials:26 - Trial = 18965/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.084 | DEBUG    | __main__:trials:29 - Trial = 18965/30000 | Total reward = 19.07
2022-01-26 14:17:58.088 | DEBUG    | __main__:trials:24 - Trial = 18966/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.089 | DEBUG    | __main__:trials:29 - Trial = 18966/30000 | Total reward = 37.30
2022-01-26 14:17:58.093 | DEBUG    | __main__:trials:24 - Trial = 18967/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.094 | DEBUG    | __main__:trials:29 - Trial = 18967/30000 | Total reward = 56.44
2022-01-26 14:17:58.097 | DEBUG    | __main__:trials:24 - Trial = 18968/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.098 | DEBUG    | __main__:trials:29 - Trial = 18968/30000 | Total reward = 42.54
2022-01-26 14:17:58.101 | DEBUG    | __main__:trials:24 - Trial = 18969/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.103 | DEBUG    | __main__:trials:29 - Trial = 18969/30000 | Total reward = 50.51
2022-01-26 14:17:58.106 | DEBUG    | __main__:trials:24 - Trial = 18970/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.107 | DEBUG    | __main__:trials:29 - Trial = 18970/30000 | Total reward = 38.55
2022-01-26 14:17:58.111 | DEBUG    | __main__:trials:24 - Trial = 18971/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.112 | DEBUG    | __main__:trials:29 - Trial = 18971/30000 | Total reward = 35.44
2022-01-26 14:17:58.116 | DEBUG    | __main__:trials:24 - Trial = 18972/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.118 | DEBUG    | __main__:trials:29 - Trial = 18972/30000 | Total reward = 35.68
2022-01-26 14:17:58.121 | DEBUG    | __main__:trials:24 - Trial = 18973/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.122 | DEBUG    | __main__:trials:29 - Trial = 18973/30000 | Total reward = 48.69
2022-01-26 14:17:58.127 | DEBUG    | __main__:trials:24 - Trial = 18974/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.128 | DEBUG    | __main__:trials:29 - Trial = 18974/30000 | Total reward = 36.05
2022-01-26 14:17:58.132 | DEBUG    | __main__:trials:24 - Trial = 18975/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.134 | DEBUG    | __main__:trials:29 - Trial = 18975/30000 | Total reward = 44.06
2022-01-26 14:17:58.137 | DEBUG    | __main__:trials:26 - Trial = 18976/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.138 | DEBUG    | __main__:trials:29 - Trial = 18976/30000 | Total reward = 22.26
2022-01-26 14:17:58.142 | DEBUG    | __main__:trials:24 - Trial = 18977/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.144 | DEBUG    | __main__:trials:29 - Trial = 18977/30000 | Total reward = 43.19
2022-01-26 14:17:58.147 | DEBUG    | __main__:trials:24 - Trial = 18978/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.149 | DEBUG    | __main__:trials:29 - Trial = 18978/30000 | Total reward = 49.34
2022-01-26 14:17:58.153 | DEBUG    | __main__:trials:24 - Trial = 18979/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.153 | DEBUG    | __main__:trials:29 - Trial = 18979/30000 | Total reward = 52.73
2022-01-26 14:17:58.158 | DEBUG    | __main__:trials:24 - Trial = 18980/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.159 | DEBUG    | __main__:trials:29 - Trial = 18980/30000 | Total reward = 55.59
2022-01-26 14:17:58.162 | DEBUG    | __main__:trials:26 - Trial = 18981/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.163 | DEBUG    | __main__:trials:29 - Trial = 18981/30000 | Total reward = 14.57
2022-01-26 14:17:58.167 | DEBUG    | __main__:trials:24 - Trial = 18982/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.168 | DEBUG    | __main__:trials:29 - Trial = 18982/30000 | Total reward = 49.43
2022-01-26 14:17:58.171 | DEBUG    | __main__:trials:24 - Trial = 18983/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.173 | DEBUG    | __main__:trials:29 - Trial = 18983/30000 | Total reward = 35.66
2022-01-26 14:17:58.176 | DEBUG    | __main__:trials:24 - Trial = 18984/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.178 | DEBUG    | __main__:trials:29 - Trial = 18984/30000 | Total reward = 49.69
2022-01-26 14:17:58.181 | DEBUG    | __main__:trials:24 - Trial = 18985/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.182 | DEBUG    | __main__:trials:29 - Trial = 18985/30000 | Total reward = 56.77
2022-01-26 14:17:58.186 | DEBUG    | __main__:trials:24 - Trial = 18986/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.187 | DEBUG    | __main__:trials:29 - Trial = 18986/30000 | Total reward = 38.73
2022-01-26 14:17:58.190 | DEBUG    | __main__:trials:24 - Trial = 18987/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.192 | DEBUG    | __main__:trials:29 - Trial = 18987/30000 | Total reward = 18.30
2022-01-26 14:17:58.195 | DEBUG    | __main__:trials:24 - Trial = 18988/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.197 | DEBUG    | __main__:trials:29 - Trial = 18988/30000 | Total reward = 29.74
2022-01-26 14:17:58.199 | DEBUG    | __main__:trials:26 - Trial = 18989/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.200 | DEBUG    | __main__:trials:29 - Trial = 18989/30000 | Total reward = 14.71
2022-01-26 14:17:58.204 | DEBUG    | __main__:trials:24 - Trial = 18990/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.206 | DEBUG    | __main__:trials:29 - Trial = 18990/30000 | Total reward = 36.52
2022-01-26 14:17:58.209 | DEBUG    | __main__:trials:24 - Trial = 18991/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.211 | DEBUG    | __main__:trials:29 - Trial = 18991/30000 | Total reward = 40.43
2022-01-26 14:17:58.214 | DEBUG    | __main__:trials:24 - Trial = 18992/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.216 | DEBUG    | __main__:trials:29 - Trial = 18992/30000 | Total reward = 37.55
2022-01-26 14:17:58.219 | DEBUG    | __main__:trials:24 - Trial = 18993/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.220 | DEBUG    | __main__:trials:29 - Trial = 18993/30000 | Total reward = 37.80
2022-01-26 14:17:58.224 | DEBUG    | __main__:trials:24 - Trial = 18994/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.226 | DEBUG    | __main__:trials:29 - Trial = 18994/30000 | Total reward = 51.24
2022-01-26 14:17:58.229 | DEBUG    | __main__:trials:24 - Trial = 18995/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.231 | DEBUG    | __main__:trials:29 - Trial = 18995/30000 | Total reward = 36.05
2022-01-26 14:17:58.233 | DEBUG    | __main__:trials:26 - Trial = 18996/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.235 | DEBUG    | __main__:trials:29 - Trial = 18996/30000 | Total reward = 14.71
2022-01-26 14:17:58.239 | DEBUG    | __main__:trials:24 - Trial = 18997/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.240 | DEBUG    | __main__:trials:29 - Trial = 18997/30000 | Total reward = 36.76
2022-01-26 14:17:58.244 | DEBUG    | __main__:trials:24 - Trial = 18998/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.245 | DEBUG    | __main__:trials:29 - Trial = 18998/30000 | Total reward = 32.57
2022-01-26 14:17:58.249 | DEBUG    | __main__:trials:24 - Trial = 18999/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.251 | DEBUG    | __main__:trials:29 - Trial = 18999/30000 | Total reward = 36.18
2022-01-26 14:17:58.255 | DEBUG    | __main__:trials:24 - Trial = 19000/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.256 | DEBUG    | __main__:trials:29 - Trial = 19000/30000 | Total reward = 53.98
2022-01-26 14:17:58.260 | DEBUG    | __main__:trials:26 - Trial = 19001/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.261 | DEBUG    | __main__:trials:29 - Trial = 19001/30000 | Total reward = 26.39
2022-01-26 14:17:58.265 | DEBUG    | __main__:trials:24 - Trial = 19002/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.266 | DEBUG    | __main__:trials:29 - Trial = 19002/30000 | Total reward = 42.89
2022-01-26 14:17:58.268 | DEBUG    | __main__:trials:26 - Trial = 19003/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.270 | DEBUG    | __main__:trials:29 - Trial = 19003/30000 | Total reward = 18.43
2022-01-26 14:17:58.273 | DEBUG    | __main__:trials:24 - Trial = 19004/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.274 | DEBUG    | __main__:trials:29 - Trial = 19004/30000 | Total reward = 46.03
2022-01-26 14:17:58.277 | DEBUG    | __main__:trials:24 - Trial = 19005/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.278 | DEBUG    | __main__:trials:29 - Trial = 19005/30000 | Total reward = 40.49
2022-01-26 14:17:58.281 | DEBUG    | __main__:trials:26 - Trial = 19006/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.281 | DEBUG    | __main__:trials:29 - Trial = 19006/30000 | Total reward = 8.86
2022-01-26 14:17:58.286 | DEBUG    | __main__:trials:24 - Trial = 19007/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.287 | DEBUG    | __main__:trials:29 - Trial = 19007/30000 | Total reward = 45.71
2022-01-26 14:17:58.291 | DEBUG    | __main__:trials:24 - Trial = 19008/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.291 | DEBUG    | __main__:trials:29 - Trial = 19008/30000 | Total reward = 41.67
2022-01-26 14:17:58.296 | DEBUG    | __main__:trials:26 - Trial = 19009/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.297 | DEBUG    | __main__:trials:29 - Trial = 19009/30000 | Total reward = 24.57
2022-01-26 14:17:58.301 | DEBUG    | __main__:trials:26 - Trial = 19010/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.301 | DEBUG    | __main__:trials:29 - Trial = 19010/30000 | Total reward = 25.74
2022-01-26 14:17:58.305 | DEBUG    | __main__:trials:24 - Trial = 19011/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.306 | DEBUG    | __main__:trials:29 - Trial = 19011/30000 | Total reward = 49.47
2022-01-26 14:17:58.311 | DEBUG    | __main__:trials:24 - Trial = 19012/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.312 | DEBUG    | __main__:trials:29 - Trial = 19012/30000 | Total reward = 41.33
2022-01-26 14:17:58.316 | DEBUG    | __main__:trials:24 - Trial = 19013/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.318 | DEBUG    | __main__:trials:29 - Trial = 19013/30000 | Total reward = 46.14
2022-01-26 14:17:58.322 | DEBUG    | __main__:trials:24 - Trial = 19014/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.322 | DEBUG    | __main__:trials:29 - Trial = 19014/30000 | Total reward = 52.13
2022-01-26 14:17:58.327 | DEBUG    | __main__:trials:24 - Trial = 19015/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.327 | DEBUG    | __main__:trials:29 - Trial = 19015/30000 | Total reward = 49.62
2022-01-26 14:17:58.331 | DEBUG    | __main__:trials:24 - Trial = 19016/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.332 | DEBUG    | __main__:trials:29 - Trial = 19016/30000 | Total reward = 42.82
2022-01-26 14:17:58.337 | DEBUG    | __main__:trials:24 - Trial = 19017/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.338 | DEBUG    | __main__:trials:29 - Trial = 19017/30000 | Total reward = 33.61
2022-01-26 14:17:58.341 | DEBUG    | __main__:trials:24 - Trial = 19018/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.343 | DEBUG    | __main__:trials:29 - Trial = 19018/30000 | Total reward = 41.46
2022-01-26 14:17:58.346 | DEBUG    | __main__:trials:24 - Trial = 19019/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.347 | DEBUG    | __main__:trials:29 - Trial = 19019/30000 | Total reward = 41.70
2022-01-26 14:17:58.350 | DEBUG    | __main__:trials:24 - Trial = 19020/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.352 | DEBUG    | __main__:trials:29 - Trial = 19020/30000 | Total reward = 48.83
2022-01-26 14:17:58.355 | DEBUG    | __main__:trials:24 - Trial = 19021/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.356 | DEBUG    | __main__:trials:29 - Trial = 19021/30000 | Total reward = 42.35
2022-01-26 14:17:58.359 | DEBUG    | __main__:trials:26 - Trial = 19022/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.361 | DEBUG    | __main__:trials:29 - Trial = 19022/30000 | Total reward = 35.33
2022-01-26 14:17:58.366 | DEBUG    | __main__:trials:24 - Trial = 19023/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.367 | DEBUG    | __main__:trials:29 - Trial = 19023/30000 | Total reward = 48.16
2022-01-26 14:17:58.371 | DEBUG    | __main__:trials:24 - Trial = 19024/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.373 | DEBUG    | __main__:trials:29 - Trial = 19024/30000 | Total reward = 49.62
2022-01-26 14:17:58.376 | DEBUG    | __main__:trials:24 - Trial = 19025/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.377 | DEBUG    | __main__:trials:29 - Trial = 19025/30000 | Total reward = 41.42
2022-01-26 14:17:58.382 | DEBUG    | __main__:trials:24 - Trial = 19026/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.383 | DEBUG    | __main__:trials:29 - Trial = 19026/30000 | Total reward = 51.43
2022-01-26 14:17:58.387 | DEBUG    | __main__:trials:24 - Trial = 19027/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.389 | DEBUG    | __main__:trials:29 - Trial = 19027/30000 | Total reward = 52.10
2022-01-26 14:17:58.392 | DEBUG    | __main__:trials:24 - Trial = 19028/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.393 | DEBUG    | __main__:trials:29 - Trial = 19028/30000 | Total reward = 50.92
2022-01-26 14:17:58.397 | DEBUG    | __main__:trials:24 - Trial = 19029/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.398 | DEBUG    | __main__:trials:29 - Trial = 19029/30000 | Total reward = 50.79
2022-01-26 14:17:58.402 | DEBUG    | __main__:trials:24 - Trial = 19030/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.403 | DEBUG    | __main__:trials:29 - Trial = 19030/30000 | Total reward = 44.86
2022-01-26 14:17:58.406 | DEBUG    | __main__:trials:24 - Trial = 19031/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.408 | DEBUG    | __main__:trials:29 - Trial = 19031/30000 | Total reward = 56.42
2022-01-26 14:17:58.412 | DEBUG    | __main__:trials:24 - Trial = 19032/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.413 | DEBUG    | __main__:trials:29 - Trial = 19032/30000 | Total reward = 49.49
2022-01-26 14:17:58.417 | DEBUG    | __main__:trials:24 - Trial = 19033/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.418 | DEBUG    | __main__:trials:29 - Trial = 19033/30000 | Total reward = 30.08
2022-01-26 14:17:58.422 | DEBUG    | __main__:trials:24 - Trial = 19034/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.424 | DEBUG    | __main__:trials:29 - Trial = 19034/30000 | Total reward = 30.68
2022-01-26 14:17:58.428 | DEBUG    | __main__:trials:24 - Trial = 19035/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.429 | DEBUG    | __main__:trials:29 - Trial = 19035/30000 | Total reward = 33.75
2022-01-26 14:17:58.432 | DEBUG    | __main__:trials:24 - Trial = 19036/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.434 | DEBUG    | __main__:trials:29 - Trial = 19036/30000 | Total reward = 25.76
2022-01-26 14:17:58.438 | DEBUG    | __main__:trials:24 - Trial = 19037/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.440 | DEBUG    | __main__:trials:29 - Trial = 19037/30000 | Total reward = 36.67
2022-01-26 14:17:58.443 | DEBUG    | __main__:trials:24 - Trial = 19038/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.444 | DEBUG    | __main__:trials:29 - Trial = 19038/30000 | Total reward = 52.25
2022-01-26 14:17:58.448 | DEBUG    | __main__:trials:24 - Trial = 19039/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.449 | DEBUG    | __main__:trials:29 - Trial = 19039/30000 | Total reward = 40.25
2022-01-26 14:17:58.452 | DEBUG    | __main__:trials:24 - Trial = 19040/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.453 | DEBUG    | __main__:trials:29 - Trial = 19040/30000 | Total reward = 41.62
2022-01-26 14:17:58.457 | DEBUG    | __main__:trials:24 - Trial = 19041/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.458 | DEBUG    | __main__:trials:29 - Trial = 19041/30000 | Total reward = 37.29
2022-01-26 14:17:58.462 | DEBUG    | __main__:trials:24 - Trial = 19042/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.463 | DEBUG    | __main__:trials:29 - Trial = 19042/30000 | Total reward = 43.19
2022-01-26 14:17:58.466 | DEBUG    | __main__:trials:24 - Trial = 19043/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.468 | DEBUG    | __main__:trials:29 - Trial = 19043/30000 | Total reward = 31.53
2022-01-26 14:17:58.472 | DEBUG    | __main__:trials:24 - Trial = 19044/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.473 | DEBUG    | __main__:trials:29 - Trial = 19044/30000 | Total reward = 55.14
2022-01-26 14:17:58.477 | DEBUG    | __main__:trials:24 - Trial = 19045/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.479 | DEBUG    | __main__:trials:29 - Trial = 19045/30000 | Total reward = 38.17
2022-01-26 14:17:58.483 | DEBUG    | __main__:trials:24 - Trial = 19046/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.483 | DEBUG    | __main__:trials:29 - Trial = 19046/30000 | Total reward = 36.32
2022-01-26 14:17:58.488 | DEBUG    | __main__:trials:24 - Trial = 19047/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.490 | DEBUG    | __main__:trials:29 - Trial = 19047/30000 | Total reward = 50.01
2022-01-26 14:17:58.493 | DEBUG    | __main__:trials:26 - Trial = 19048/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.493 | DEBUG    | __main__:trials:29 - Trial = 19048/30000 | Total reward = 10.21
2022-01-26 14:17:58.497 | DEBUG    | __main__:trials:24 - Trial = 19049/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.498 | DEBUG    | __main__:trials:29 - Trial = 19049/30000 | Total reward = 43.78
2022-01-26 14:17:58.503 | DEBUG    | __main__:trials:24 - Trial = 19050/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.505 | DEBUG    | __main__:trials:29 - Trial = 19050/30000 | Total reward = 55.05
2022-01-26 14:17:58.508 | DEBUG    | __main__:trials:24 - Trial = 19051/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.510 | DEBUG    | __main__:trials:29 - Trial = 19051/30000 | Total reward = 42.83
2022-01-26 14:17:58.514 | DEBUG    | __main__:trials:24 - Trial = 19052/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.515 | DEBUG    | __main__:trials:29 - Trial = 19052/30000 | Total reward = 44.39
2022-01-26 14:17:58.519 | DEBUG    | __main__:trials:24 - Trial = 19053/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.520 | DEBUG    | __main__:trials:29 - Trial = 19053/30000 | Total reward = 52.13
2022-01-26 14:17:58.523 | DEBUG    | __main__:trials:24 - Trial = 19054/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.525 | DEBUG    | __main__:trials:29 - Trial = 19054/30000 | Total reward = 49.49
2022-01-26 14:17:58.528 | DEBUG    | __main__:trials:24 - Trial = 19055/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.530 | DEBUG    | __main__:trials:29 - Trial = 19055/30000 | Total reward = 45.08
2022-01-26 14:17:58.534 | DEBUG    | __main__:trials:24 - Trial = 19056/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.534 | DEBUG    | __main__:trials:29 - Trial = 19056/30000 | Total reward = 25.04
2022-01-26 14:17:58.538 | DEBUG    | __main__:trials:24 - Trial = 19057/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.540 | DEBUG    | __main__:trials:29 - Trial = 19057/30000 | Total reward = 53.35
2022-01-26 14:17:58.543 | DEBUG    | __main__:trials:24 - Trial = 19058/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.545 | DEBUG    | __main__:trials:29 - Trial = 19058/30000 | Total reward = 48.81
2022-01-26 14:17:58.548 | DEBUG    | __main__:trials:24 - Trial = 19059/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.549 | DEBUG    | __main__:trials:29 - Trial = 19059/30000 | Total reward = 41.80
2022-01-26 14:17:58.553 | DEBUG    | __main__:trials:24 - Trial = 19060/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.555 | DEBUG    | __main__:trials:29 - Trial = 19060/30000 | Total reward = 49.78
2022-01-26 14:17:58.558 | DEBUG    | __main__:trials:24 - Trial = 19061/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.559 | DEBUG    | __main__:trials:29 - Trial = 19061/30000 | Total reward = 48.12
2022-01-26 14:17:58.564 | DEBUG    | __main__:trials:24 - Trial = 19062/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.565 | DEBUG    | __main__:trials:29 - Trial = 19062/30000 | Total reward = 48.98
2022-01-26 14:17:58.568 | DEBUG    | __main__:trials:24 - Trial = 19063/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.570 | DEBUG    | __main__:trials:29 - Trial = 19063/30000 | Total reward = 47.43
2022-01-26 14:17:58.573 | DEBUG    | __main__:trials:24 - Trial = 19064/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.574 | DEBUG    | __main__:trials:29 - Trial = 19064/30000 | Total reward = 49.72
2022-01-26 14:17:58.577 | DEBUG    | __main__:trials:24 - Trial = 19065/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.578 | DEBUG    | __main__:trials:29 - Trial = 19065/30000 | Total reward = 49.30
2022-01-26 14:17:58.581 | DEBUG    | __main__:trials:24 - Trial = 19066/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.582 | DEBUG    | __main__:trials:29 - Trial = 19066/30000 | Total reward = 52.09
2022-01-26 14:17:58.586 | DEBUG    | __main__:trials:24 - Trial = 19067/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.587 | DEBUG    | __main__:trials:29 - Trial = 19067/30000 | Total reward = 49.80
2022-01-26 14:17:58.591 | DEBUG    | __main__:trials:24 - Trial = 19068/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.593 | DEBUG    | __main__:trials:29 - Trial = 19068/30000 | Total reward = 50.41
2022-01-26 14:17:58.596 | DEBUG    | __main__:trials:24 - Trial = 19069/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.597 | DEBUG    | __main__:trials:29 - Trial = 19069/30000 | Total reward = 46.87
2022-01-26 14:17:58.602 | DEBUG    | __main__:trials:24 - Trial = 19070/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.602 | DEBUG    | __main__:trials:29 - Trial = 19070/30000 | Total reward = 52.86
2022-01-26 14:17:58.606 | DEBUG    | __main__:trials:24 - Trial = 19071/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.608 | DEBUG    | __main__:trials:29 - Trial = 19071/30000 | Total reward = 48.85
2022-01-26 14:17:58.612 | DEBUG    | __main__:trials:24 - Trial = 19072/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.613 | DEBUG    | __main__:trials:29 - Trial = 19072/30000 | Total reward = 48.75
2022-01-26 14:17:58.617 | DEBUG    | __main__:trials:24 - Trial = 19073/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.619 | DEBUG    | __main__:trials:29 - Trial = 19073/30000 | Total reward = 47.45
2022-01-26 14:17:58.622 | DEBUG    | __main__:trials:24 - Trial = 19074/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.623 | DEBUG    | __main__:trials:29 - Trial = 19074/30000 | Total reward = 49.96
2022-01-26 14:17:58.627 | DEBUG    | __main__:trials:24 - Trial = 19075/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.628 | DEBUG    | __main__:trials:29 - Trial = 19075/30000 | Total reward = 44.05
2022-01-26 14:17:58.632 | DEBUG    | __main__:trials:24 - Trial = 19076/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.634 | DEBUG    | __main__:trials:29 - Trial = 19076/30000 | Total reward = 39.58
2022-01-26 14:17:58.637 | DEBUG    | __main__:trials:26 - Trial = 19077/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.638 | DEBUG    | __main__:trials:29 - Trial = 19077/30000 | Total reward = 25.25
2022-01-26 14:17:58.641 | DEBUG    | __main__:trials:26 - Trial = 19078/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.643 | DEBUG    | __main__:trials:29 - Trial = 19078/30000 | Total reward = 9.99
2022-01-26 14:17:58.646 | DEBUG    | __main__:trials:24 - Trial = 19079/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.647 | DEBUG    | __main__:trials:29 - Trial = 19079/30000 | Total reward = 45.08
2022-01-26 14:17:58.651 | DEBUG    | __main__:trials:24 - Trial = 19080/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.653 | DEBUG    | __main__:trials:29 - Trial = 19080/30000 | Total reward = 48.06
2022-01-26 14:17:58.657 | DEBUG    | __main__:trials:24 - Trial = 19081/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.657 | DEBUG    | __main__:trials:29 - Trial = 19081/30000 | Total reward = 57.39
2022-01-26 14:17:58.662 | DEBUG    | __main__:trials:24 - Trial = 19082/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.663 | DEBUG    | __main__:trials:29 - Trial = 19082/30000 | Total reward = 61.56
2022-01-26 14:17:58.666 | DEBUG    | __main__:trials:24 - Trial = 19083/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.668 | DEBUG    | __main__:trials:29 - Trial = 19083/30000 | Total reward = 45.32
2022-01-26 14:17:58.672 | DEBUG    | __main__:trials:24 - Trial = 19084/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.672 | DEBUG    | __main__:trials:29 - Trial = 19084/30000 | Total reward = 55.64
2022-01-26 14:17:58.677 | DEBUG    | __main__:trials:24 - Trial = 19085/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.678 | DEBUG    | __main__:trials:29 - Trial = 19085/30000 | Total reward = 53.74
2022-01-26 14:17:58.682 | DEBUG    | __main__:trials:24 - Trial = 19086/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.683 | DEBUG    | __main__:trials:29 - Trial = 19086/30000 | Total reward = 48.79
2022-01-26 14:17:58.687 | DEBUG    | __main__:trials:24 - Trial = 19087/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.688 | DEBUG    | __main__:trials:29 - Trial = 19087/30000 | Total reward = 40.33
2022-01-26 14:17:58.692 | DEBUG    | __main__:trials:24 - Trial = 19088/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.694 | DEBUG    | __main__:trials:29 - Trial = 19088/30000 | Total reward = 52.25
2022-01-26 14:17:58.697 | DEBUG    | __main__:trials:26 - Trial = 19089/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.698 | DEBUG    | __main__:trials:29 - Trial = 19089/30000 | Total reward = 24.14
2022-01-26 14:17:58.702 | DEBUG    | __main__:trials:24 - Trial = 19090/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.702 | DEBUG    | __main__:trials:29 - Trial = 19090/30000 | Total reward = 49.01
2022-01-26 14:17:58.707 | DEBUG    | __main__:trials:24 - Trial = 19091/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.708 | DEBUG    | __main__:trials:29 - Trial = 19091/30000 | Total reward = 51.11
2022-01-26 14:17:58.712 | DEBUG    | __main__:trials:24 - Trial = 19092/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.713 | DEBUG    | __main__:trials:29 - Trial = 19092/30000 | Total reward = 56.51
2022-01-26 14:17:58.717 | DEBUG    | __main__:trials:24 - Trial = 19093/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.719 | DEBUG    | __main__:trials:29 - Trial = 19093/30000 | Total reward = 62.17
2022-01-26 14:17:58.722 | DEBUG    | __main__:trials:24 - Trial = 19094/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.724 | DEBUG    | __main__:trials:29 - Trial = 19094/30000 | Total reward = 51.60
2022-01-26 14:17:58.728 | DEBUG    | __main__:trials:24 - Trial = 19095/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.728 | DEBUG    | __main__:trials:29 - Trial = 19095/30000 | Total reward = 52.25
2022-01-26 14:17:58.733 | DEBUG    | __main__:trials:24 - Trial = 19096/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.734 | DEBUG    | __main__:trials:29 - Trial = 19096/30000 | Total reward = 51.99
2022-01-26 14:17:58.738 | DEBUG    | __main__:trials:24 - Trial = 19097/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.739 | DEBUG    | __main__:trials:29 - Trial = 19097/30000 | Total reward = 47.21
2022-01-26 14:17:58.742 | DEBUG    | __main__:trials:26 - Trial = 19098/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.744 | DEBUG    | __main__:trials:29 - Trial = 19098/30000 | Total reward = 16.66
2022-01-26 14:17:58.747 | DEBUG    | __main__:trials:24 - Trial = 19099/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.749 | DEBUG    | __main__:trials:29 - Trial = 19099/30000 | Total reward = 49.82
2022-01-26 14:17:58.752 | DEBUG    | __main__:trials:24 - Trial = 19100/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.754 | DEBUG    | __main__:trials:29 - Trial = 19100/30000 | Total reward = 51.77
2022-01-26 14:17:58.755 | DEBUG    | __main__:trials:26 - Trial = 19101/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.757 | DEBUG    | __main__:trials:29 - Trial = 19101/30000 | Total reward = 12.37
2022-01-26 14:17:58.760 | DEBUG    | __main__:trials:24 - Trial = 19102/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.762 | DEBUG    | __main__:trials:29 - Trial = 19102/30000 | Total reward = 49.63
2022-01-26 14:17:58.765 | DEBUG    | __main__:trials:26 - Trial = 19103/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.765 | DEBUG    | __main__:trials:29 - Trial = 19103/30000 | Total reward = 18.35
2022-01-26 14:17:58.769 | DEBUG    | __main__:trials:26 - Trial = 19104/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.770 | DEBUG    | __main__:trials:29 - Trial = 19104/30000 | Total reward = 35.49
2022-01-26 14:17:58.774 | DEBUG    | __main__:trials:24 - Trial = 19105/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.775 | DEBUG    | __main__:trials:29 - Trial = 19105/30000 | Total reward = 50.94
2022-01-26 14:17:58.779 | DEBUG    | __main__:trials:26 - Trial = 19106/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.780 | DEBUG    | __main__:trials:29 - Trial = 19106/30000 | Total reward = 41.71
2022-01-26 14:17:58.783 | DEBUG    | __main__:trials:26 - Trial = 19107/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.785 | DEBUG    | __main__:trials:29 - Trial = 19107/30000 | Total reward = 14.08
2022-01-26 14:17:58.788 | DEBUG    | __main__:trials:26 - Trial = 19108/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.788 | DEBUG    | __main__:trials:29 - Trial = 19108/30000 | Total reward = 26.13
2022-01-26 14:17:58.792 | DEBUG    | __main__:trials:24 - Trial = 19109/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.794 | DEBUG    | __main__:trials:29 - Trial = 19109/30000 | Total reward = 48.12
2022-01-26 14:17:58.798 | DEBUG    | __main__:trials:24 - Trial = 19110/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.798 | DEBUG    | __main__:trials:29 - Trial = 19110/30000 | Total reward = 51.61
2022-01-26 14:17:58.803 | DEBUG    | __main__:trials:24 - Trial = 19111/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.804 | DEBUG    | __main__:trials:29 - Trial = 19111/30000 | Total reward = 49.07
2022-01-26 14:17:58.808 | DEBUG    | __main__:trials:26 - Trial = 19112/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.809 | DEBUG    | __main__:trials:29 - Trial = 19112/30000 | Total reward = 29.74
2022-01-26 14:17:58.813 | DEBUG    | __main__:trials:24 - Trial = 19113/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.815 | DEBUG    | __main__:trials:29 - Trial = 19113/30000 | Total reward = 52.48
2022-01-26 14:17:58.818 | DEBUG    | __main__:trials:24 - Trial = 19114/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.820 | DEBUG    | __main__:trials:29 - Trial = 19114/30000 | Total reward = 49.32
2022-01-26 14:17:58.823 | DEBUG    | __main__:trials:24 - Trial = 19115/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.825 | DEBUG    | __main__:trials:29 - Trial = 19115/30000 | Total reward = 51.37
2022-01-26 14:17:58.829 | DEBUG    | __main__:trials:24 - Trial = 19116/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.830 | DEBUG    | __main__:trials:29 - Trial = 19116/30000 | Total reward = 57.48
2022-01-26 14:17:58.834 | DEBUG    | __main__:trials:24 - Trial = 19117/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.835 | DEBUG    | __main__:trials:29 - Trial = 19117/30000 | Total reward = 51.21
2022-01-26 14:17:58.838 | DEBUG    | __main__:trials:24 - Trial = 19118/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.840 | DEBUG    | __main__:trials:29 - Trial = 19118/30000 | Total reward = 56.54
2022-01-26 14:17:58.843 | DEBUG    | __main__:trials:24 - Trial = 19119/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.845 | DEBUG    | __main__:trials:29 - Trial = 19119/30000 | Total reward = 51.77
2022-01-26 14:17:58.848 | DEBUG    | __main__:trials:24 - Trial = 19120/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.850 | DEBUG    | __main__:trials:29 - Trial = 19120/30000 | Total reward = 50.90
2022-01-26 14:17:58.853 | DEBUG    | __main__:trials:24 - Trial = 19121/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.854 | DEBUG    | __main__:trials:29 - Trial = 19121/30000 | Total reward = 53.10
2022-01-26 14:17:58.858 | DEBUG    | __main__:trials:24 - Trial = 19122/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.860 | DEBUG    | __main__:trials:29 - Trial = 19122/30000 | Total reward = 49.53
2022-01-26 14:17:58.863 | DEBUG    | __main__:trials:24 - Trial = 19123/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.865 | DEBUG    | __main__:trials:29 - Trial = 19123/30000 | Total reward = 51.33
2022-01-26 14:17:58.868 | DEBUG    | __main__:trials:24 - Trial = 19124/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.870 | DEBUG    | __main__:trials:29 - Trial = 19124/30000 | Total reward = 54.95
2022-01-26 14:17:58.873 | DEBUG    | __main__:trials:24 - Trial = 19125/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.875 | DEBUG    | __main__:trials:29 - Trial = 19125/30000 | Total reward = 57.86
2022-01-26 14:17:58.878 | DEBUG    | __main__:trials:24 - Trial = 19126/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.880 | DEBUG    | __main__:trials:29 - Trial = 19126/30000 | Total reward = 50.86
2022-01-26 14:17:58.884 | DEBUG    | __main__:trials:24 - Trial = 19127/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.885 | DEBUG    | __main__:trials:29 - Trial = 19127/30000 | Total reward = 48.58
2022-01-26 14:17:58.888 | DEBUG    | __main__:trials:24 - Trial = 19128/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.890 | DEBUG    | __main__:trials:29 - Trial = 19128/30000 | Total reward = 51.69
2022-01-26 14:17:58.893 | DEBUG    | __main__:trials:26 - Trial = 19129/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.894 | DEBUG    | __main__:trials:29 - Trial = 19129/30000 | Total reward = 34.30
2022-01-26 14:17:58.898 | DEBUG    | __main__:trials:26 - Trial = 19130/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.899 | DEBUG    | __main__:trials:29 - Trial = 19130/30000 | Total reward = 8.99
2022-01-26 14:17:58.902 | DEBUG    | __main__:trials:24 - Trial = 19131/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.904 | DEBUG    | __main__:trials:29 - Trial = 19131/30000 | Total reward = 55.55
2022-01-26 14:17:58.906 | DEBUG    | __main__:trials:26 - Trial = 19132/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.907 | DEBUG    | __main__:trials:29 - Trial = 19132/30000 | Total reward = 7.70
2022-01-26 14:17:58.911 | DEBUG    | __main__:trials:24 - Trial = 19133/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.912 | DEBUG    | __main__:trials:29 - Trial = 19133/30000 | Total reward = 53.17
2022-01-26 14:17:58.915 | DEBUG    | __main__:trials:24 - Trial = 19134/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.917 | DEBUG    | __main__:trials:29 - Trial = 19134/30000 | Total reward = 52.93
2022-01-26 14:17:58.920 | DEBUG    | __main__:trials:24 - Trial = 19135/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.922 | DEBUG    | __main__:trials:29 - Trial = 19135/30000 | Total reward = 51.77
2022-01-26 14:17:58.926 | DEBUG    | __main__:trials:24 - Trial = 19136/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.927 | DEBUG    | __main__:trials:29 - Trial = 19136/30000 | Total reward = 51.62
2022-01-26 14:17:58.930 | DEBUG    | __main__:trials:24 - Trial = 19137/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.932 | DEBUG    | __main__:trials:29 - Trial = 19137/30000 | Total reward = 50.09
2022-01-26 14:17:58.936 | DEBUG    | __main__:trials:24 - Trial = 19138/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.937 | DEBUG    | __main__:trials:29 - Trial = 19138/30000 | Total reward = 36.49
2022-01-26 14:17:58.940 | DEBUG    | __main__:trials:24 - Trial = 19139/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.942 | DEBUG    | __main__:trials:29 - Trial = 19139/30000 | Total reward = 46.43
2022-01-26 14:17:58.946 | DEBUG    | __main__:trials:24 - Trial = 19140/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.947 | DEBUG    | __main__:trials:29 - Trial = 19140/30000 | Total reward = 51.01
2022-01-26 14:17:58.950 | DEBUG    | __main__:trials:24 - Trial = 19141/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.952 | DEBUG    | __main__:trials:29 - Trial = 19141/30000 | Total reward = 52.74
2022-01-26 14:17:58.955 | DEBUG    | __main__:trials:24 - Trial = 19142/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.957 | DEBUG    | __main__:trials:29 - Trial = 19142/30000 | Total reward = 49.62
2022-01-26 14:17:58.960 | DEBUG    | __main__:trials:24 - Trial = 19143/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.961 | DEBUG    | __main__:trials:29 - Trial = 19143/30000 | Total reward = 50.67
2022-01-26 14:17:58.965 | DEBUG    | __main__:trials:24 - Trial = 19144/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.966 | DEBUG    | __main__:trials:29 - Trial = 19144/30000 | Total reward = 51.77
2022-01-26 14:17:58.970 | DEBUG    | __main__:trials:24 - Trial = 19145/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.972 | DEBUG    | __main__:trials:29 - Trial = 19145/30000 | Total reward = 52.72
2022-01-26 14:17:58.976 | DEBUG    | __main__:trials:24 - Trial = 19146/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.977 | DEBUG    | __main__:trials:29 - Trial = 19146/30000 | Total reward = 53.14
2022-01-26 14:17:58.981 | DEBUG    | __main__:trials:24 - Trial = 19147/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.983 | DEBUG    | __main__:trials:29 - Trial = 19147/30000 | Total reward = 52.16
2022-01-26 14:17:58.985 | DEBUG    | __main__:trials:26 - Trial = 19148/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:58.986 | DEBUG    | __main__:trials:29 - Trial = 19148/30000 | Total reward = 27.02
2022-01-26 14:17:58.989 | DEBUG    | __main__:trials:24 - Trial = 19149/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.991 | DEBUG    | __main__:trials:29 - Trial = 19149/30000 | Total reward = 56.90
2022-01-26 14:17:58.994 | DEBUG    | __main__:trials:24 - Trial = 19150/30000 | Max number of steps (20) reached
2022-01-26 14:17:58.995 | DEBUG    | __main__:trials:29 - Trial = 19150/30000 | Total reward = 61.29
2022-01-26 14:17:58.999 | DEBUG    | __main__:trials:24 - Trial = 19151/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.001 | DEBUG    | __main__:trials:29 - Trial = 19151/30000 | Total reward = 50.79
2022-01-26 14:17:59.004 | DEBUG    | __main__:trials:24 - Trial = 19152/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.005 | DEBUG    | __main__:trials:29 - Trial = 19152/30000 | Total reward = 57.73
2022-01-26 14:17:59.010 | DEBUG    | __main__:trials:24 - Trial = 19153/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.011 | DEBUG    | __main__:trials:29 - Trial = 19153/30000 | Total reward = 50.57
2022-01-26 14:17:59.015 | DEBUG    | __main__:trials:24 - Trial = 19154/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.016 | DEBUG    | __main__:trials:29 - Trial = 19154/30000 | Total reward = 49.62
2022-01-26 14:17:59.020 | DEBUG    | __main__:trials:24 - Trial = 19155/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.021 | DEBUG    | __main__:trials:29 - Trial = 19155/30000 | Total reward = 53.23
2022-01-26 14:17:59.025 | DEBUG    | __main__:trials:24 - Trial = 19156/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.026 | DEBUG    | __main__:trials:29 - Trial = 19156/30000 | Total reward = 51.36
2022-01-26 14:17:59.029 | DEBUG    | __main__:trials:24 - Trial = 19157/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.031 | DEBUG    | __main__:trials:29 - Trial = 19157/30000 | Total reward = 52.14
2022-01-26 14:17:59.035 | DEBUG    | __main__:trials:24 - Trial = 19158/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.036 | DEBUG    | __main__:trials:29 - Trial = 19158/30000 | Total reward = 50.16
2022-01-26 14:17:59.039 | DEBUG    | __main__:trials:24 - Trial = 19159/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.041 | DEBUG    | __main__:trials:29 - Trial = 19159/30000 | Total reward = 53.05
2022-01-26 14:17:59.045 | DEBUG    | __main__:trials:24 - Trial = 19160/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.046 | DEBUG    | __main__:trials:29 - Trial = 19160/30000 | Total reward = 50.44
2022-01-26 14:17:59.049 | DEBUG    | __main__:trials:26 - Trial = 19161/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.050 | DEBUG    | __main__:trials:29 - Trial = 19161/30000 | Total reward = 18.23
2022-01-26 14:17:59.053 | DEBUG    | __main__:trials:24 - Trial = 19162/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.054 | DEBUG    | __main__:trials:29 - Trial = 19162/30000 | Total reward = 52.81
2022-01-26 14:17:59.057 | DEBUG    | __main__:trials:24 - Trial = 19163/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.059 | DEBUG    | __main__:trials:29 - Trial = 19163/30000 | Total reward = 37.19
2022-01-26 14:17:59.062 | DEBUG    | __main__:trials:26 - Trial = 19164/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.062 | DEBUG    | __main__:trials:29 - Trial = 19164/30000 | Total reward = 10.11
2022-01-26 14:17:59.065 | DEBUG    | __main__:trials:26 - Trial = 19165/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.066 | DEBUG    | __main__:trials:29 - Trial = 19165/30000 | Total reward = 9.99
2022-01-26 14:17:59.070 | DEBUG    | __main__:trials:26 - Trial = 19166/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.070 | DEBUG    | __main__:trials:29 - Trial = 19166/30000 | Total reward = 18.31
2022-01-26 14:17:59.075 | DEBUG    | __main__:trials:24 - Trial = 19167/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.077 | DEBUG    | __main__:trials:29 - Trial = 19167/30000 | Total reward = 58.92
2022-01-26 14:17:59.079 | DEBUG    | __main__:trials:26 - Trial = 19168/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.081 | DEBUG    | __main__:trials:29 - Trial = 19168/30000 | Total reward = 9.99
2022-01-26 14:17:59.084 | DEBUG    | __main__:trials:24 - Trial = 19169/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.084 | DEBUG    | __main__:trials:29 - Trial = 19169/30000 | Total reward = 50.17
2022-01-26 14:17:59.086 | DEBUG    | __main__:trials:26 - Trial = 19170/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.088 | DEBUG    | __main__:trials:29 - Trial = 19170/30000 | Total reward = 7.70
2022-01-26 14:17:59.091 | DEBUG    | __main__:trials:24 - Trial = 19171/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.093 | DEBUG    | __main__:trials:29 - Trial = 19171/30000 | Total reward = 52.29
2022-01-26 14:17:59.097 | DEBUG    | __main__:trials:24 - Trial = 19172/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.098 | DEBUG    | __main__:trials:29 - Trial = 19172/30000 | Total reward = 53.47
2022-01-26 14:17:59.102 | DEBUG    | __main__:trials:24 - Trial = 19173/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.104 | DEBUG    | __main__:trials:29 - Trial = 19173/30000 | Total reward = 41.30
2022-01-26 14:17:59.107 | DEBUG    | __main__:trials:24 - Trial = 19174/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.108 | DEBUG    | __main__:trials:29 - Trial = 19174/30000 | Total reward = 51.26
2022-01-26 14:17:59.112 | DEBUG    | __main__:trials:26 - Trial = 19175/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.113 | DEBUG    | __main__:trials:29 - Trial = 19175/30000 | Total reward = 29.98
2022-01-26 14:17:59.115 | DEBUG    | __main__:trials:26 - Trial = 19176/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.116 | DEBUG    | __main__:trials:29 - Trial = 19176/30000 | Total reward = 7.57
2022-01-26 14:17:59.120 | DEBUG    | __main__:trials:24 - Trial = 19177/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.121 | DEBUG    | __main__:trials:29 - Trial = 19177/30000 | Total reward = 43.17
2022-01-26 14:17:59.125 | DEBUG    | __main__:trials:26 - Trial = 19178/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.126 | DEBUG    | __main__:trials:29 - Trial = 19178/30000 | Total reward = 21.74
2022-01-26 14:17:59.128 | DEBUG    | __main__:trials:26 - Trial = 19179/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.129 | DEBUG    | __main__:trials:29 - Trial = 19179/30000 | Total reward = 9.99
2022-01-26 14:17:59.132 | DEBUG    | __main__:trials:26 - Trial = 19180/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.133 | DEBUG    | __main__:trials:29 - Trial = 19180/30000 | Total reward = 11.38
2022-01-26 14:17:59.136 | DEBUG    | __main__:trials:26 - Trial = 19181/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.137 | DEBUG    | __main__:trials:29 - Trial = 19181/30000 | Total reward = 9.99
2022-01-26 14:17:59.140 | DEBUG    | __main__:trials:26 - Trial = 19182/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.142 | DEBUG    | __main__:trials:29 - Trial = 19182/30000 | Total reward = 16.79
2022-01-26 14:17:59.144 | DEBUG    | __main__:trials:26 - Trial = 19183/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.146 | DEBUG    | __main__:trials:29 - Trial = 19183/30000 | Total reward = 9.99
2022-01-26 14:17:59.148 | DEBUG    | __main__:trials:26 - Trial = 19184/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.150 | DEBUG    | __main__:trials:29 - Trial = 19184/30000 | Total reward = 10.66
2022-01-26 14:17:59.154 | DEBUG    | __main__:trials:24 - Trial = 19185/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.155 | DEBUG    | __main__:trials:29 - Trial = 19185/30000 | Total reward = 43.96
2022-01-26 14:17:59.158 | DEBUG    | __main__:trials:26 - Trial = 19186/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.159 | DEBUG    | __main__:trials:29 - Trial = 19186/30000 | Total reward = 13.12
2022-01-26 14:17:59.161 | DEBUG    | __main__:trials:26 - Trial = 19187/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.162 | DEBUG    | __main__:trials:29 - Trial = 19187/30000 | Total reward = 9.99
2022-01-26 14:17:59.165 | DEBUG    | __main__:trials:24 - Trial = 19188/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.166 | DEBUG    | __main__:trials:29 - Trial = 19188/30000 | Total reward = 42.03
2022-01-26 14:17:59.169 | DEBUG    | __main__:trials:24 - Trial = 19189/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.171 | DEBUG    | __main__:trials:29 - Trial = 19189/30000 | Total reward = 25.83
2022-01-26 14:17:59.174 | DEBUG    | __main__:trials:26 - Trial = 19190/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.175 | DEBUG    | __main__:trials:29 - Trial = 19190/30000 | Total reward = 21.51
2022-01-26 14:17:59.177 | DEBUG    | __main__:trials:26 - Trial = 19191/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.177 | DEBUG    | __main__:trials:29 - Trial = 19191/30000 | Total reward = 9.99
2022-01-26 14:17:59.181 | DEBUG    | __main__:trials:26 - Trial = 19192/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.182 | DEBUG    | __main__:trials:29 - Trial = 19192/30000 | Total reward = 9.99
2022-01-26 14:17:59.185 | DEBUG    | __main__:trials:26 - Trial = 19193/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.186 | DEBUG    | __main__:trials:29 - Trial = 19193/30000 | Total reward = 21.67
2022-01-26 14:17:59.189 | DEBUG    | __main__:trials:26 - Trial = 19194/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.191 | DEBUG    | __main__:trials:29 - Trial = 19194/30000 | Total reward = 18.98
2022-01-26 14:17:59.195 | DEBUG    | __main__:trials:24 - Trial = 19195/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.195 | DEBUG    | __main__:trials:29 - Trial = 19195/30000 | Total reward = 42.44
2022-01-26 14:17:59.198 | DEBUG    | __main__:trials:26 - Trial = 19196/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.200 | DEBUG    | __main__:trials:29 - Trial = 19196/30000 | Total reward = 7.70
2022-01-26 14:17:59.203 | DEBUG    | __main__:trials:24 - Trial = 19197/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.204 | DEBUG    | __main__:trials:29 - Trial = 19197/30000 | Total reward = 48.98
2022-01-26 14:17:59.206 | DEBUG    | __main__:trials:26 - Trial = 19198/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.208 | DEBUG    | __main__:trials:29 - Trial = 19198/30000 | Total reward = 10.11
2022-01-26 14:17:59.211 | DEBUG    | __main__:trials:24 - Trial = 19199/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.213 | DEBUG    | __main__:trials:29 - Trial = 19199/30000 | Total reward = 49.77
2022-01-26 14:17:59.216 | DEBUG    | __main__:trials:24 - Trial = 19200/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.218 | DEBUG    | __main__:trials:29 - Trial = 19200/30000 | Total reward = 56.22
2022-01-26 14:17:59.222 | DEBUG    | __main__:trials:24 - Trial = 19201/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.223 | DEBUG    | __main__:trials:29 - Trial = 19201/30000 | Total reward = 34.96
2022-01-26 14:17:59.227 | DEBUG    | __main__:trials:24 - Trial = 19202/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.229 | DEBUG    | __main__:trials:29 - Trial = 19202/30000 | Total reward = 44.14
2022-01-26 14:17:59.231 | DEBUG    | __main__:trials:26 - Trial = 19203/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.233 | DEBUG    | __main__:trials:29 - Trial = 19203/30000 | Total reward = 20.39
2022-01-26 14:17:59.236 | DEBUG    | __main__:trials:24 - Trial = 19204/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.238 | DEBUG    | __main__:trials:29 - Trial = 19204/30000 | Total reward = 44.02
2022-01-26 14:17:59.240 | DEBUG    | __main__:trials:26 - Trial = 19205/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.242 | DEBUG    | __main__:trials:29 - Trial = 19205/30000 | Total reward = 9.99
2022-01-26 14:17:59.244 | DEBUG    | __main__:trials:26 - Trial = 19206/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.246 | DEBUG    | __main__:trials:29 - Trial = 19206/30000 | Total reward = 9.99
2022-01-26 14:17:59.250 | DEBUG    | __main__:trials:24 - Trial = 19207/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.250 | DEBUG    | __main__:trials:29 - Trial = 19207/30000 | Total reward = 43.57
2022-01-26 14:17:59.255 | DEBUG    | __main__:trials:24 - Trial = 19208/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.257 | DEBUG    | __main__:trials:29 - Trial = 19208/30000 | Total reward = 37.98
2022-01-26 14:17:59.258 | DEBUG    | __main__:trials:26 - Trial = 19209/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.260 | DEBUG    | __main__:trials:29 - Trial = 19209/30000 | Total reward = 9.99
2022-01-26 14:17:59.263 | DEBUG    | __main__:trials:26 - Trial = 19210/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.265 | DEBUG    | __main__:trials:29 - Trial = 19210/30000 | Total reward = 40.71
2022-01-26 14:17:59.268 | DEBUG    | __main__:trials:26 - Trial = 19211/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.269 | DEBUG    | __main__:trials:29 - Trial = 19211/30000 | Total reward = 24.24
2022-01-26 14:17:59.273 | DEBUG    | __main__:trials:24 - Trial = 19212/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.274 | DEBUG    | __main__:trials:29 - Trial = 19212/30000 | Total reward = 40.89
2022-01-26 14:17:59.276 | DEBUG    | __main__:trials:26 - Trial = 19213/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.277 | DEBUG    | __main__:trials:29 - Trial = 19213/30000 | Total reward = 9.99
2022-01-26 14:17:59.281 | DEBUG    | __main__:trials:26 - Trial = 19214/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.283 | DEBUG    | __main__:trials:29 - Trial = 19214/30000 | Total reward = 25.70
2022-01-26 14:17:59.287 | DEBUG    | __main__:trials:24 - Trial = 19215/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.288 | DEBUG    | __main__:trials:29 - Trial = 19215/30000 | Total reward = 49.57
2022-01-26 14:17:59.290 | DEBUG    | __main__:trials:26 - Trial = 19216/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.291 | DEBUG    | __main__:trials:29 - Trial = 19216/30000 | Total reward = 9.99
2022-01-26 14:17:59.294 | DEBUG    | __main__:trials:26 - Trial = 19217/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.295 | DEBUG    | __main__:trials:29 - Trial = 19217/30000 | Total reward = 18.59
2022-01-26 14:17:59.300 | DEBUG    | __main__:trials:24 - Trial = 19218/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.301 | DEBUG    | __main__:trials:29 - Trial = 19218/30000 | Total reward = 35.97
2022-01-26 14:17:59.304 | DEBUG    | __main__:trials:24 - Trial = 19219/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.306 | DEBUG    | __main__:trials:29 - Trial = 19219/30000 | Total reward = 34.65
2022-01-26 14:17:59.307 | DEBUG    | __main__:trials:26 - Trial = 19220/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.309 | DEBUG    | __main__:trials:29 - Trial = 19220/30000 | Total reward = 7.41
2022-01-26 14:17:59.313 | DEBUG    | __main__:trials:24 - Trial = 19221/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.314 | DEBUG    | __main__:trials:29 - Trial = 19221/30000 | Total reward = 52.83
2022-01-26 14:17:59.316 | DEBUG    | __main__:trials:26 - Trial = 19222/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.318 | DEBUG    | __main__:trials:29 - Trial = 19222/30000 | Total reward = 9.99
2022-01-26 14:17:59.321 | DEBUG    | __main__:trials:26 - Trial = 19223/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.321 | DEBUG    | __main__:trials:29 - Trial = 19223/30000 | Total reward = 6.39
2022-01-26 14:17:59.326 | DEBUG    | __main__:trials:24 - Trial = 19224/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.326 | DEBUG    | __main__:trials:29 - Trial = 19224/30000 | Total reward = 36.20
2022-01-26 14:17:59.331 | DEBUG    | __main__:trials:26 - Trial = 19225/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.331 | DEBUG    | __main__:trials:29 - Trial = 19225/30000 | Total reward = 26.77
2022-01-26 14:17:59.336 | DEBUG    | __main__:trials:24 - Trial = 19226/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.338 | DEBUG    | __main__:trials:29 - Trial = 19226/30000 | Total reward = 41.74
2022-01-26 14:17:59.340 | DEBUG    | __main__:trials:26 - Trial = 19227/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.342 | DEBUG    | __main__:trials:29 - Trial = 19227/30000 | Total reward = 13.57
2022-01-26 14:17:59.345 | DEBUG    | __main__:trials:24 - Trial = 19228/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.346 | DEBUG    | __main__:trials:29 - Trial = 19228/30000 | Total reward = 35.75
2022-01-26 14:17:59.351 | DEBUG    | __main__:trials:26 - Trial = 19229/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.352 | DEBUG    | __main__:trials:29 - Trial = 19229/30000 | Total reward = 33.07
2022-01-26 14:17:59.355 | DEBUG    | __main__:trials:26 - Trial = 19230/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.356 | DEBUG    | __main__:trials:29 - Trial = 19230/30000 | Total reward = 6.12
2022-01-26 14:17:59.358 | DEBUG    | __main__:trials:26 - Trial = 19231/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.360 | DEBUG    | __main__:trials:29 - Trial = 19231/30000 | Total reward = 9.99
2022-01-26 14:17:59.362 | DEBUG    | __main__:trials:26 - Trial = 19232/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.364 | DEBUG    | __main__:trials:29 - Trial = 19232/30000 | Total reward = 9.57
2022-01-26 14:17:59.366 | DEBUG    | __main__:trials:26 - Trial = 19233/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.368 | DEBUG    | __main__:trials:29 - Trial = 19233/30000 | Total reward = 9.99
2022-01-26 14:17:59.371 | DEBUG    | __main__:trials:24 - Trial = 19234/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.373 | DEBUG    | __main__:trials:29 - Trial = 19234/30000 | Total reward = 51.97
2022-01-26 14:17:59.375 | DEBUG    | __main__:trials:26 - Trial = 19235/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.377 | DEBUG    | __main__:trials:29 - Trial = 19235/30000 | Total reward = 18.51
2022-01-26 14:17:59.380 | DEBUG    | __main__:trials:24 - Trial = 19236/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.381 | DEBUG    | __main__:trials:29 - Trial = 19236/30000 | Total reward = 43.69
2022-01-26 14:17:59.383 | DEBUG    | __main__:trials:26 - Trial = 19237/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.385 | DEBUG    | __main__:trials:29 - Trial = 19237/30000 | Total reward = 9.99
2022-01-26 14:17:59.387 | DEBUG    | __main__:trials:26 - Trial = 19238/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.388 | DEBUG    | __main__:trials:29 - Trial = 19238/30000 | Total reward = 9.99
2022-01-26 14:17:59.391 | DEBUG    | __main__:trials:26 - Trial = 19239/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.392 | DEBUG    | __main__:trials:29 - Trial = 19239/30000 | Total reward = 16.90
2022-01-26 14:17:59.396 | DEBUG    | __main__:trials:24 - Trial = 19240/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.397 | DEBUG    | __main__:trials:29 - Trial = 19240/30000 | Total reward = 53.38
2022-01-26 14:17:59.401 | DEBUG    | __main__:trials:24 - Trial = 19241/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.402 | DEBUG    | __main__:trials:29 - Trial = 19241/30000 | Total reward = 47.85
2022-01-26 14:17:59.406 | DEBUG    | __main__:trials:24 - Trial = 19242/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.407 | DEBUG    | __main__:trials:29 - Trial = 19242/30000 | Total reward = 33.85
2022-01-26 14:17:59.410 | DEBUG    | __main__:trials:26 - Trial = 19243/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.411 | DEBUG    | __main__:trials:29 - Trial = 19243/30000 | Total reward = 9.99
2022-01-26 14:17:59.415 | DEBUG    | __main__:trials:24 - Trial = 19244/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.416 | DEBUG    | __main__:trials:29 - Trial = 19244/30000 | Total reward = 46.98
2022-01-26 14:17:59.420 | DEBUG    | __main__:trials:26 - Trial = 19245/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.421 | DEBUG    | __main__:trials:29 - Trial = 19245/30000 | Total reward = 23.11
2022-01-26 14:17:59.424 | DEBUG    | __main__:trials:26 - Trial = 19246/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.424 | DEBUG    | __main__:trials:29 - Trial = 19246/30000 | Total reward = 9.99
2022-01-26 14:17:59.428 | DEBUG    | __main__:trials:24 - Trial = 19247/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.430 | DEBUG    | __main__:trials:29 - Trial = 19247/30000 | Total reward = 49.98
2022-01-26 14:17:59.434 | DEBUG    | __main__:trials:24 - Trial = 19248/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.435 | DEBUG    | __main__:trials:29 - Trial = 19248/30000 | Total reward = 43.62
2022-01-26 14:17:59.437 | DEBUG    | __main__:trials:26 - Trial = 19249/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.439 | DEBUG    | __main__:trials:29 - Trial = 19249/30000 | Total reward = 9.99
2022-01-26 14:17:59.443 | DEBUG    | __main__:trials:26 - Trial = 19250/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.444 | DEBUG    | __main__:trials:29 - Trial = 19250/30000 | Total reward = 39.70
2022-01-26 14:17:59.447 | DEBUG    | __main__:trials:26 - Trial = 19251/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.448 | DEBUG    | __main__:trials:29 - Trial = 19251/30000 | Total reward = 9.99
2022-01-26 14:17:59.452 | DEBUG    | __main__:trials:24 - Trial = 19252/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.452 | DEBUG    | __main__:trials:29 - Trial = 19252/30000 | Total reward = 58.35
2022-01-26 14:17:59.455 | DEBUG    | __main__:trials:26 - Trial = 19253/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.456 | DEBUG    | __main__:trials:29 - Trial = 19253/30000 | Total reward = 9.99
2022-01-26 14:17:59.460 | DEBUG    | __main__:trials:24 - Trial = 19254/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.461 | DEBUG    | __main__:trials:29 - Trial = 19254/30000 | Total reward = 45.60
2022-01-26 14:17:59.464 | DEBUG    | __main__:trials:26 - Trial = 19255/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.465 | DEBUG    | __main__:trials:29 - Trial = 19255/30000 | Total reward = 9.99
2022-01-26 14:17:59.467 | DEBUG    | __main__:trials:26 - Trial = 19256/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.468 | DEBUG    | __main__:trials:29 - Trial = 19256/30000 | Total reward = 9.99
2022-01-26 14:17:59.472 | DEBUG    | __main__:trials:24 - Trial = 19257/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.473 | DEBUG    | __main__:trials:29 - Trial = 19257/30000 | Total reward = 47.50
2022-01-26 14:17:59.477 | DEBUG    | __main__:trials:24 - Trial = 19258/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.479 | DEBUG    | __main__:trials:29 - Trial = 19258/30000 | Total reward = 41.47
2022-01-26 14:17:59.481 | DEBUG    | __main__:trials:26 - Trial = 19259/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.482 | DEBUG    | __main__:trials:29 - Trial = 19259/30000 | Total reward = 10.27
2022-01-26 14:17:59.484 | DEBUG    | __main__:trials:26 - Trial = 19260/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.484 | DEBUG    | __main__:trials:29 - Trial = 19260/30000 | Total reward = 9.99
2022-01-26 14:17:59.487 | DEBUG    | __main__:trials:26 - Trial = 19261/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.488 | DEBUG    | __main__:trials:29 - Trial = 19261/30000 | Total reward = 7.70
2022-01-26 14:17:59.490 | DEBUG    | __main__:trials:26 - Trial = 19262/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.491 | DEBUG    | __main__:trials:29 - Trial = 19262/30000 | Total reward = 10.25
2022-01-26 14:17:59.495 | DEBUG    | __main__:trials:24 - Trial = 19263/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.496 | DEBUG    | __main__:trials:29 - Trial = 19263/30000 | Total reward = 34.51
2022-01-26 14:17:59.498 | DEBUG    | __main__:trials:26 - Trial = 19264/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.498 | DEBUG    | __main__:trials:29 - Trial = 19264/30000 | Total reward = 13.85
2022-01-26 14:17:59.501 | DEBUG    | __main__:trials:26 - Trial = 19265/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.502 | DEBUG    | __main__:trials:29 - Trial = 19265/30000 | Total reward = 11.14
2022-01-26 14:17:59.505 | DEBUG    | __main__:trials:24 - Trial = 19266/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.506 | DEBUG    | __main__:trials:29 - Trial = 19266/30000 | Total reward = 44.72
2022-01-26 14:17:59.509 | DEBUG    | __main__:trials:24 - Trial = 19267/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.511 | DEBUG    | __main__:trials:29 - Trial = 19267/30000 | Total reward = 40.97
2022-01-26 14:17:59.514 | DEBUG    | __main__:trials:26 - Trial = 19268/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.516 | DEBUG    | __main__:trials:29 - Trial = 19268/30000 | Total reward = 23.11
2022-01-26 14:17:59.519 | DEBUG    | __main__:trials:24 - Trial = 19269/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.519 | DEBUG    | __main__:trials:29 - Trial = 19269/30000 | Total reward = 36.75
2022-01-26 14:17:59.522 | DEBUG    | __main__:trials:26 - Trial = 19270/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.522 | DEBUG    | __main__:trials:29 - Trial = 19270/30000 | Total reward = 12.17
2022-01-26 14:17:59.525 | DEBUG    | __main__:trials:24 - Trial = 19271/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.527 | DEBUG    | __main__:trials:29 - Trial = 19271/30000 | Total reward = 36.32
2022-01-26 14:17:59.530 | DEBUG    | __main__:trials:26 - Trial = 19272/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.532 | DEBUG    | __main__:trials:29 - Trial = 19272/30000 | Total reward = 9.99
2022-01-26 14:17:59.534 | DEBUG    | __main__:trials:26 - Trial = 19273/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.535 | DEBUG    | __main__:trials:29 - Trial = 19273/30000 | Total reward = 9.99
2022-01-26 14:17:59.538 | DEBUG    | __main__:trials:26 - Trial = 19274/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.540 | DEBUG    | __main__:trials:29 - Trial = 19274/30000 | Total reward = 9.99
2022-01-26 14:17:59.542 | DEBUG    | __main__:trials:26 - Trial = 19275/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.543 | DEBUG    | __main__:trials:29 - Trial = 19275/30000 | Total reward = 9.99
2022-01-26 14:17:59.547 | DEBUG    | __main__:trials:24 - Trial = 19276/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.548 | DEBUG    | __main__:trials:29 - Trial = 19276/30000 | Total reward = 47.50
2022-01-26 14:17:59.553 | DEBUG    | __main__:trials:24 - Trial = 19277/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.554 | DEBUG    | __main__:trials:29 - Trial = 19277/30000 | Total reward = 1.45
2022-01-26 14:17:59.557 | DEBUG    | __main__:trials:26 - Trial = 19278/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.559 | DEBUG    | __main__:trials:29 - Trial = 19278/30000 | Total reward = 11.53
2022-01-26 14:17:59.563 | DEBUG    | __main__:trials:24 - Trial = 19279/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.563 | DEBUG    | __main__:trials:29 - Trial = 19279/30000 | Total reward = 45.55
2022-01-26 14:17:59.568 | DEBUG    | __main__:trials:24 - Trial = 19280/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.569 | DEBUG    | __main__:trials:29 - Trial = 19280/30000 | Total reward = 51.90
2022-01-26 14:17:59.573 | DEBUG    | __main__:trials:24 - Trial = 19281/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.574 | DEBUG    | __main__:trials:29 - Trial = 19281/30000 | Total reward = 32.82
2022-01-26 14:17:59.577 | DEBUG    | __main__:trials:26 - Trial = 19282/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.578 | DEBUG    | __main__:trials:29 - Trial = 19282/30000 | Total reward = 14.18
2022-01-26 14:17:59.580 | DEBUG    | __main__:trials:26 - Trial = 19283/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.580 | DEBUG    | __main__:trials:29 - Trial = 19283/30000 | Total reward = 9.99
2022-01-26 14:17:59.583 | DEBUG    | __main__:trials:26 - Trial = 19284/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.584 | DEBUG    | __main__:trials:29 - Trial = 19284/30000 | Total reward = 14.18
2022-01-26 14:17:59.588 | DEBUG    | __main__:trials:24 - Trial = 19285/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.589 | DEBUG    | __main__:trials:29 - Trial = 19285/30000 | Total reward = 24.51
2022-01-26 14:17:59.593 | DEBUG    | __main__:trials:26 - Trial = 19286/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.593 | DEBUG    | __main__:trials:29 - Trial = 19286/30000 | Total reward = 18.51
2022-01-26 14:17:59.598 | DEBUG    | __main__:trials:24 - Trial = 19287/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.598 | DEBUG    | __main__:trials:29 - Trial = 19287/30000 | Total reward = 8.99
2022-01-26 14:17:59.603 | DEBUG    | __main__:trials:24 - Trial = 19288/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.604 | DEBUG    | __main__:trials:29 - Trial = 19288/30000 | Total reward = 46.49
2022-01-26 14:17:59.607 | DEBUG    | __main__:trials:26 - Trial = 19289/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.608 | DEBUG    | __main__:trials:29 - Trial = 19289/30000 | Total reward = 17.88
2022-01-26 14:17:59.612 | DEBUG    | __main__:trials:24 - Trial = 19290/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.614 | DEBUG    | __main__:trials:29 - Trial = 19290/30000 | Total reward = 33.75
2022-01-26 14:17:59.616 | DEBUG    | __main__:trials:26 - Trial = 19291/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.617 | DEBUG    | __main__:trials:29 - Trial = 19291/30000 | Total reward = 16.30
2022-01-26 14:17:59.620 | DEBUG    | __main__:trials:26 - Trial = 19292/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.621 | DEBUG    | __main__:trials:29 - Trial = 19292/30000 | Total reward = 39.16
2022-01-26 14:17:59.625 | DEBUG    | __main__:trials:24 - Trial = 19293/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.626 | DEBUG    | __main__:trials:29 - Trial = 19293/30000 | Total reward = 52.56
2022-01-26 14:17:59.630 | DEBUG    | __main__:trials:24 - Trial = 19294/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.632 | DEBUG    | __main__:trials:29 - Trial = 19294/30000 | Total reward = 55.44
2022-01-26 14:17:59.633 | DEBUG    | __main__:trials:26 - Trial = 19295/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.635 | DEBUG    | __main__:trials:29 - Trial = 19295/30000 | Total reward = 8.99
2022-01-26 14:17:59.638 | DEBUG    | __main__:trials:24 - Trial = 19296/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.639 | DEBUG    | __main__:trials:29 - Trial = 19296/30000 | Total reward = 43.87
2022-01-26 14:17:59.641 | DEBUG    | __main__:trials:26 - Trial = 19297/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.643 | DEBUG    | __main__:trials:29 - Trial = 19297/30000 | Total reward = 12.86
2022-01-26 14:17:59.645 | DEBUG    | __main__:trials:26 - Trial = 19298/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.646 | DEBUG    | __main__:trials:29 - Trial = 19298/30000 | Total reward = 9.99
2022-01-26 14:17:59.649 | DEBUG    | __main__:trials:26 - Trial = 19299/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.649 | DEBUG    | __main__:trials:29 - Trial = 19299/30000 | Total reward = 14.18
2022-01-26 14:17:59.653 | DEBUG    | __main__:trials:24 - Trial = 19300/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.656 | DEBUG    | __main__:trials:29 - Trial = 19300/30000 | Total reward = 50.23
2022-01-26 14:17:59.658 | DEBUG    | __main__:trials:26 - Trial = 19301/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.660 | DEBUG    | __main__:trials:29 - Trial = 19301/30000 | Total reward = 9.99
2022-01-26 14:17:59.661 | DEBUG    | __main__:trials:26 - Trial = 19302/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.662 | DEBUG    | __main__:trials:29 - Trial = 19302/30000 | Total reward = 9.99
2022-01-26 14:17:59.665 | DEBUG    | __main__:trials:26 - Trial = 19303/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.666 | DEBUG    | __main__:trials:29 - Trial = 19303/30000 | Total reward = 29.90
2022-01-26 14:17:59.667 | DEBUG    | __main__:trials:26 - Trial = 19304/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.668 | DEBUG    | __main__:trials:29 - Trial = 19304/30000 | Total reward = 9.99
2022-01-26 14:17:59.670 | DEBUG    | __main__:trials:26 - Trial = 19305/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.671 | DEBUG    | __main__:trials:29 - Trial = 19305/30000 | Total reward = 7.41
2022-01-26 14:17:59.673 | DEBUG    | __main__:trials:26 - Trial = 19306/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.674 | DEBUG    | __main__:trials:29 - Trial = 19306/30000 | Total reward = 9.87
2022-01-26 14:17:59.677 | DEBUG    | __main__:trials:24 - Trial = 19307/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.679 | DEBUG    | __main__:trials:29 - Trial = 19307/30000 | Total reward = 50.03
2022-01-26 14:17:59.682 | DEBUG    | __main__:trials:24 - Trial = 19308/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.684 | DEBUG    | __main__:trials:29 - Trial = 19308/30000 | Total reward = 47.78
2022-01-26 14:17:59.687 | DEBUG    | __main__:trials:24 - Trial = 19309/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.688 | DEBUG    | __main__:trials:29 - Trial = 19309/30000 | Total reward = 38.59
2022-01-26 14:17:59.692 | DEBUG    | __main__:trials:24 - Trial = 19310/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.694 | DEBUG    | __main__:trials:29 - Trial = 19310/30000 | Total reward = 48.58
2022-01-26 14:17:59.698 | DEBUG    | __main__:trials:24 - Trial = 19311/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.698 | DEBUG    | __main__:trials:29 - Trial = 19311/30000 | Total reward = 50.76
2022-01-26 14:17:59.702 | DEBUG    | __main__:trials:24 - Trial = 19312/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.703 | DEBUG    | __main__:trials:29 - Trial = 19312/30000 | Total reward = 51.96
2022-01-26 14:17:59.705 | DEBUG    | __main__:trials:26 - Trial = 19313/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.707 | DEBUG    | __main__:trials:29 - Trial = 19313/30000 | Total reward = 9.99
2022-01-26 14:17:59.711 | DEBUG    | __main__:trials:24 - Trial = 19314/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.713 | DEBUG    | __main__:trials:29 - Trial = 19314/30000 | Total reward = 41.06
2022-01-26 14:17:59.715 | DEBUG    | __main__:trials:26 - Trial = 19315/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.717 | DEBUG    | __main__:trials:29 - Trial = 19315/30000 | Total reward = 9.99
2022-01-26 14:17:59.718 | DEBUG    | __main__:trials:26 - Trial = 19316/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.720 | DEBUG    | __main__:trials:29 - Trial = 19316/30000 | Total reward = 18.59
2022-01-26 14:17:59.722 | DEBUG    | __main__:trials:26 - Trial = 19317/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.723 | DEBUG    | __main__:trials:29 - Trial = 19317/30000 | Total reward = 9.99
2022-01-26 14:17:59.725 | DEBUG    | __main__:trials:26 - Trial = 19318/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.726 | DEBUG    | __main__:trials:29 - Trial = 19318/30000 | Total reward = 9.99
2022-01-26 14:17:59.729 | DEBUG    | __main__:trials:24 - Trial = 19319/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.730 | DEBUG    | __main__:trials:29 - Trial = 19319/30000 | Total reward = 51.54
2022-01-26 14:17:59.732 | DEBUG    | __main__:trials:26 - Trial = 19320/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.734 | DEBUG    | __main__:trials:29 - Trial = 19320/30000 | Total reward = 12.86
2022-01-26 14:17:59.736 | DEBUG    | __main__:trials:26 - Trial = 19321/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.738 | DEBUG    | __main__:trials:29 - Trial = 19321/30000 | Total reward = 9.99
2022-01-26 14:17:59.741 | DEBUG    | __main__:trials:26 - Trial = 19322/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.741 | DEBUG    | __main__:trials:29 - Trial = 19322/30000 | Total reward = 33.39
2022-01-26 14:17:59.746 | DEBUG    | __main__:trials:24 - Trial = 19323/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.747 | DEBUG    | __main__:trials:29 - Trial = 19323/30000 | Total reward = 32.74
2022-01-26 14:17:59.750 | DEBUG    | __main__:trials:26 - Trial = 19324/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.751 | DEBUG    | __main__:trials:29 - Trial = 19324/30000 | Total reward = 9.99
2022-01-26 14:17:59.754 | DEBUG    | __main__:trials:26 - Trial = 19325/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.755 | DEBUG    | __main__:trials:29 - Trial = 19325/30000 | Total reward = 9.99
2022-01-26 14:17:59.756 | DEBUG    | __main__:trials:26 - Trial = 19326/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.758 | DEBUG    | __main__:trials:29 - Trial = 19326/30000 | Total reward = 9.99
2022-01-26 14:17:59.761 | DEBUG    | __main__:trials:24 - Trial = 19327/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.763 | DEBUG    | __main__:trials:29 - Trial = 19327/30000 | Total reward = 27.49
2022-01-26 14:17:59.767 | DEBUG    | __main__:trials:24 - Trial = 19328/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.768 | DEBUG    | __main__:trials:29 - Trial = 19328/30000 | Total reward = 53.33
2022-01-26 14:17:59.771 | DEBUG    | __main__:trials:26 - Trial = 19329/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.772 | DEBUG    | __main__:trials:29 - Trial = 19329/30000 | Total reward = 9.99
2022-01-26 14:17:59.774 | DEBUG    | __main__:trials:26 - Trial = 19330/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.775 | DEBUG    | __main__:trials:29 - Trial = 19330/30000 | Total reward = 7.70
2022-01-26 14:17:59.777 | DEBUG    | __main__:trials:26 - Trial = 19331/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.779 | DEBUG    | __main__:trials:29 - Trial = 19331/30000 | Total reward = 12.86
2022-01-26 14:17:59.782 | DEBUG    | __main__:trials:24 - Trial = 19332/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.784 | DEBUG    | __main__:trials:29 - Trial = 19332/30000 | Total reward = 45.23
2022-01-26 14:17:59.787 | DEBUG    | __main__:trials:24 - Trial = 19333/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.790 | DEBUG    | __main__:trials:29 - Trial = 19333/30000 | Total reward = 40.25
2022-01-26 14:17:59.794 | DEBUG    | __main__:trials:24 - Trial = 19334/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.794 | DEBUG    | __main__:trials:29 - Trial = 19334/30000 | Total reward = 43.25
2022-01-26 14:17:59.796 | DEBUG    | __main__:trials:26 - Trial = 19335/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.798 | DEBUG    | __main__:trials:29 - Trial = 19335/30000 | Total reward = 9.99
2022-01-26 14:17:59.800 | DEBUG    | __main__:trials:26 - Trial = 19336/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.802 | DEBUG    | __main__:trials:29 - Trial = 19336/30000 | Total reward = 9.99
2022-01-26 14:17:59.803 | DEBUG    | __main__:trials:26 - Trial = 19337/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.806 | DEBUG    | __main__:trials:29 - Trial = 19337/30000 | Total reward = 9.99
2022-01-26 14:17:59.807 | DEBUG    | __main__:trials:26 - Trial = 19338/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.809 | DEBUG    | __main__:trials:29 - Trial = 19338/30000 | Total reward = 9.99
2022-01-26 14:17:59.811 | DEBUG    | __main__:trials:26 - Trial = 19339/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.813 | DEBUG    | __main__:trials:29 - Trial = 19339/30000 | Total reward = 28.63
2022-01-26 14:17:59.817 | DEBUG    | __main__:trials:24 - Trial = 19340/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.817 | DEBUG    | __main__:trials:29 - Trial = 19340/30000 | Total reward = 33.43
2022-01-26 14:17:59.821 | DEBUG    | __main__:trials:24 - Trial = 19341/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.822 | DEBUG    | __main__:trials:29 - Trial = 19341/30000 | Total reward = 40.28
2022-01-26 14:17:59.825 | DEBUG    | __main__:trials:24 - Trial = 19342/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.827 | DEBUG    | __main__:trials:29 - Trial = 19342/30000 | Total reward = 47.73
2022-01-26 14:17:59.831 | DEBUG    | __main__:trials:24 - Trial = 19343/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.832 | DEBUG    | __main__:trials:29 - Trial = 19343/30000 | Total reward = 63.11
2022-01-26 14:17:59.834 | DEBUG    | __main__:trials:26 - Trial = 19344/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.835 | DEBUG    | __main__:trials:29 - Trial = 19344/30000 | Total reward = 9.99
2022-01-26 14:17:59.839 | DEBUG    | __main__:trials:24 - Trial = 19345/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.840 | DEBUG    | __main__:trials:29 - Trial = 19345/30000 | Total reward = 47.17
2022-01-26 14:17:59.842 | DEBUG    | __main__:trials:26 - Trial = 19346/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.844 | DEBUG    | __main__:trials:29 - Trial = 19346/30000 | Total reward = 9.99
2022-01-26 14:17:59.846 | DEBUG    | __main__:trials:26 - Trial = 19347/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.846 | DEBUG    | __main__:trials:29 - Trial = 19347/30000 | Total reward = 9.99
2022-01-26 14:17:59.850 | DEBUG    | __main__:trials:26 - Trial = 19348/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.850 | DEBUG    | __main__:trials:29 - Trial = 19348/30000 | Total reward = 19.12
2022-01-26 14:17:59.852 | DEBUG    | __main__:trials:26 - Trial = 19349/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.854 | DEBUG    | __main__:trials:29 - Trial = 19349/30000 | Total reward = 7.12
2022-01-26 14:17:59.857 | DEBUG    | __main__:trials:26 - Trial = 19350/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.859 | DEBUG    | __main__:trials:29 - Trial = 19350/30000 | Total reward = 31.49
2022-01-26 14:17:59.861 | DEBUG    | __main__:trials:26 - Trial = 19351/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.862 | DEBUG    | __main__:trials:29 - Trial = 19351/30000 | Total reward = 9.99
2022-01-26 14:17:59.864 | DEBUG    | __main__:trials:26 - Trial = 19352/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.866 | DEBUG    | __main__:trials:29 - Trial = 19352/30000 | Total reward = 9.99
2022-01-26 14:17:59.870 | DEBUG    | __main__:trials:24 - Trial = 19353/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.870 | DEBUG    | __main__:trials:29 - Trial = 19353/30000 | Total reward = 51.51
2022-01-26 14:17:59.873 | DEBUG    | __main__:trials:26 - Trial = 19354/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.875 | DEBUG    | __main__:trials:29 - Trial = 19354/30000 | Total reward = 12.80
2022-01-26 14:17:59.878 | DEBUG    | __main__:trials:26 - Trial = 19355/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.880 | DEBUG    | __main__:trials:29 - Trial = 19355/30000 | Total reward = 1.99
2022-01-26 14:17:59.882 | DEBUG    | __main__:trials:26 - Trial = 19356/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.883 | DEBUG    | __main__:trials:29 - Trial = 19356/30000 | Total reward = 9.99
2022-01-26 14:17:59.887 | DEBUG    | __main__:trials:24 - Trial = 19357/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.889 | DEBUG    | __main__:trials:29 - Trial = 19357/30000 | Total reward = 49.75
2022-01-26 14:17:59.892 | DEBUG    | __main__:trials:24 - Trial = 19358/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.893 | DEBUG    | __main__:trials:29 - Trial = 19358/30000 | Total reward = 48.65
2022-01-26 14:17:59.895 | DEBUG    | __main__:trials:26 - Trial = 19359/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.897 | DEBUG    | __main__:trials:29 - Trial = 19359/30000 | Total reward = 10.11
2022-01-26 14:17:59.901 | DEBUG    | __main__:trials:24 - Trial = 19360/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.902 | DEBUG    | __main__:trials:29 - Trial = 19360/30000 | Total reward = 31.64
2022-01-26 14:17:59.905 | DEBUG    | __main__:trials:24 - Trial = 19361/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.906 | DEBUG    | __main__:trials:29 - Trial = 19361/30000 | Total reward = 49.53
2022-01-26 14:17:59.910 | DEBUG    | __main__:trials:24 - Trial = 19362/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.911 | DEBUG    | __main__:trials:29 - Trial = 19362/30000 | Total reward = 35.48
2022-01-26 14:17:59.914 | DEBUG    | __main__:trials:24 - Trial = 19363/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.917 | DEBUG    | __main__:trials:29 - Trial = 19363/30000 | Total reward = 51.64
2022-01-26 14:17:59.920 | DEBUG    | __main__:trials:24 - Trial = 19364/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.920 | DEBUG    | __main__:trials:29 - Trial = 19364/30000 | Total reward = 55.64
2022-01-26 14:17:59.924 | DEBUG    | __main__:trials:24 - Trial = 19365/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.925 | DEBUG    | __main__:trials:29 - Trial = 19365/30000 | Total reward = 42.20
2022-01-26 14:17:59.929 | DEBUG    | __main__:trials:24 - Trial = 19366/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.930 | DEBUG    | __main__:trials:29 - Trial = 19366/30000 | Total reward = 38.07
2022-01-26 14:17:59.934 | DEBUG    | __main__:trials:24 - Trial = 19367/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.936 | DEBUG    | __main__:trials:29 - Trial = 19367/30000 | Total reward = 36.33
2022-01-26 14:17:59.939 | DEBUG    | __main__:trials:24 - Trial = 19368/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.941 | DEBUG    | __main__:trials:29 - Trial = 19368/30000 | Total reward = 52.75
2022-01-26 14:17:59.943 | DEBUG    | __main__:trials:26 - Trial = 19369/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.945 | DEBUG    | __main__:trials:29 - Trial = 19369/30000 | Total reward = 13.16
2022-01-26 14:17:59.946 | DEBUG    | __main__:trials:26 - Trial = 19370/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.948 | DEBUG    | __main__:trials:29 - Trial = 19370/30000 | Total reward = 9.99
2022-01-26 14:17:59.950 | DEBUG    | __main__:trials:26 - Trial = 19371/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.951 | DEBUG    | __main__:trials:29 - Trial = 19371/30000 | Total reward = 9.99
2022-01-26 14:17:59.953 | DEBUG    | __main__:trials:26 - Trial = 19372/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.955 | DEBUG    | __main__:trials:29 - Trial = 19372/30000 | Total reward = 9.99
2022-01-26 14:17:59.958 | DEBUG    | __main__:trials:26 - Trial = 19373/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.960 | DEBUG    | __main__:trials:29 - Trial = 19373/30000 | Total reward = 43.95
2022-01-26 14:17:59.962 | DEBUG    | __main__:trials:26 - Trial = 19374/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.963 | DEBUG    | __main__:trials:29 - Trial = 19374/30000 | Total reward = 13.39
2022-01-26 14:17:59.965 | DEBUG    | __main__:trials:26 - Trial = 19375/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.966 | DEBUG    | __main__:trials:29 - Trial = 19375/30000 | Total reward = 9.99
2022-01-26 14:17:59.969 | DEBUG    | __main__:trials:26 - Trial = 19376/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.970 | DEBUG    | __main__:trials:29 - Trial = 19376/30000 | Total reward = 16.39
2022-01-26 14:17:59.973 | DEBUG    | __main__:trials:26 - Trial = 19377/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.974 | DEBUG    | __main__:trials:29 - Trial = 19377/30000 | Total reward = 24.04
2022-01-26 14:17:59.977 | DEBUG    | __main__:trials:26 - Trial = 19378/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.979 | DEBUG    | __main__:trials:29 - Trial = 19378/30000 | Total reward = 19.62
2022-01-26 14:17:59.982 | DEBUG    | __main__:trials:26 - Trial = 19379/30000 | Agent went out of bounds, resetting
2022-01-26 14:17:59.983 | DEBUG    | __main__:trials:29 - Trial = 19379/30000 | Total reward = 21.52
2022-01-26 14:17:59.987 | DEBUG    | __main__:trials:24 - Trial = 19380/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.988 | DEBUG    | __main__:trials:29 - Trial = 19380/30000 | Total reward = 24.33
2022-01-26 14:17:59.992 | DEBUG    | __main__:trials:24 - Trial = 19381/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.994 | DEBUG    | __main__:trials:29 - Trial = 19381/30000 | Total reward = 50.81
2022-01-26 14:17:59.997 | DEBUG    | __main__:trials:24 - Trial = 19382/30000 | Max number of steps (20) reached
2022-01-26 14:17:59.999 | DEBUG    | __main__:trials:29 - Trial = 19382/30000 | Total reward = 47.11
2022-01-26 14:18:00.003 | DEBUG    | __main__:trials:24 - Trial = 19383/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.004 | DEBUG    | __main__:trials:29 - Trial = 19383/30000 | Total reward = 42.34
2022-01-26 14:18:00.007 | DEBUG    | __main__:trials:26 - Trial = 19384/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.008 | DEBUG    | __main__:trials:29 - Trial = 19384/30000 | Total reward = 9.99
2022-01-26 14:18:00.011 | DEBUG    | __main__:trials:26 - Trial = 19385/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.012 | DEBUG    | __main__:trials:29 - Trial = 19385/30000 | Total reward = 9.99
2022-01-26 14:18:00.014 | DEBUG    | __main__:trials:26 - Trial = 19386/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.014 | DEBUG    | __main__:trials:29 - Trial = 19386/30000 | Total reward = 9.99
2022-01-26 14:18:00.016 | DEBUG    | __main__:trials:26 - Trial = 19387/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.018 | DEBUG    | __main__:trials:29 - Trial = 19387/30000 | Total reward = 9.99
2022-01-26 14:18:00.020 | DEBUG    | __main__:trials:26 - Trial = 19388/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.023 | DEBUG    | __main__:trials:29 - Trial = 19388/30000 | Total reward = 9.87
2022-01-26 14:18:00.026 | DEBUG    | __main__:trials:24 - Trial = 19389/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.027 | DEBUG    | __main__:trials:29 - Trial = 19389/30000 | Total reward = 51.08
2022-01-26 14:18:00.029 | DEBUG    | __main__:trials:26 - Trial = 19390/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.030 | DEBUG    | __main__:trials:29 - Trial = 19390/30000 | Total reward = 10.25
2022-01-26 14:18:00.032 | DEBUG    | __main__:trials:26 - Trial = 19391/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.034 | DEBUG    | __main__:trials:29 - Trial = 19391/30000 | Total reward = 9.99
2022-01-26 14:18:00.036 | DEBUG    | __main__:trials:26 - Trial = 19392/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.037 | DEBUG    | __main__:trials:29 - Trial = 19392/30000 | Total reward = 9.99
2022-01-26 14:18:00.041 | DEBUG    | __main__:trials:24 - Trial = 19393/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.042 | DEBUG    | __main__:trials:29 - Trial = 19393/30000 | Total reward = 43.66
2022-01-26 14:18:00.046 | DEBUG    | __main__:trials:24 - Trial = 19394/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.047 | DEBUG    | __main__:trials:29 - Trial = 19394/30000 | Total reward = 35.46
2022-01-26 14:18:00.049 | DEBUG    | __main__:trials:26 - Trial = 19395/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.049 | DEBUG    | __main__:trials:29 - Trial = 19395/30000 | Total reward = 9.99
2022-01-26 14:18:00.053 | DEBUG    | __main__:trials:26 - Trial = 19396/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.054 | DEBUG    | __main__:trials:29 - Trial = 19396/30000 | Total reward = 29.33
2022-01-26 14:18:00.057 | DEBUG    | __main__:trials:26 - Trial = 19397/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.058 | DEBUG    | __main__:trials:29 - Trial = 19397/30000 | Total reward = 20.05
2022-01-26 14:18:00.060 | DEBUG    | __main__:trials:26 - Trial = 19398/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.061 | DEBUG    | __main__:trials:29 - Trial = 19398/30000 | Total reward = 9.99
2022-01-26 14:18:00.064 | DEBUG    | __main__:trials:24 - Trial = 19399/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.065 | DEBUG    | __main__:trials:29 - Trial = 19399/30000 | Total reward = 46.20
2022-01-26 14:18:00.066 | DEBUG    | __main__:trials:26 - Trial = 19400/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.067 | DEBUG    | __main__:trials:29 - Trial = 19400/30000 | Total reward = 9.99
2022-01-26 14:18:00.070 | DEBUG    | __main__:trials:24 - Trial = 19401/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.071 | DEBUG    | __main__:trials:29 - Trial = 19401/30000 | Total reward = 28.61
2022-01-26 14:18:00.075 | DEBUG    | __main__:trials:24 - Trial = 19402/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.075 | DEBUG    | __main__:trials:29 - Trial = 19402/30000 | Total reward = 42.47
2022-01-26 14:18:00.080 | DEBUG    | __main__:trials:24 - Trial = 19403/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.080 | DEBUG    | __main__:trials:29 - Trial = 19403/30000 | Total reward = 38.09
2022-01-26 14:18:00.087 | DEBUG    | __main__:trials:24 - Trial = 19404/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.089 | DEBUG    | __main__:trials:29 - Trial = 19404/30000 | Total reward = 42.25
2022-01-26 14:18:00.091 | DEBUG    | __main__:trials:26 - Trial = 19405/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.093 | DEBUG    | __main__:trials:29 - Trial = 19405/30000 | Total reward = 22.07
2022-01-26 14:18:00.097 | DEBUG    | __main__:trials:24 - Trial = 19406/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.099 | DEBUG    | __main__:trials:29 - Trial = 19406/30000 | Total reward = 43.50
2022-01-26 14:18:00.102 | DEBUG    | __main__:trials:24 - Trial = 19407/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.104 | DEBUG    | __main__:trials:29 - Trial = 19407/30000 | Total reward = 40.66
2022-01-26 14:18:00.108 | DEBUG    | __main__:trials:24 - Trial = 19408/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.108 | DEBUG    | __main__:trials:29 - Trial = 19408/30000 | Total reward = 48.48
2022-01-26 14:18:00.113 | DEBUG    | __main__:trials:24 - Trial = 19409/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.114 | DEBUG    | __main__:trials:29 - Trial = 19409/30000 | Total reward = 23.36
2022-01-26 14:18:00.117 | DEBUG    | __main__:trials:24 - Trial = 19410/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.118 | DEBUG    | __main__:trials:29 - Trial = 19410/30000 | Total reward = 39.91
2022-01-26 14:18:00.121 | DEBUG    | __main__:trials:24 - Trial = 19411/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.123 | DEBUG    | __main__:trials:29 - Trial = 19411/30000 | Total reward = 50.12
2022-01-26 14:18:00.124 | DEBUG    | __main__:trials:26 - Trial = 19412/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.125 | DEBUG    | __main__:trials:29 - Trial = 19412/30000 | Total reward = 7.57
2022-01-26 14:18:00.127 | DEBUG    | __main__:trials:26 - Trial = 19413/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.129 | DEBUG    | __main__:trials:29 - Trial = 19413/30000 | Total reward = 9.99
2022-01-26 14:18:00.132 | DEBUG    | __main__:trials:24 - Trial = 19414/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.132 | DEBUG    | __main__:trials:29 - Trial = 19414/30000 | Total reward = 48.07
2022-01-26 14:18:00.135 | DEBUG    | __main__:trials:26 - Trial = 19415/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.136 | DEBUG    | __main__:trials:29 - Trial = 19415/30000 | Total reward = 13.16
2022-01-26 14:18:00.138 | DEBUG    | __main__:trials:26 - Trial = 19416/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.140 | DEBUG    | __main__:trials:29 - Trial = 19416/30000 | Total reward = 7.70
2022-01-26 14:18:00.142 | DEBUG    | __main__:trials:26 - Trial = 19417/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.143 | DEBUG    | __main__:trials:29 - Trial = 19417/30000 | Total reward = 20.62
2022-01-26 14:18:00.146 | DEBUG    | __main__:trials:26 - Trial = 19418/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.148 | DEBUG    | __main__:trials:29 - Trial = 19418/30000 | Total reward = 23.93
2022-01-26 14:18:00.151 | DEBUG    | __main__:trials:24 - Trial = 19419/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.153 | DEBUG    | __main__:trials:29 - Trial = 19419/30000 | Total reward = 51.54
2022-01-26 14:18:00.156 | DEBUG    | __main__:trials:24 - Trial = 19420/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.158 | DEBUG    | __main__:trials:29 - Trial = 19420/30000 | Total reward = 53.35
2022-01-26 14:18:00.161 | DEBUG    | __main__:trials:24 - Trial = 19421/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.162 | DEBUG    | __main__:trials:29 - Trial = 19421/30000 | Total reward = 51.91
2022-01-26 14:18:00.166 | DEBUG    | __main__:trials:24 - Trial = 19422/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.168 | DEBUG    | __main__:trials:29 - Trial = 19422/30000 | Total reward = 51.28
2022-01-26 14:18:00.172 | DEBUG    | __main__:trials:24 - Trial = 19423/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.173 | DEBUG    | __main__:trials:29 - Trial = 19423/30000 | Total reward = 35.76
2022-01-26 14:18:00.177 | DEBUG    | __main__:trials:24 - Trial = 19424/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.178 | DEBUG    | __main__:trials:29 - Trial = 19424/30000 | Total reward = 57.42
2022-01-26 14:18:00.182 | DEBUG    | __main__:trials:24 - Trial = 19425/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.184 | DEBUG    | __main__:trials:29 - Trial = 19425/30000 | Total reward = 38.67
2022-01-26 14:18:00.188 | DEBUG    | __main__:trials:24 - Trial = 19426/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.189 | DEBUG    | __main__:trials:29 - Trial = 19426/30000 | Total reward = 57.70
2022-01-26 14:18:00.192 | DEBUG    | __main__:trials:26 - Trial = 19427/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.193 | DEBUG    | __main__:trials:29 - Trial = 19427/30000 | Total reward = 36.04
2022-01-26 14:18:00.196 | DEBUG    | __main__:trials:26 - Trial = 19428/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.198 | DEBUG    | __main__:trials:29 - Trial = 19428/30000 | Total reward = 7.12
2022-01-26 14:18:00.202 | DEBUG    | __main__:trials:24 - Trial = 19429/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.203 | DEBUG    | __main__:trials:29 - Trial = 19429/30000 | Total reward = 45.00
2022-01-26 14:18:00.206 | DEBUG    | __main__:trials:26 - Trial = 19430/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.208 | DEBUG    | __main__:trials:29 - Trial = 19430/30000 | Total reward = 38.51
2022-01-26 14:18:00.212 | DEBUG    | __main__:trials:24 - Trial = 19431/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.212 | DEBUG    | __main__:trials:29 - Trial = 19431/30000 | Total reward = 52.26
2022-01-26 14:18:00.216 | DEBUG    | __main__:trials:24 - Trial = 19432/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.218 | DEBUG    | __main__:trials:29 - Trial = 19432/30000 | Total reward = 51.82
2022-01-26 14:18:00.222 | DEBUG    | __main__:trials:24 - Trial = 19433/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.224 | DEBUG    | __main__:trials:29 - Trial = 19433/30000 | Total reward = 60.95
2022-01-26 14:18:00.227 | DEBUG    | __main__:trials:24 - Trial = 19434/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.229 | DEBUG    | __main__:trials:29 - Trial = 19434/30000 | Total reward = 58.42
2022-01-26 14:18:00.232 | DEBUG    | __main__:trials:24 - Trial = 19435/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.233 | DEBUG    | __main__:trials:29 - Trial = 19435/30000 | Total reward = 52.33
2022-01-26 14:18:00.238 | DEBUG    | __main__:trials:24 - Trial = 19436/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.239 | DEBUG    | __main__:trials:29 - Trial = 19436/30000 | Total reward = 47.94
2022-01-26 14:18:00.243 | DEBUG    | __main__:trials:24 - Trial = 19437/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.244 | DEBUG    | __main__:trials:29 - Trial = 19437/30000 | Total reward = 52.24
2022-01-26 14:18:00.248 | DEBUG    | __main__:trials:24 - Trial = 19438/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.250 | DEBUG    | __main__:trials:29 - Trial = 19438/30000 | Total reward = 40.27
2022-01-26 14:18:00.253 | DEBUG    | __main__:trials:26 - Trial = 19439/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.254 | DEBUG    | __main__:trials:29 - Trial = 19439/30000 | Total reward = 29.66
2022-01-26 14:18:00.257 | DEBUG    | __main__:trials:24 - Trial = 19440/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.258 | DEBUG    | __main__:trials:29 - Trial = 19440/30000 | Total reward = 51.54
2022-01-26 14:18:00.261 | DEBUG    | __main__:trials:24 - Trial = 19441/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.263 | DEBUG    | __main__:trials:29 - Trial = 19441/30000 | Total reward = 48.66
2022-01-26 14:18:00.266 | DEBUG    | __main__:trials:24 - Trial = 19442/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.267 | DEBUG    | __main__:trials:29 - Trial = 19442/30000 | Total reward = 52.34
2022-01-26 14:18:00.270 | DEBUG    | __main__:trials:24 - Trial = 19443/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.271 | DEBUG    | __main__:trials:29 - Trial = 19443/30000 | Total reward = 51.12
2022-01-26 14:18:00.274 | DEBUG    | __main__:trials:24 - Trial = 19444/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.277 | DEBUG    | __main__:trials:29 - Trial = 19444/30000 | Total reward = 43.85
2022-01-26 14:18:00.280 | DEBUG    | __main__:trials:24 - Trial = 19445/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.282 | DEBUG    | __main__:trials:29 - Trial = 19445/30000 | Total reward = 53.27
2022-01-26 14:18:00.285 | DEBUG    | __main__:trials:24 - Trial = 19446/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.286 | DEBUG    | __main__:trials:29 - Trial = 19446/30000 | Total reward = 57.42
2022-01-26 14:18:00.289 | DEBUG    | __main__:trials:24 - Trial = 19447/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.291 | DEBUG    | __main__:trials:29 - Trial = 19447/30000 | Total reward = 53.13
2022-01-26 14:18:00.295 | DEBUG    | __main__:trials:24 - Trial = 19448/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.296 | DEBUG    | __main__:trials:29 - Trial = 19448/30000 | Total reward = 52.65
2022-01-26 14:18:00.300 | DEBUG    | __main__:trials:24 - Trial = 19449/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.302 | DEBUG    | __main__:trials:29 - Trial = 19449/30000 | Total reward = 52.10
2022-01-26 14:18:00.305 | DEBUG    | __main__:trials:24 - Trial = 19450/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.306 | DEBUG    | __main__:trials:29 - Trial = 19450/30000 | Total reward = 50.20
2022-01-26 14:18:00.311 | DEBUG    | __main__:trials:24 - Trial = 19451/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.312 | DEBUG    | __main__:trials:29 - Trial = 19451/30000 | Total reward = 56.98
2022-01-26 14:18:00.316 | DEBUG    | __main__:trials:24 - Trial = 19452/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.318 | DEBUG    | __main__:trials:29 - Trial = 19452/30000 | Total reward = 51.99
2022-01-26 14:18:00.322 | DEBUG    | __main__:trials:24 - Trial = 19453/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.323 | DEBUG    | __main__:trials:29 - Trial = 19453/30000 | Total reward = 53.45
2022-01-26 14:18:00.328 | DEBUG    | __main__:trials:24 - Trial = 19454/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.329 | DEBUG    | __main__:trials:29 - Trial = 19454/30000 | Total reward = 53.57
2022-01-26 14:18:00.333 | DEBUG    | __main__:trials:24 - Trial = 19455/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.335 | DEBUG    | __main__:trials:29 - Trial = 19455/30000 | Total reward = 38.68
2022-01-26 14:18:00.338 | DEBUG    | __main__:trials:26 - Trial = 19456/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.339 | DEBUG    | __main__:trials:29 - Trial = 19456/30000 | Total reward = 9.27
2022-01-26 14:18:00.343 | DEBUG    | __main__:trials:24 - Trial = 19457/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.345 | DEBUG    | __main__:trials:29 - Trial = 19457/30000 | Total reward = 47.45
2022-01-26 14:18:00.348 | DEBUG    | __main__:trials:26 - Trial = 19458/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.349 | DEBUG    | __main__:trials:29 - Trial = 19458/30000 | Total reward = 22.28
2022-01-26 14:18:00.351 | DEBUG    | __main__:trials:26 - Trial = 19459/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.353 | DEBUG    | __main__:trials:29 - Trial = 19459/30000 | Total reward = 7.70
2022-01-26 14:18:00.355 | DEBUG    | __main__:trials:26 - Trial = 19460/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.356 | DEBUG    | __main__:trials:29 - Trial = 19460/30000 | Total reward = 10.11
2022-01-26 14:18:00.360 | DEBUG    | __main__:trials:24 - Trial = 19461/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.361 | DEBUG    | __main__:trials:29 - Trial = 19461/30000 | Total reward = 52.13
2022-01-26 14:18:00.365 | DEBUG    | __main__:trials:24 - Trial = 19462/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.367 | DEBUG    | __main__:trials:29 - Trial = 19462/30000 | Total reward = 36.62
2022-01-26 14:18:00.371 | DEBUG    | __main__:trials:24 - Trial = 19463/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.372 | DEBUG    | __main__:trials:29 - Trial = 19463/30000 | Total reward = 36.54
2022-01-26 14:18:00.376 | DEBUG    | __main__:trials:24 - Trial = 19464/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.377 | DEBUG    | __main__:trials:29 - Trial = 19464/30000 | Total reward = 46.83
2022-01-26 14:18:00.381 | DEBUG    | __main__:trials:24 - Trial = 19465/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.382 | DEBUG    | __main__:trials:29 - Trial = 19465/30000 | Total reward = 57.91
2022-01-26 14:18:00.385 | DEBUG    | __main__:trials:24 - Trial = 19466/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.387 | DEBUG    | __main__:trials:29 - Trial = 19466/30000 | Total reward = 44.38
2022-01-26 14:18:00.390 | DEBUG    | __main__:trials:24 - Trial = 19467/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.391 | DEBUG    | __main__:trials:29 - Trial = 19467/30000 | Total reward = 37.10
2022-01-26 14:18:00.395 | DEBUG    | __main__:trials:24 - Trial = 19468/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.396 | DEBUG    | __main__:trials:29 - Trial = 19468/30000 | Total reward = 47.57
2022-01-26 14:18:00.400 | DEBUG    | __main__:trials:24 - Trial = 19469/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.402 | DEBUG    | __main__:trials:29 - Trial = 19469/30000 | Total reward = 38.22
2022-01-26 14:18:00.406 | DEBUG    | __main__:trials:24 - Trial = 19470/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.407 | DEBUG    | __main__:trials:29 - Trial = 19470/30000 | Total reward = 37.91
2022-01-26 14:18:00.410 | DEBUG    | __main__:trials:26 - Trial = 19471/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.412 | DEBUG    | __main__:trials:29 - Trial = 19471/30000 | Total reward = 22.03
2022-01-26 14:18:00.415 | DEBUG    | __main__:trials:26 - Trial = 19472/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.416 | DEBUG    | __main__:trials:29 - Trial = 19472/30000 | Total reward = 18.09
2022-01-26 14:18:00.418 | DEBUG    | __main__:trials:26 - Trial = 19473/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.420 | DEBUG    | __main__:trials:29 - Trial = 19473/30000 | Total reward = 7.12
2022-01-26 14:18:00.422 | DEBUG    | __main__:trials:26 - Trial = 19474/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.424 | DEBUG    | __main__:trials:29 - Trial = 19474/30000 | Total reward = 21.20
2022-01-26 14:18:00.427 | DEBUG    | __main__:trials:24 - Trial = 19475/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.429 | DEBUG    | __main__:trials:29 - Trial = 19475/30000 | Total reward = 50.82
2022-01-26 14:18:00.432 | DEBUG    | __main__:trials:24 - Trial = 19476/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.434 | DEBUG    | __main__:trials:29 - Trial = 19476/30000 | Total reward = 50.68
2022-01-26 14:18:00.438 | DEBUG    | __main__:trials:24 - Trial = 19477/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.438 | DEBUG    | __main__:trials:29 - Trial = 19477/30000 | Total reward = 43.09
2022-01-26 14:18:00.441 | DEBUG    | __main__:trials:26 - Trial = 19478/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.443 | DEBUG    | __main__:trials:29 - Trial = 19478/30000 | Total reward = 9.99
2022-01-26 14:18:00.445 | DEBUG    | __main__:trials:24 - Trial = 19479/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.447 | DEBUG    | __main__:trials:29 - Trial = 19479/30000 | Total reward = 47.78
2022-01-26 14:18:00.451 | DEBUG    | __main__:trials:24 - Trial = 19480/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.453 | DEBUG    | __main__:trials:29 - Trial = 19480/30000 | Total reward = 51.16
2022-01-26 14:18:00.456 | DEBUG    | __main__:trials:24 - Trial = 19481/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.458 | DEBUG    | __main__:trials:29 - Trial = 19481/30000 | Total reward = 53.29
2022-01-26 14:18:00.462 | DEBUG    | __main__:trials:24 - Trial = 19482/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.463 | DEBUG    | __main__:trials:29 - Trial = 19482/30000 | Total reward = 52.24
2022-01-26 14:18:00.467 | DEBUG    | __main__:trials:24 - Trial = 19483/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.468 | DEBUG    | __main__:trials:29 - Trial = 19483/30000 | Total reward = 52.26
2022-01-26 14:18:00.471 | DEBUG    | __main__:trials:24 - Trial = 19484/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.473 | DEBUG    | __main__:trials:29 - Trial = 19484/30000 | Total reward = 46.44
2022-01-26 14:18:00.476 | DEBUG    | __main__:trials:26 - Trial = 19485/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.478 | DEBUG    | __main__:trials:29 - Trial = 19485/30000 | Total reward = 43.66
2022-01-26 14:18:00.481 | DEBUG    | __main__:trials:24 - Trial = 19486/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.482 | DEBUG    | __main__:trials:29 - Trial = 19486/30000 | Total reward = 33.51
2022-01-26 14:18:00.485 | DEBUG    | __main__:trials:24 - Trial = 19487/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.486 | DEBUG    | __main__:trials:29 - Trial = 19487/30000 | Total reward = 51.13
2022-01-26 14:18:00.490 | DEBUG    | __main__:trials:24 - Trial = 19488/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.492 | DEBUG    | __main__:trials:29 - Trial = 19488/30000 | Total reward = 47.12
2022-01-26 14:18:00.495 | DEBUG    | __main__:trials:24 - Trial = 19489/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.496 | DEBUG    | __main__:trials:29 - Trial = 19489/30000 | Total reward = 53.09
2022-01-26 14:18:00.499 | DEBUG    | __main__:trials:24 - Trial = 19490/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.501 | DEBUG    | __main__:trials:29 - Trial = 19490/30000 | Total reward = 53.94
2022-01-26 14:18:00.505 | DEBUG    | __main__:trials:24 - Trial = 19491/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.507 | DEBUG    | __main__:trials:29 - Trial = 19491/30000 | Total reward = 49.67
2022-01-26 14:18:00.509 | DEBUG    | __main__:trials:26 - Trial = 19492/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.510 | DEBUG    | __main__:trials:29 - Trial = 19492/30000 | Total reward = 2.12
2022-01-26 14:18:00.514 | DEBUG    | __main__:trials:24 - Trial = 19493/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.516 | DEBUG    | __main__:trials:29 - Trial = 19493/30000 | Total reward = 49.83
2022-01-26 14:18:00.519 | DEBUG    | __main__:trials:24 - Trial = 19494/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.521 | DEBUG    | __main__:trials:29 - Trial = 19494/30000 | Total reward = 45.79
2022-01-26 14:18:00.524 | DEBUG    | __main__:trials:24 - Trial = 19495/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.526 | DEBUG    | __main__:trials:29 - Trial = 19495/30000 | Total reward = 50.16
2022-01-26 14:18:00.530 | DEBUG    | __main__:trials:26 - Trial = 19496/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.531 | DEBUG    | __main__:trials:29 - Trial = 19496/30000 | Total reward = 37.55
2022-01-26 14:18:00.534 | DEBUG    | __main__:trials:24 - Trial = 19497/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.536 | DEBUG    | __main__:trials:29 - Trial = 19497/30000 | Total reward = 60.60
2022-01-26 14:18:00.540 | DEBUG    | __main__:trials:24 - Trial = 19498/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.542 | DEBUG    | __main__:trials:29 - Trial = 19498/30000 | Total reward = 50.16
2022-01-26 14:18:00.545 | DEBUG    | __main__:trials:24 - Trial = 19499/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.547 | DEBUG    | __main__:trials:29 - Trial = 19499/30000 | Total reward = 53.94
2022-01-26 14:18:00.551 | DEBUG    | __main__:trials:24 - Trial = 19500/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.551 | DEBUG    | __main__:trials:29 - Trial = 19500/30000 | Total reward = 44.31
2022-01-26 14:18:00.556 | DEBUG    | __main__:trials:24 - Trial = 19501/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.557 | DEBUG    | __main__:trials:29 - Trial = 19501/30000 | Total reward = 42.77
2022-01-26 14:18:00.561 | DEBUG    | __main__:trials:24 - Trial = 19502/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.563 | DEBUG    | __main__:trials:29 - Trial = 19502/30000 | Total reward = 47.85
2022-01-26 14:18:00.566 | DEBUG    | __main__:trials:24 - Trial = 19503/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.567 | DEBUG    | __main__:trials:29 - Trial = 19503/30000 | Total reward = 48.44
2022-01-26 14:18:00.570 | DEBUG    | __main__:trials:24 - Trial = 19504/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.572 | DEBUG    | __main__:trials:29 - Trial = 19504/30000 | Total reward = 52.63
2022-01-26 14:18:00.574 | DEBUG    | __main__:trials:24 - Trial = 19505/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.576 | DEBUG    | __main__:trials:29 - Trial = 19505/30000 | Total reward = 50.53
2022-01-26 14:18:00.580 | DEBUG    | __main__:trials:24 - Trial = 19506/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.581 | DEBUG    | __main__:trials:29 - Trial = 19506/30000 | Total reward = 47.68
2022-01-26 14:18:00.584 | DEBUG    | __main__:trials:24 - Trial = 19507/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.586 | DEBUG    | __main__:trials:29 - Trial = 19507/30000 | Total reward = 51.32
2022-01-26 14:18:00.588 | DEBUG    | __main__:trials:26 - Trial = 19508/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.590 | DEBUG    | __main__:trials:29 - Trial = 19508/30000 | Total reward = 23.06
2022-01-26 14:18:00.594 | DEBUG    | __main__:trials:24 - Trial = 19509/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.595 | DEBUG    | __main__:trials:29 - Trial = 19509/30000 | Total reward = 50.37
2022-01-26 14:18:00.598 | DEBUG    | __main__:trials:26 - Trial = 19510/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.599 | DEBUG    | __main__:trials:29 - Trial = 19510/30000 | Total reward = 9.99
2022-01-26 14:18:00.602 | DEBUG    | __main__:trials:24 - Trial = 19511/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.605 | DEBUG    | __main__:trials:29 - Trial = 19511/30000 | Total reward = 52.56
2022-01-26 14:18:00.608 | DEBUG    | __main__:trials:24 - Trial = 19512/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.610 | DEBUG    | __main__:trials:29 - Trial = 19512/30000 | Total reward = 51.95
2022-01-26 14:18:00.614 | DEBUG    | __main__:trials:24 - Trial = 19513/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.614 | DEBUG    | __main__:trials:29 - Trial = 19513/30000 | Total reward = 29.40
2022-01-26 14:18:00.619 | DEBUG    | __main__:trials:24 - Trial = 19514/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.620 | DEBUG    | __main__:trials:29 - Trial = 19514/30000 | Total reward = 47.91
2022-01-26 14:18:00.624 | DEBUG    | __main__:trials:24 - Trial = 19515/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.626 | DEBUG    | __main__:trials:29 - Trial = 19515/30000 | Total reward = 50.29
2022-01-26 14:18:00.630 | DEBUG    | __main__:trials:24 - Trial = 19516/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.630 | DEBUG    | __main__:trials:29 - Trial = 19516/30000 | Total reward = 52.27
2022-01-26 14:18:00.635 | DEBUG    | __main__:trials:24 - Trial = 19517/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.636 | DEBUG    | __main__:trials:29 - Trial = 19517/30000 | Total reward = 51.62
2022-01-26 14:18:00.640 | DEBUG    | __main__:trials:24 - Trial = 19518/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.642 | DEBUG    | __main__:trials:29 - Trial = 19518/30000 | Total reward = 47.28
2022-01-26 14:18:00.646 | DEBUG    | __main__:trials:24 - Trial = 19519/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.648 | DEBUG    | __main__:trials:29 - Trial = 19519/30000 | Total reward = 51.72
2022-01-26 14:18:00.652 | DEBUG    | __main__:trials:24 - Trial = 19520/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.653 | DEBUG    | __main__:trials:29 - Trial = 19520/30000 | Total reward = 52.12
2022-01-26 14:18:00.657 | DEBUG    | __main__:trials:24 - Trial = 19521/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.659 | DEBUG    | __main__:trials:29 - Trial = 19521/30000 | Total reward = 50.72
2022-01-26 14:18:00.663 | DEBUG    | __main__:trials:26 - Trial = 19522/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.665 | DEBUG    | __main__:trials:29 - Trial = 19522/30000 | Total reward = 33.86
2022-01-26 14:18:00.669 | DEBUG    | __main__:trials:24 - Trial = 19523/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.670 | DEBUG    | __main__:trials:29 - Trial = 19523/30000 | Total reward = 47.57
2022-01-26 14:18:00.674 | DEBUG    | __main__:trials:26 - Trial = 19524/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.675 | DEBUG    | __main__:trials:29 - Trial = 19524/30000 | Total reward = 16.40
2022-01-26 14:18:00.677 | DEBUG    | __main__:trials:26 - Trial = 19525/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.678 | DEBUG    | __main__:trials:29 - Trial = 19525/30000 | Total reward = 13.09
2022-01-26 14:18:00.681 | DEBUG    | __main__:trials:24 - Trial = 19526/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.683 | DEBUG    | __main__:trials:29 - Trial = 19526/30000 | Total reward = 38.71
2022-01-26 14:18:00.686 | DEBUG    | __main__:trials:24 - Trial = 19527/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.687 | DEBUG    | __main__:trials:29 - Trial = 19527/30000 | Total reward = 51.18
2022-01-26 14:18:00.691 | DEBUG    | __main__:trials:24 - Trial = 19528/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.692 | DEBUG    | __main__:trials:29 - Trial = 19528/30000 | Total reward = 52.13
2022-01-26 14:18:00.696 | DEBUG    | __main__:trials:24 - Trial = 19529/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.698 | DEBUG    | __main__:trials:29 - Trial = 19529/30000 | Total reward = 51.94
2022-01-26 14:18:00.701 | DEBUG    | __main__:trials:26 - Trial = 19530/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.702 | DEBUG    | __main__:trials:29 - Trial = 19530/30000 | Total reward = 16.20
2022-01-26 14:18:00.706 | DEBUG    | __main__:trials:24 - Trial = 19531/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.707 | DEBUG    | __main__:trials:29 - Trial = 19531/30000 | Total reward = 53.55
2022-01-26 14:18:00.711 | DEBUG    | __main__:trials:24 - Trial = 19532/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.713 | DEBUG    | __main__:trials:29 - Trial = 19532/30000 | Total reward = 51.94
2022-01-26 14:18:00.717 | DEBUG    | __main__:trials:26 - Trial = 19533/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.717 | DEBUG    | __main__:trials:29 - Trial = 19533/30000 | Total reward = 33.52
2022-01-26 14:18:00.722 | DEBUG    | __main__:trials:24 - Trial = 19534/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.723 | DEBUG    | __main__:trials:29 - Trial = 19534/30000 | Total reward = 51.66
2022-01-26 14:18:00.727 | DEBUG    | __main__:trials:24 - Trial = 19535/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.728 | DEBUG    | __main__:trials:29 - Trial = 19535/30000 | Total reward = 40.15
2022-01-26 14:18:00.731 | DEBUG    | __main__:trials:26 - Trial = 19536/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.732 | DEBUG    | __main__:trials:29 - Trial = 19536/30000 | Total reward = 7.70
2022-01-26 14:18:00.735 | DEBUG    | __main__:trials:24 - Trial = 19537/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.737 | DEBUG    | __main__:trials:29 - Trial = 19537/30000 | Total reward = 52.33
2022-01-26 14:18:00.740 | DEBUG    | __main__:trials:26 - Trial = 19538/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.742 | DEBUG    | __main__:trials:29 - Trial = 19538/30000 | Total reward = 39.64
2022-01-26 14:18:00.747 | DEBUG    | __main__:trials:24 - Trial = 19539/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.749 | DEBUG    | __main__:trials:29 - Trial = 19539/30000 | Total reward = 43.58
2022-01-26 14:18:00.752 | DEBUG    | __main__:trials:24 - Trial = 19540/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.754 | DEBUG    | __main__:trials:29 - Trial = 19540/30000 | Total reward = 49.97
2022-01-26 14:18:00.757 | DEBUG    | __main__:trials:26 - Trial = 19541/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.759 | DEBUG    | __main__:trials:29 - Trial = 19541/30000 | Total reward = 31.51
2022-01-26 14:18:00.761 | DEBUG    | __main__:trials:26 - Trial = 19542/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.763 | DEBUG    | __main__:trials:29 - Trial = 19542/30000 | Total reward = 7.12
2022-01-26 14:18:00.767 | DEBUG    | __main__:trials:24 - Trial = 19543/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.768 | DEBUG    | __main__:trials:29 - Trial = 19543/30000 | Total reward = 42.46
2022-01-26 14:18:00.772 | DEBUG    | __main__:trials:24 - Trial = 19544/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.773 | DEBUG    | __main__:trials:29 - Trial = 19544/30000 | Total reward = 49.66
2022-01-26 14:18:00.775 | DEBUG    | __main__:trials:26 - Trial = 19545/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.776 | DEBUG    | __main__:trials:29 - Trial = 19545/30000 | Total reward = 25.61
2022-01-26 14:18:00.780 | DEBUG    | __main__:trials:24 - Trial = 19546/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.780 | DEBUG    | __main__:trials:29 - Trial = 19546/30000 | Total reward = 52.26
2022-01-26 14:18:00.784 | DEBUG    | __main__:trials:24 - Trial = 19547/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.785 | DEBUG    | __main__:trials:29 - Trial = 19547/30000 | Total reward = 49.05
2022-01-26 14:18:00.789 | DEBUG    | __main__:trials:24 - Trial = 19548/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.790 | DEBUG    | __main__:trials:29 - Trial = 19548/30000 | Total reward = 52.71
2022-01-26 14:18:00.793 | DEBUG    | __main__:trials:24 - Trial = 19549/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.794 | DEBUG    | __main__:trials:29 - Trial = 19549/30000 | Total reward = 58.59
2022-01-26 14:18:00.798 | DEBUG    | __main__:trials:26 - Trial = 19550/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.799 | DEBUG    | __main__:trials:29 - Trial = 19550/30000 | Total reward = 18.33
2022-01-26 14:18:00.803 | DEBUG    | __main__:trials:24 - Trial = 19551/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.804 | DEBUG    | __main__:trials:29 - Trial = 19551/30000 | Total reward = 48.56
2022-01-26 14:18:00.808 | DEBUG    | __main__:trials:24 - Trial = 19552/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.810 | DEBUG    | __main__:trials:29 - Trial = 19552/30000 | Total reward = 52.13
2022-01-26 14:18:00.813 | DEBUG    | __main__:trials:24 - Trial = 19553/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.815 | DEBUG    | __main__:trials:29 - Trial = 19553/30000 | Total reward = 46.91
2022-01-26 14:18:00.819 | DEBUG    | __main__:trials:24 - Trial = 19554/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.820 | DEBUG    | __main__:trials:29 - Trial = 19554/30000 | Total reward = 53.75
2022-01-26 14:18:00.824 | DEBUG    | __main__:trials:24 - Trial = 19555/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.826 | DEBUG    | __main__:trials:29 - Trial = 19555/30000 | Total reward = 49.87
2022-01-26 14:18:00.830 | DEBUG    | __main__:trials:24 - Trial = 19556/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.830 | DEBUG    | __main__:trials:29 - Trial = 19556/30000 | Total reward = 55.13
2022-01-26 14:18:00.835 | DEBUG    | __main__:trials:24 - Trial = 19557/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.836 | DEBUG    | __main__:trials:29 - Trial = 19557/30000 | Total reward = 51.28
2022-01-26 14:18:00.840 | DEBUG    | __main__:trials:24 - Trial = 19558/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.841 | DEBUG    | __main__:trials:29 - Trial = 19558/30000 | Total reward = 48.48
2022-01-26 14:18:00.845 | DEBUG    | __main__:trials:24 - Trial = 19559/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.847 | DEBUG    | __main__:trials:29 - Trial = 19559/30000 | Total reward = 48.29
2022-01-26 14:18:00.850 | DEBUG    | __main__:trials:24 - Trial = 19560/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.852 | DEBUG    | __main__:trials:29 - Trial = 19560/30000 | Total reward = 51.80
2022-01-26 14:18:00.856 | DEBUG    | __main__:trials:24 - Trial = 19561/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.857 | DEBUG    | __main__:trials:29 - Trial = 19561/30000 | Total reward = 52.40
2022-01-26 14:18:00.861 | DEBUG    | __main__:trials:24 - Trial = 19562/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.862 | DEBUG    | __main__:trials:29 - Trial = 19562/30000 | Total reward = 41.47
2022-01-26 14:18:00.866 | DEBUG    | __main__:trials:24 - Trial = 19563/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.867 | DEBUG    | __main__:trials:29 - Trial = 19563/30000 | Total reward = 47.14
2022-01-26 14:18:00.871 | DEBUG    | __main__:trials:24 - Trial = 19564/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.872 | DEBUG    | __main__:trials:29 - Trial = 19564/30000 | Total reward = 50.12
2022-01-26 14:18:00.876 | DEBUG    | __main__:trials:26 - Trial = 19565/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.876 | DEBUG    | __main__:trials:29 - Trial = 19565/30000 | Total reward = 37.66
2022-01-26 14:18:00.880 | DEBUG    | __main__:trials:24 - Trial = 19566/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.881 | DEBUG    | __main__:trials:29 - Trial = 19566/30000 | Total reward = 52.19
2022-01-26 14:18:00.886 | DEBUG    | __main__:trials:24 - Trial = 19567/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.886 | DEBUG    | __main__:trials:29 - Trial = 19567/30000 | Total reward = 43.02
2022-01-26 14:18:00.891 | DEBUG    | __main__:trials:24 - Trial = 19568/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.892 | DEBUG    | __main__:trials:29 - Trial = 19568/30000 | Total reward = 51.62
2022-01-26 14:18:00.895 | DEBUG    | __main__:trials:24 - Trial = 19569/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.897 | DEBUG    | __main__:trials:29 - Trial = 19569/30000 | Total reward = 46.10
2022-01-26 14:18:00.899 | DEBUG    | __main__:trials:26 - Trial = 19570/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.900 | DEBUG    | __main__:trials:29 - Trial = 19570/30000 | Total reward = 7.12
2022-01-26 14:18:00.905 | DEBUG    | __main__:trials:24 - Trial = 19571/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.905 | DEBUG    | __main__:trials:29 - Trial = 19571/30000 | Total reward = 47.71
2022-01-26 14:18:00.910 | DEBUG    | __main__:trials:24 - Trial = 19572/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.911 | DEBUG    | __main__:trials:29 - Trial = 19572/30000 | Total reward = 64.91
2022-01-26 14:18:00.914 | DEBUG    | __main__:trials:24 - Trial = 19573/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.916 | DEBUG    | __main__:trials:29 - Trial = 19573/30000 | Total reward = 51.68
2022-01-26 14:18:00.919 | DEBUG    | __main__:trials:24 - Trial = 19574/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.921 | DEBUG    | __main__:trials:29 - Trial = 19574/30000 | Total reward = 52.53
2022-01-26 14:18:00.924 | DEBUG    | __main__:trials:24 - Trial = 19575/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.925 | DEBUG    | __main__:trials:29 - Trial = 19575/30000 | Total reward = 52.90
2022-01-26 14:18:00.927 | DEBUG    | __main__:trials:26 - Trial = 19576/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.929 | DEBUG    | __main__:trials:29 - Trial = 19576/30000 | Total reward = 7.12
2022-01-26 14:18:00.932 | DEBUG    | __main__:trials:24 - Trial = 19577/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.933 | DEBUG    | __main__:trials:29 - Trial = 19577/30000 | Total reward = 42.54
2022-01-26 14:18:00.937 | DEBUG    | __main__:trials:24 - Trial = 19578/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.938 | DEBUG    | __main__:trials:29 - Trial = 19578/30000 | Total reward = 49.58
2022-01-26 14:18:00.942 | DEBUG    | __main__:trials:24 - Trial = 19579/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.943 | DEBUG    | __main__:trials:29 - Trial = 19579/30000 | Total reward = 47.92
2022-01-26 14:18:00.947 | DEBUG    | __main__:trials:24 - Trial = 19580/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.949 | DEBUG    | __main__:trials:29 - Trial = 19580/30000 | Total reward = 44.63
2022-01-26 14:18:00.953 | DEBUG    | __main__:trials:24 - Trial = 19581/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.953 | DEBUG    | __main__:trials:29 - Trial = 19581/30000 | Total reward = 44.90
2022-01-26 14:18:00.957 | DEBUG    | __main__:trials:24 - Trial = 19582/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.959 | DEBUG    | __main__:trials:29 - Trial = 19582/30000 | Total reward = 50.37
2022-01-26 14:18:00.963 | DEBUG    | __main__:trials:24 - Trial = 19583/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.963 | DEBUG    | __main__:trials:29 - Trial = 19583/30000 | Total reward = 44.68
2022-01-26 14:18:00.968 | DEBUG    | __main__:trials:24 - Trial = 19584/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.970 | DEBUG    | __main__:trials:29 - Trial = 19584/30000 | Total reward = 52.66
2022-01-26 14:18:00.973 | DEBUG    | __main__:trials:24 - Trial = 19585/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.975 | DEBUG    | __main__:trials:29 - Trial = 19585/30000 | Total reward = 43.12
2022-01-26 14:18:00.979 | DEBUG    | __main__:trials:24 - Trial = 19586/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.979 | DEBUG    | __main__:trials:29 - Trial = 19586/30000 | Total reward = 49.14
2022-01-26 14:18:00.984 | DEBUG    | __main__:trials:26 - Trial = 19587/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:00.985 | DEBUG    | __main__:trials:29 - Trial = 19587/30000 | Total reward = 35.38
2022-01-26 14:18:00.989 | DEBUG    | __main__:trials:24 - Trial = 19588/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.991 | DEBUG    | __main__:trials:29 - Trial = 19588/30000 | Total reward = 53.83
2022-01-26 14:18:00.994 | DEBUG    | __main__:trials:24 - Trial = 19589/30000 | Max number of steps (20) reached
2022-01-26 14:18:00.995 | DEBUG    | __main__:trials:29 - Trial = 19589/30000 | Total reward = 46.67
2022-01-26 14:18:00.999 | DEBUG    | __main__:trials:24 - Trial = 19590/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.001 | DEBUG    | __main__:trials:29 - Trial = 19590/30000 | Total reward = 51.68
2022-01-26 14:18:01.004 | DEBUG    | __main__:trials:24 - Trial = 19591/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.006 | DEBUG    | __main__:trials:29 - Trial = 19591/30000 | Total reward = 54.13
2022-01-26 14:18:01.010 | DEBUG    | __main__:trials:24 - Trial = 19592/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.011 | DEBUG    | __main__:trials:29 - Trial = 19592/30000 | Total reward = 46.83
2022-01-26 14:18:01.014 | DEBUG    | __main__:trials:24 - Trial = 19593/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.016 | DEBUG    | __main__:trials:29 - Trial = 19593/30000 | Total reward = 43.71
2022-01-26 14:18:01.019 | DEBUG    | __main__:trials:24 - Trial = 19594/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.021 | DEBUG    | __main__:trials:29 - Trial = 19594/30000 | Total reward = 26.91
2022-01-26 14:18:01.025 | DEBUG    | __main__:trials:26 - Trial = 19595/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.027 | DEBUG    | __main__:trials:29 - Trial = 19595/30000 | Total reward = 39.24
2022-01-26 14:18:01.029 | DEBUG    | __main__:trials:26 - Trial = 19596/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.030 | DEBUG    | __main__:trials:29 - Trial = 19596/30000 | Total reward = 7.12
2022-01-26 14:18:01.034 | DEBUG    | __main__:trials:26 - Trial = 19597/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.036 | DEBUG    | __main__:trials:29 - Trial = 19597/30000 | Total reward = 22.25
2022-01-26 14:18:01.039 | DEBUG    | __main__:trials:24 - Trial = 19598/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.041 | DEBUG    | __main__:trials:29 - Trial = 19598/30000 | Total reward = 52.90
2022-01-26 14:18:01.044 | DEBUG    | __main__:trials:26 - Trial = 19599/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.045 | DEBUG    | __main__:trials:29 - Trial = 19599/30000 | Total reward = 10.66
2022-01-26 14:18:01.049 | DEBUG    | __main__:trials:24 - Trial = 19600/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.050 | DEBUG    | __main__:trials:29 - Trial = 19600/30000 | Total reward = 54.26
2022-01-26 14:18:01.053 | DEBUG    | __main__:trials:24 - Trial = 19601/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.054 | DEBUG    | __main__:trials:29 - Trial = 19601/30000 | Total reward = 55.34
2022-01-26 14:18:01.058 | DEBUG    | __main__:trials:24 - Trial = 19602/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.060 | DEBUG    | __main__:trials:29 - Trial = 19602/30000 | Total reward = 48.15
2022-01-26 14:18:01.062 | DEBUG    | __main__:trials:26 - Trial = 19603/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.064 | DEBUG    | __main__:trials:29 - Trial = 19603/30000 | Total reward = 9.99
2022-01-26 14:18:01.067 | DEBUG    | __main__:trials:24 - Trial = 19604/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.069 | DEBUG    | __main__:trials:29 - Trial = 19604/30000 | Total reward = 52.26
2022-01-26 14:18:01.072 | DEBUG    | __main__:trials:24 - Trial = 19605/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.074 | DEBUG    | __main__:trials:29 - Trial = 19605/30000 | Total reward = 51.23
2022-01-26 14:18:01.077 | DEBUG    | __main__:trials:24 - Trial = 19606/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.079 | DEBUG    | __main__:trials:29 - Trial = 19606/30000 | Total reward = 44.64
2022-01-26 14:18:01.081 | DEBUG    | __main__:trials:26 - Trial = 19607/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.082 | DEBUG    | __main__:trials:29 - Trial = 19607/30000 | Total reward = 7.12
2022-01-26 14:18:01.085 | DEBUG    | __main__:trials:26 - Trial = 19608/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.086 | DEBUG    | __main__:trials:29 - Trial = 19608/30000 | Total reward = 9.99
2022-01-26 14:18:01.090 | DEBUG    | __main__:trials:24 - Trial = 19609/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.092 | DEBUG    | __main__:trials:29 - Trial = 19609/30000 | Total reward = 51.75
2022-01-26 14:18:01.095 | DEBUG    | __main__:trials:26 - Trial = 19610/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.096 | DEBUG    | __main__:trials:29 - Trial = 19610/30000 | Total reward = 33.02
2022-01-26 14:18:01.100 | DEBUG    | __main__:trials:26 - Trial = 19611/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.102 | DEBUG    | __main__:trials:29 - Trial = 19611/30000 | Total reward = 38.79
2022-01-26 14:18:01.104 | DEBUG    | __main__:trials:26 - Trial = 19612/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.106 | DEBUG    | __main__:trials:29 - Trial = 19612/30000 | Total reward = 9.99
2022-01-26 14:18:01.109 | DEBUG    | __main__:trials:26 - Trial = 19613/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.110 | DEBUG    | __main__:trials:29 - Trial = 19613/30000 | Total reward = 30.87
2022-01-26 14:18:01.114 | DEBUG    | __main__:trials:24 - Trial = 19614/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.115 | DEBUG    | __main__:trials:29 - Trial = 19614/30000 | Total reward = 52.13
2022-01-26 14:18:01.119 | DEBUG    | __main__:trials:24 - Trial = 19615/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.120 | DEBUG    | __main__:trials:29 - Trial = 19615/30000 | Total reward = 51.40
2022-01-26 14:18:01.124 | DEBUG    | __main__:trials:24 - Trial = 19616/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.126 | DEBUG    | __main__:trials:29 - Trial = 19616/30000 | Total reward = 54.03
2022-01-26 14:18:01.129 | DEBUG    | __main__:trials:24 - Trial = 19617/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.131 | DEBUG    | __main__:trials:29 - Trial = 19617/30000 | Total reward = 51.25
2022-01-26 14:18:01.134 | DEBUG    | __main__:trials:24 - Trial = 19618/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.136 | DEBUG    | __main__:trials:29 - Trial = 19618/30000 | Total reward = 52.13
2022-01-26 14:18:01.139 | DEBUG    | __main__:trials:24 - Trial = 19619/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.141 | DEBUG    | __main__:trials:29 - Trial = 19619/30000 | Total reward = 46.89
2022-01-26 14:18:01.144 | DEBUG    | __main__:trials:24 - Trial = 19620/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.145 | DEBUG    | __main__:trials:29 - Trial = 19620/30000 | Total reward = 50.80
2022-01-26 14:18:01.148 | DEBUG    | __main__:trials:24 - Trial = 19621/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.149 | DEBUG    | __main__:trials:29 - Trial = 19621/30000 | Total reward = 52.38
2022-01-26 14:18:01.153 | DEBUG    | __main__:trials:24 - Trial = 19622/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.154 | DEBUG    | __main__:trials:29 - Trial = 19622/30000 | Total reward = 49.37
2022-01-26 14:18:01.157 | DEBUG    | __main__:trials:24 - Trial = 19623/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.159 | DEBUG    | __main__:trials:29 - Trial = 19623/30000 | Total reward = 50.87
2022-01-26 14:18:01.163 | DEBUG    | __main__:trials:24 - Trial = 19624/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.165 | DEBUG    | __main__:trials:29 - Trial = 19624/30000 | Total reward = 62.74
2022-01-26 14:18:01.168 | DEBUG    | __main__:trials:24 - Trial = 19625/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.169 | DEBUG    | __main__:trials:29 - Trial = 19625/30000 | Total reward = 55.02
2022-01-26 14:18:01.171 | DEBUG    | __main__:trials:26 - Trial = 19626/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.172 | DEBUG    | __main__:trials:29 - Trial = 19626/30000 | Total reward = 7.12
2022-01-26 14:18:01.176 | DEBUG    | __main__:trials:24 - Trial = 19627/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.178 | DEBUG    | __main__:trials:29 - Trial = 19627/30000 | Total reward = 52.13
2022-01-26 14:18:01.182 | DEBUG    | __main__:trials:24 - Trial = 19628/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.183 | DEBUG    | __main__:trials:29 - Trial = 19628/30000 | Total reward = 51.87
2022-01-26 14:18:01.186 | DEBUG    | __main__:trials:24 - Trial = 19629/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.188 | DEBUG    | __main__:trials:29 - Trial = 19629/30000 | Total reward = 47.15
2022-01-26 14:18:01.191 | DEBUG    | __main__:trials:24 - Trial = 19630/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.193 | DEBUG    | __main__:trials:29 - Trial = 19630/30000 | Total reward = 60.47
2022-01-26 14:18:01.197 | DEBUG    | __main__:trials:24 - Trial = 19631/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.197 | DEBUG    | __main__:trials:29 - Trial = 19631/30000 | Total reward = 53.04
2022-01-26 14:18:01.201 | DEBUG    | __main__:trials:24 - Trial = 19632/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.203 | DEBUG    | __main__:trials:29 - Trial = 19632/30000 | Total reward = 52.91
2022-01-26 14:18:01.207 | DEBUG    | __main__:trials:24 - Trial = 19633/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.208 | DEBUG    | __main__:trials:29 - Trial = 19633/30000 | Total reward = 50.37
2022-01-26 14:18:01.211 | DEBUG    | __main__:trials:24 - Trial = 19634/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.213 | DEBUG    | __main__:trials:29 - Trial = 19634/30000 | Total reward = 57.03
2022-01-26 14:18:01.217 | DEBUG    | __main__:trials:24 - Trial = 19635/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.218 | DEBUG    | __main__:trials:29 - Trial = 19635/30000 | Total reward = 52.03
2022-01-26 14:18:01.221 | DEBUG    | __main__:trials:24 - Trial = 19636/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.223 | DEBUG    | __main__:trials:29 - Trial = 19636/30000 | Total reward = 36.92
2022-01-26 14:18:01.226 | DEBUG    | __main__:trials:24 - Trial = 19637/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.227 | DEBUG    | __main__:trials:29 - Trial = 19637/30000 | Total reward = 44.27
2022-01-26 14:18:01.231 | DEBUG    | __main__:trials:24 - Trial = 19638/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.233 | DEBUG    | __main__:trials:29 - Trial = 19638/30000 | Total reward = 58.81
2022-01-26 14:18:01.236 | DEBUG    | __main__:trials:24 - Trial = 19639/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.238 | DEBUG    | __main__:trials:29 - Trial = 19639/30000 | Total reward = 48.05
2022-01-26 14:18:01.242 | DEBUG    | __main__:trials:24 - Trial = 19640/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.243 | DEBUG    | __main__:trials:29 - Trial = 19640/30000 | Total reward = 53.60
2022-01-26 14:18:01.246 | DEBUG    | __main__:trials:24 - Trial = 19641/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.248 | DEBUG    | __main__:trials:29 - Trial = 19641/30000 | Total reward = 53.03
2022-01-26 14:18:01.251 | DEBUG    | __main__:trials:24 - Trial = 19642/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.253 | DEBUG    | __main__:trials:29 - Trial = 19642/30000 | Total reward = 50.66
2022-01-26 14:18:01.256 | DEBUG    | __main__:trials:24 - Trial = 19643/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.257 | DEBUG    | __main__:trials:29 - Trial = 19643/30000 | Total reward = 51.76
2022-01-26 14:18:01.261 | DEBUG    | __main__:trials:24 - Trial = 19644/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.262 | DEBUG    | __main__:trials:29 - Trial = 19644/30000 | Total reward = 54.46
2022-01-26 14:18:01.265 | DEBUG    | __main__:trials:26 - Trial = 19645/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.266 | DEBUG    | __main__:trials:29 - Trial = 19645/30000 | Total reward = 23.64
2022-01-26 14:18:01.269 | DEBUG    | __main__:trials:26 - Trial = 19646/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.271 | DEBUG    | __main__:trials:29 - Trial = 19646/30000 | Total reward = 23.64
2022-01-26 14:18:01.275 | DEBUG    | __main__:trials:24 - Trial = 19647/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.276 | DEBUG    | __main__:trials:29 - Trial = 19647/30000 | Total reward = 37.25
2022-01-26 14:18:01.280 | DEBUG    | __main__:trials:26 - Trial = 19648/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.281 | DEBUG    | __main__:trials:29 - Trial = 19648/30000 | Total reward = 26.31
2022-01-26 14:18:01.285 | DEBUG    | __main__:trials:24 - Trial = 19649/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.286 | DEBUG    | __main__:trials:29 - Trial = 19649/30000 | Total reward = 49.57
2022-01-26 14:18:01.289 | DEBUG    | __main__:trials:26 - Trial = 19650/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.290 | DEBUG    | __main__:trials:29 - Trial = 19650/30000 | Total reward = 9.99
2022-01-26 14:18:01.292 | DEBUG    | __main__:trials:26 - Trial = 19651/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.294 | DEBUG    | __main__:trials:29 - Trial = 19651/30000 | Total reward = 9.99
2022-01-26 14:18:01.298 | DEBUG    | __main__:trials:24 - Trial = 19652/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.299 | DEBUG    | __main__:trials:29 - Trial = 19652/30000 | Total reward = 32.63
2022-01-26 14:18:01.302 | DEBUG    | __main__:trials:24 - Trial = 19653/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.305 | DEBUG    | __main__:trials:29 - Trial = 19653/30000 | Total reward = 52.81
2022-01-26 14:18:01.308 | DEBUG    | __main__:trials:24 - Trial = 19654/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.310 | DEBUG    | __main__:trials:29 - Trial = 19654/30000 | Total reward = 50.83
2022-01-26 14:18:01.313 | DEBUG    | __main__:trials:24 - Trial = 19655/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.315 | DEBUG    | __main__:trials:29 - Trial = 19655/30000 | Total reward = 50.87
2022-01-26 14:18:01.319 | DEBUG    | __main__:trials:24 - Trial = 19656/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.320 | DEBUG    | __main__:trials:29 - Trial = 19656/30000 | Total reward = 46.96
2022-01-26 14:18:01.323 | DEBUG    | __main__:trials:24 - Trial = 19657/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.325 | DEBUG    | __main__:trials:29 - Trial = 19657/30000 | Total reward = 53.35
2022-01-26 14:18:01.329 | DEBUG    | __main__:trials:24 - Trial = 19658/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.330 | DEBUG    | __main__:trials:29 - Trial = 19658/30000 | Total reward = 44.27
2022-01-26 14:18:01.334 | DEBUG    | __main__:trials:24 - Trial = 19659/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.336 | DEBUG    | __main__:trials:29 - Trial = 19659/30000 | Total reward = 28.63
2022-01-26 14:18:01.339 | DEBUG    | __main__:trials:24 - Trial = 19660/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.340 | DEBUG    | __main__:trials:29 - Trial = 19660/30000 | Total reward = 48.46
2022-01-26 14:18:01.344 | DEBUG    | __main__:trials:24 - Trial = 19661/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.345 | DEBUG    | __main__:trials:29 - Trial = 19661/30000 | Total reward = 49.60
2022-01-26 14:18:01.349 | DEBUG    | __main__:trials:24 - Trial = 19662/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.351 | DEBUG    | __main__:trials:29 - Trial = 19662/30000 | Total reward = 54.06
2022-01-26 14:18:01.354 | DEBUG    | __main__:trials:24 - Trial = 19663/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.356 | DEBUG    | __main__:trials:29 - Trial = 19663/30000 | Total reward = 50.82
2022-01-26 14:18:01.360 | DEBUG    | __main__:trials:24 - Trial = 19664/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.360 | DEBUG    | __main__:trials:29 - Trial = 19664/30000 | Total reward = 51.72
2022-01-26 14:18:01.364 | DEBUG    | __main__:trials:24 - Trial = 19665/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.366 | DEBUG    | __main__:trials:29 - Trial = 19665/30000 | Total reward = 56.70
2022-01-26 14:18:01.369 | DEBUG    | __main__:trials:24 - Trial = 19666/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.371 | DEBUG    | __main__:trials:29 - Trial = 19666/30000 | Total reward = 53.87
2022-01-26 14:18:01.374 | DEBUG    | __main__:trials:24 - Trial = 19667/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.375 | DEBUG    | __main__:trials:29 - Trial = 19667/30000 | Total reward = 48.73
2022-01-26 14:18:01.378 | DEBUG    | __main__:trials:24 - Trial = 19668/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.380 | DEBUG    | __main__:trials:29 - Trial = 19668/30000 | Total reward = 49.32
2022-01-26 14:18:01.384 | DEBUG    | __main__:trials:24 - Trial = 19669/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.386 | DEBUG    | __main__:trials:29 - Trial = 19669/30000 | Total reward = 36.67
2022-01-26 14:18:01.390 | DEBUG    | __main__:trials:24 - Trial = 19670/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.392 | DEBUG    | __main__:trials:29 - Trial = 19670/30000 | Total reward = 52.13
2022-01-26 14:18:01.396 | DEBUG    | __main__:trials:26 - Trial = 19671/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.396 | DEBUG    | __main__:trials:29 - Trial = 19671/30000 | Total reward = 43.41
2022-01-26 14:18:01.401 | DEBUG    | __main__:trials:24 - Trial = 19672/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.402 | DEBUG    | __main__:trials:29 - Trial = 19672/30000 | Total reward = 53.29
2022-01-26 14:18:01.405 | DEBUG    | __main__:trials:24 - Trial = 19673/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.407 | DEBUG    | __main__:trials:29 - Trial = 19673/30000 | Total reward = 46.89
2022-01-26 14:18:01.411 | DEBUG    | __main__:trials:24 - Trial = 19674/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.412 | DEBUG    | __main__:trials:29 - Trial = 19674/30000 | Total reward = 52.64
2022-01-26 14:18:01.416 | DEBUG    | __main__:trials:24 - Trial = 19675/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.417 | DEBUG    | __main__:trials:29 - Trial = 19675/30000 | Total reward = 52.91
2022-01-26 14:18:01.421 | DEBUG    | __main__:trials:24 - Trial = 19676/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.423 | DEBUG    | __main__:trials:29 - Trial = 19676/30000 | Total reward = 51.15
2022-01-26 14:18:01.426 | DEBUG    | __main__:trials:24 - Trial = 19677/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.428 | DEBUG    | __main__:trials:29 - Trial = 19677/30000 | Total reward = 52.12
2022-01-26 14:18:01.431 | DEBUG    | __main__:trials:24 - Trial = 19678/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.433 | DEBUG    | __main__:trials:29 - Trial = 19678/30000 | Total reward = 54.14
2022-01-26 14:18:01.437 | DEBUG    | __main__:trials:24 - Trial = 19679/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.438 | DEBUG    | __main__:trials:29 - Trial = 19679/30000 | Total reward = 53.06
2022-01-26 14:18:01.442 | DEBUG    | __main__:trials:24 - Trial = 19680/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.444 | DEBUG    | __main__:trials:29 - Trial = 19680/30000 | Total reward = 46.16
2022-01-26 14:18:01.445 | DEBUG    | __main__:trials:26 - Trial = 19681/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.446 | DEBUG    | __main__:trials:29 - Trial = 19681/30000 | Total reward = 9.99
2022-01-26 14:18:01.449 | DEBUG    | __main__:trials:26 - Trial = 19682/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.450 | DEBUG    | __main__:trials:29 - Trial = 19682/30000 | Total reward = 23.83
2022-01-26 14:18:01.453 | DEBUG    | __main__:trials:26 - Trial = 19683/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.455 | DEBUG    | __main__:trials:29 - Trial = 19683/30000 | Total reward = 39.81
2022-01-26 14:18:01.457 | DEBUG    | __main__:trials:26 - Trial = 19684/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.458 | DEBUG    | __main__:trials:29 - Trial = 19684/30000 | Total reward = 26.89
2022-01-26 14:18:01.462 | DEBUG    | __main__:trials:24 - Trial = 19685/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.463 | DEBUG    | __main__:trials:29 - Trial = 19685/30000 | Total reward = 52.60
2022-01-26 14:18:01.466 | DEBUG    | __main__:trials:24 - Trial = 19686/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.468 | DEBUG    | __main__:trials:29 - Trial = 19686/30000 | Total reward = 52.35
2022-01-26 14:18:01.472 | DEBUG    | __main__:trials:24 - Trial = 19687/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.472 | DEBUG    | __main__:trials:29 - Trial = 19687/30000 | Total reward = 51.46
2022-01-26 14:18:01.476 | DEBUG    | __main__:trials:24 - Trial = 19688/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.478 | DEBUG    | __main__:trials:29 - Trial = 19688/30000 | Total reward = 51.64
2022-01-26 14:18:01.481 | DEBUG    | __main__:trials:24 - Trial = 19689/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.482 | DEBUG    | __main__:trials:29 - Trial = 19689/30000 | Total reward = 50.83
2022-01-26 14:18:01.486 | DEBUG    | __main__:trials:24 - Trial = 19690/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.487 | DEBUG    | __main__:trials:29 - Trial = 19690/30000 | Total reward = 56.89
2022-01-26 14:18:01.490 | DEBUG    | __main__:trials:24 - Trial = 19691/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.492 | DEBUG    | __main__:trials:29 - Trial = 19691/30000 | Total reward = 52.01
2022-01-26 14:18:01.496 | DEBUG    | __main__:trials:24 - Trial = 19692/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.497 | DEBUG    | __main__:trials:29 - Trial = 19692/30000 | Total reward = 57.40
2022-01-26 14:18:01.500 | DEBUG    | __main__:trials:26 - Trial = 19693/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.501 | DEBUG    | __main__:trials:29 - Trial = 19693/30000 | Total reward = 11.73
2022-01-26 14:18:01.505 | DEBUG    | __main__:trials:24 - Trial = 19694/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.506 | DEBUG    | __main__:trials:29 - Trial = 19694/30000 | Total reward = 48.14
2022-01-26 14:18:01.509 | DEBUG    | __main__:trials:24 - Trial = 19695/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.510 | DEBUG    | __main__:trials:29 - Trial = 19695/30000 | Total reward = 46.82
2022-01-26 14:18:01.513 | DEBUG    | __main__:trials:24 - Trial = 19696/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.515 | DEBUG    | __main__:trials:29 - Trial = 19696/30000 | Total reward = 54.73
2022-01-26 14:18:01.518 | DEBUG    | __main__:trials:24 - Trial = 19697/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.519 | DEBUG    | __main__:trials:29 - Trial = 19697/30000 | Total reward = 56.44
2022-01-26 14:18:01.522 | DEBUG    | __main__:trials:24 - Trial = 19698/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.524 | DEBUG    | __main__:trials:29 - Trial = 19698/30000 | Total reward = 56.39
2022-01-26 14:18:01.528 | DEBUG    | __main__:trials:24 - Trial = 19699/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.529 | DEBUG    | __main__:trials:29 - Trial = 19699/30000 | Total reward = 48.74
2022-01-26 14:18:01.533 | DEBUG    | __main__:trials:26 - Trial = 19700/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.534 | DEBUG    | __main__:trials:29 - Trial = 19700/30000 | Total reward = 35.87
2022-01-26 14:18:01.538 | DEBUG    | __main__:trials:24 - Trial = 19701/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.540 | DEBUG    | __main__:trials:29 - Trial = 19701/30000 | Total reward = 52.26
2022-01-26 14:18:01.543 | DEBUG    | __main__:trials:24 - Trial = 19702/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.545 | DEBUG    | __main__:trials:29 - Trial = 19702/30000 | Total reward = 51.46
2022-01-26 14:18:01.548 | DEBUG    | __main__:trials:24 - Trial = 19703/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.549 | DEBUG    | __main__:trials:29 - Trial = 19703/30000 | Total reward = 49.90
2022-01-26 14:18:01.553 | DEBUG    | __main__:trials:24 - Trial = 19704/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.554 | DEBUG    | __main__:trials:29 - Trial = 19704/30000 | Total reward = 56.95
2022-01-26 14:18:01.558 | DEBUG    | __main__:trials:24 - Trial = 19705/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.560 | DEBUG    | __main__:trials:29 - Trial = 19705/30000 | Total reward = 52.01
2022-01-26 14:18:01.562 | DEBUG    | __main__:trials:26 - Trial = 19706/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.564 | DEBUG    | __main__:trials:29 - Trial = 19706/30000 | Total reward = 10.12
2022-01-26 14:18:01.567 | DEBUG    | __main__:trials:24 - Trial = 19707/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.569 | DEBUG    | __main__:trials:29 - Trial = 19707/30000 | Total reward = 51.35
2022-01-26 14:18:01.571 | DEBUG    | __main__:trials:26 - Trial = 19708/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.573 | DEBUG    | __main__:trials:29 - Trial = 19708/30000 | Total reward = 10.12
2022-01-26 14:18:01.577 | DEBUG    | __main__:trials:24 - Trial = 19709/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.578 | DEBUG    | __main__:trials:29 - Trial = 19709/30000 | Total reward = 52.56
2022-01-26 14:18:01.581 | DEBUG    | __main__:trials:24 - Trial = 19710/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.582 | DEBUG    | __main__:trials:29 - Trial = 19710/30000 | Total reward = 45.95
2022-01-26 14:18:01.585 | DEBUG    | __main__:trials:26 - Trial = 19711/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.586 | DEBUG    | __main__:trials:29 - Trial = 19711/30000 | Total reward = 37.48
2022-01-26 14:18:01.590 | DEBUG    | __main__:trials:24 - Trial = 19712/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.592 | DEBUG    | __main__:trials:29 - Trial = 19712/30000 | Total reward = 53.73
2022-01-26 14:18:01.595 | DEBUG    | __main__:trials:26 - Trial = 19713/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.596 | DEBUG    | __main__:trials:29 - Trial = 19713/30000 | Total reward = 27.37
2022-01-26 14:18:01.599 | DEBUG    | __main__:trials:26 - Trial = 19714/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.599 | DEBUG    | __main__:trials:29 - Trial = 19714/30000 | Total reward = 9.99
2022-01-26 14:18:01.602 | DEBUG    | __main__:trials:26 - Trial = 19715/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.603 | DEBUG    | __main__:trials:29 - Trial = 19715/30000 | Total reward = 9.99
2022-01-26 14:18:01.607 | DEBUG    | __main__:trials:24 - Trial = 19716/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.609 | DEBUG    | __main__:trials:29 - Trial = 19716/30000 | Total reward = 28.44
2022-01-26 14:18:01.611 | DEBUG    | __main__:trials:26 - Trial = 19717/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.613 | DEBUG    | __main__:trials:29 - Trial = 19717/30000 | Total reward = 9.99
2022-01-26 14:18:01.615 | DEBUG    | __main__:trials:26 - Trial = 19718/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.616 | DEBUG    | __main__:trials:29 - Trial = 19718/30000 | Total reward = 9.99
2022-01-26 14:18:01.619 | DEBUG    | __main__:trials:26 - Trial = 19719/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.621 | DEBUG    | __main__:trials:29 - Trial = 19719/30000 | Total reward = 23.01
2022-01-26 14:18:01.623 | DEBUG    | __main__:trials:26 - Trial = 19720/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.623 | DEBUG    | __main__:trials:29 - Trial = 19720/30000 | Total reward = 9.99
2022-01-26 14:18:01.626 | DEBUG    | __main__:trials:26 - Trial = 19721/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.626 | DEBUG    | __main__:trials:29 - Trial = 19721/30000 | Total reward = 9.99
2022-01-26 14:18:01.630 | DEBUG    | __main__:trials:26 - Trial = 19722/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.632 | DEBUG    | __main__:trials:29 - Trial = 19722/30000 | Total reward = 29.19
2022-01-26 14:18:01.635 | DEBUG    | __main__:trials:26 - Trial = 19723/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.637 | DEBUG    | __main__:trials:29 - Trial = 19723/30000 | Total reward = 17.30
2022-01-26 14:18:01.641 | DEBUG    | __main__:trials:24 - Trial = 19724/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.641 | DEBUG    | __main__:trials:29 - Trial = 19724/30000 | Total reward = 47.27
2022-01-26 14:18:01.645 | DEBUG    | __main__:trials:24 - Trial = 19725/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.647 | DEBUG    | __main__:trials:29 - Trial = 19725/30000 | Total reward = 56.25
2022-01-26 14:18:01.651 | DEBUG    | __main__:trials:24 - Trial = 19726/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.652 | DEBUG    | __main__:trials:29 - Trial = 19726/30000 | Total reward = 50.16
2022-01-26 14:18:01.656 | DEBUG    | __main__:trials:24 - Trial = 19727/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.658 | DEBUG    | __main__:trials:29 - Trial = 19727/30000 | Total reward = 52.48
2022-01-26 14:18:01.661 | DEBUG    | __main__:trials:24 - Trial = 19728/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.663 | DEBUG    | __main__:trials:29 - Trial = 19728/30000 | Total reward = 39.05
2022-01-26 14:18:01.666 | DEBUG    | __main__:trials:26 - Trial = 19729/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.667 | DEBUG    | __main__:trials:29 - Trial = 19729/30000 | Total reward = 12.05
2022-01-26 14:18:01.671 | DEBUG    | __main__:trials:24 - Trial = 19730/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.673 | DEBUG    | __main__:trials:29 - Trial = 19730/30000 | Total reward = 43.15
2022-01-26 14:18:01.676 | DEBUG    | __main__:trials:24 - Trial = 19731/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.677 | DEBUG    | __main__:trials:29 - Trial = 19731/30000 | Total reward = 55.40
2022-01-26 14:18:01.681 | DEBUG    | __main__:trials:24 - Trial = 19732/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.682 | DEBUG    | __main__:trials:29 - Trial = 19732/30000 | Total reward = 55.96
2022-01-26 14:18:01.686 | DEBUG    | __main__:trials:24 - Trial = 19733/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.686 | DEBUG    | __main__:trials:29 - Trial = 19733/30000 | Total reward = 43.17
2022-01-26 14:18:01.691 | DEBUG    | __main__:trials:24 - Trial = 19734/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.692 | DEBUG    | __main__:trials:29 - Trial = 19734/30000 | Total reward = 54.78
2022-01-26 14:18:01.696 | DEBUG    | __main__:trials:24 - Trial = 19735/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.697 | DEBUG    | __main__:trials:29 - Trial = 19735/30000 | Total reward = 38.64
2022-01-26 14:18:01.701 | DEBUG    | __main__:trials:24 - Trial = 19736/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.703 | DEBUG    | __main__:trials:29 - Trial = 19736/30000 | Total reward = 26.87
2022-01-26 14:18:01.707 | DEBUG    | __main__:trials:24 - Trial = 19737/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.708 | DEBUG    | __main__:trials:29 - Trial = 19737/30000 | Total reward = 52.19
2022-01-26 14:18:01.711 | DEBUG    | __main__:trials:24 - Trial = 19738/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.713 | DEBUG    | __main__:trials:29 - Trial = 19738/30000 | Total reward = 54.87
2022-01-26 14:18:01.717 | DEBUG    | __main__:trials:24 - Trial = 19739/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.718 | DEBUG    | __main__:trials:29 - Trial = 19739/30000 | Total reward = 52.23
2022-01-26 14:18:01.721 | DEBUG    | __main__:trials:24 - Trial = 19740/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.722 | DEBUG    | __main__:trials:29 - Trial = 19740/30000 | Total reward = 52.54
2022-01-26 14:18:01.727 | DEBUG    | __main__:trials:24 - Trial = 19741/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.728 | DEBUG    | __main__:trials:29 - Trial = 19741/30000 | Total reward = 53.80
2022-01-26 14:18:01.732 | DEBUG    | __main__:trials:24 - Trial = 19742/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.734 | DEBUG    | __main__:trials:29 - Trial = 19742/30000 | Total reward = 47.91
2022-01-26 14:18:01.737 | DEBUG    | __main__:trials:24 - Trial = 19743/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.739 | DEBUG    | __main__:trials:29 - Trial = 19743/30000 | Total reward = 47.11
2022-01-26 14:18:01.742 | DEBUG    | __main__:trials:24 - Trial = 19744/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.744 | DEBUG    | __main__:trials:29 - Trial = 19744/30000 | Total reward = 48.89
2022-01-26 14:18:01.748 | DEBUG    | __main__:trials:24 - Trial = 19745/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.749 | DEBUG    | __main__:trials:29 - Trial = 19745/30000 | Total reward = 61.83
2022-01-26 14:18:01.752 | DEBUG    | __main__:trials:26 - Trial = 19746/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.753 | DEBUG    | __main__:trials:29 - Trial = 19746/30000 | Total reward = 10.15
2022-01-26 14:18:01.757 | DEBUG    | __main__:trials:24 - Trial = 19747/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.758 | DEBUG    | __main__:trials:29 - Trial = 19747/30000 | Total reward = 49.01
2022-01-26 14:18:01.761 | DEBUG    | __main__:trials:24 - Trial = 19748/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.762 | DEBUG    | __main__:trials:29 - Trial = 19748/30000 | Total reward = 52.78
2022-01-26 14:18:01.765 | DEBUG    | __main__:trials:24 - Trial = 19749/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.768 | DEBUG    | __main__:trials:29 - Trial = 19749/30000 | Total reward = 49.65
2022-01-26 14:18:01.771 | DEBUG    | __main__:trials:26 - Trial = 19750/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.773 | DEBUG    | __main__:trials:29 - Trial = 19750/30000 | Total reward = 34.47
2022-01-26 14:18:01.776 | DEBUG    | __main__:trials:26 - Trial = 19751/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.777 | DEBUG    | __main__:trials:29 - Trial = 19751/30000 | Total reward = 41.15
2022-01-26 14:18:01.780 | DEBUG    | __main__:trials:24 - Trial = 19752/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.781 | DEBUG    | __main__:trials:29 - Trial = 19752/30000 | Total reward = 52.20
2022-01-26 14:18:01.784 | DEBUG    | __main__:trials:24 - Trial = 19753/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.786 | DEBUG    | __main__:trials:29 - Trial = 19753/30000 | Total reward = 49.23
2022-01-26 14:18:01.788 | DEBUG    | __main__:trials:26 - Trial = 19754/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.789 | DEBUG    | __main__:trials:29 - Trial = 19754/30000 | Total reward = 17.30
2022-01-26 14:18:01.793 | DEBUG    | __main__:trials:24 - Trial = 19755/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.795 | DEBUG    | __main__:trials:29 - Trial = 19755/30000 | Total reward = 49.37
2022-01-26 14:18:01.798 | DEBUG    | __main__:trials:24 - Trial = 19756/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.800 | DEBUG    | __main__:trials:29 - Trial = 19756/30000 | Total reward = 55.70
2022-01-26 14:18:01.803 | DEBUG    | __main__:trials:24 - Trial = 19757/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.804 | DEBUG    | __main__:trials:29 - Trial = 19757/30000 | Total reward = 51.32
2022-01-26 14:18:01.808 | DEBUG    | __main__:trials:26 - Trial = 19758/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.810 | DEBUG    | __main__:trials:29 - Trial = 19758/30000 | Total reward = 43.85
2022-01-26 14:18:01.814 | DEBUG    | __main__:trials:24 - Trial = 19759/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.815 | DEBUG    | __main__:trials:29 - Trial = 19759/30000 | Total reward = 56.15
2022-01-26 14:18:01.819 | DEBUG    | __main__:trials:24 - Trial = 19760/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.821 | DEBUG    | __main__:trials:29 - Trial = 19760/30000 | Total reward = 27.17
2022-01-26 14:18:01.825 | DEBUG    | __main__:trials:24 - Trial = 19761/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.826 | DEBUG    | __main__:trials:29 - Trial = 19761/30000 | Total reward = 48.40
2022-01-26 14:18:01.829 | DEBUG    | __main__:trials:24 - Trial = 19762/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.830 | DEBUG    | __main__:trials:29 - Trial = 19762/30000 | Total reward = 51.02
2022-01-26 14:18:01.833 | DEBUG    | __main__:trials:24 - Trial = 19763/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.835 | DEBUG    | __main__:trials:29 - Trial = 19763/30000 | Total reward = 46.49
2022-01-26 14:18:01.837 | DEBUG    | __main__:trials:26 - Trial = 19764/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.838 | DEBUG    | __main__:trials:29 - Trial = 19764/30000 | Total reward = 7.70
2022-01-26 14:18:01.840 | DEBUG    | __main__:trials:26 - Trial = 19765/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.841 | DEBUG    | __main__:trials:29 - Trial = 19765/30000 | Total reward = 7.70
2022-01-26 14:18:01.845 | DEBUG    | __main__:trials:24 - Trial = 19766/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.846 | DEBUG    | __main__:trials:29 - Trial = 19766/30000 | Total reward = 54.24
2022-01-26 14:18:01.849 | DEBUG    | __main__:trials:24 - Trial = 19767/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.850 | DEBUG    | __main__:trials:29 - Trial = 19767/30000 | Total reward = 56.77
2022-01-26 14:18:01.854 | DEBUG    | __main__:trials:24 - Trial = 19768/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.856 | DEBUG    | __main__:trials:29 - Trial = 19768/30000 | Total reward = 52.45
2022-01-26 14:18:01.859 | DEBUG    | __main__:trials:24 - Trial = 19769/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.861 | DEBUG    | __main__:trials:29 - Trial = 19769/30000 | Total reward = 52.13
2022-01-26 14:18:01.864 | DEBUG    | __main__:trials:24 - Trial = 19770/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.866 | DEBUG    | __main__:trials:29 - Trial = 19770/30000 | Total reward = 50.61
2022-01-26 14:18:01.870 | DEBUG    | __main__:trials:24 - Trial = 19771/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.870 | DEBUG    | __main__:trials:29 - Trial = 19771/30000 | Total reward = 39.88
2022-01-26 14:18:01.875 | DEBUG    | __main__:trials:24 - Trial = 19772/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.876 | DEBUG    | __main__:trials:29 - Trial = 19772/30000 | Total reward = 33.24
2022-01-26 14:18:01.880 | DEBUG    | __main__:trials:24 - Trial = 19773/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.882 | DEBUG    | __main__:trials:29 - Trial = 19773/30000 | Total reward = 51.56
2022-01-26 14:18:01.886 | DEBUG    | __main__:trials:24 - Trial = 19774/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.887 | DEBUG    | __main__:trials:29 - Trial = 19774/30000 | Total reward = 37.16
2022-01-26 14:18:01.890 | DEBUG    | __main__:trials:24 - Trial = 19775/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.892 | DEBUG    | __main__:trials:29 - Trial = 19775/30000 | Total reward = 51.75
2022-01-26 14:18:01.896 | DEBUG    | __main__:trials:24 - Trial = 19776/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.897 | DEBUG    | __main__:trials:29 - Trial = 19776/30000 | Total reward = 56.30
2022-01-26 14:18:01.901 | DEBUG    | __main__:trials:24 - Trial = 19777/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.903 | DEBUG    | __main__:trials:29 - Trial = 19777/30000 | Total reward = 36.37
2022-01-26 14:18:01.905 | DEBUG    | __main__:trials:24 - Trial = 19778/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.906 | DEBUG    | __main__:trials:29 - Trial = 19778/30000 | Total reward = 51.87
2022-01-26 14:18:01.910 | DEBUG    | __main__:trials:24 - Trial = 19779/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.912 | DEBUG    | __main__:trials:29 - Trial = 19779/30000 | Total reward = 52.41
2022-01-26 14:18:01.914 | DEBUG    | __main__:trials:24 - Trial = 19780/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.916 | DEBUG    | __main__:trials:29 - Trial = 19780/30000 | Total reward = 50.39
2022-01-26 14:18:01.919 | DEBUG    | __main__:trials:24 - Trial = 19781/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.921 | DEBUG    | __main__:trials:29 - Trial = 19781/30000 | Total reward = 55.34
2022-01-26 14:18:01.923 | DEBUG    | __main__:trials:26 - Trial = 19782/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:01.925 | DEBUG    | __main__:trials:29 - Trial = 19782/30000 | Total reward = 12.37
2022-01-26 14:18:01.929 | DEBUG    | __main__:trials:24 - Trial = 19783/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.929 | DEBUG    | __main__:trials:29 - Trial = 19783/30000 | Total reward = 49.48
2022-01-26 14:18:01.933 | DEBUG    | __main__:trials:24 - Trial = 19784/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.935 | DEBUG    | __main__:trials:29 - Trial = 19784/30000 | Total reward = 50.66
2022-01-26 14:18:01.937 | DEBUG    | __main__:trials:24 - Trial = 19785/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.939 | DEBUG    | __main__:trials:29 - Trial = 19785/30000 | Total reward = 61.06
2022-01-26 14:18:01.942 | DEBUG    | __main__:trials:24 - Trial = 19786/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.943 | DEBUG    | __main__:trials:29 - Trial = 19786/30000 | Total reward = 57.61
2022-01-26 14:18:01.946 | DEBUG    | __main__:trials:24 - Trial = 19787/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.948 | DEBUG    | __main__:trials:29 - Trial = 19787/30000 | Total reward = 62.85
2022-01-26 14:18:01.951 | DEBUG    | __main__:trials:24 - Trial = 19788/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.953 | DEBUG    | __main__:trials:29 - Trial = 19788/30000 | Total reward = 52.93
2022-01-26 14:18:01.956 | DEBUG    | __main__:trials:24 - Trial = 19789/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.958 | DEBUG    | __main__:trials:29 - Trial = 19789/30000 | Total reward = 58.01
2022-01-26 14:18:01.961 | DEBUG    | __main__:trials:24 - Trial = 19790/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.962 | DEBUG    | __main__:trials:29 - Trial = 19790/30000 | Total reward = 48.41
2022-01-26 14:18:01.965 | DEBUG    | __main__:trials:24 - Trial = 19791/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.966 | DEBUG    | __main__:trials:29 - Trial = 19791/30000 | Total reward = 51.21
2022-01-26 14:18:01.969 | DEBUG    | __main__:trials:24 - Trial = 19792/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.971 | DEBUG    | __main__:trials:29 - Trial = 19792/30000 | Total reward = 33.06
2022-01-26 14:18:01.974 | DEBUG    | __main__:trials:24 - Trial = 19793/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.976 | DEBUG    | __main__:trials:29 - Trial = 19793/30000 | Total reward = 49.01
2022-01-26 14:18:01.979 | DEBUG    | __main__:trials:24 - Trial = 19794/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.981 | DEBUG    | __main__:trials:29 - Trial = 19794/30000 | Total reward = 51.07
2022-01-26 14:18:01.985 | DEBUG    | __main__:trials:24 - Trial = 19795/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.985 | DEBUG    | __main__:trials:29 - Trial = 19795/30000 | Total reward = 52.13
2022-01-26 14:18:01.990 | DEBUG    | __main__:trials:24 - Trial = 19796/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.991 | DEBUG    | __main__:trials:29 - Trial = 19796/30000 | Total reward = 55.84
2022-01-26 14:18:01.995 | DEBUG    | __main__:trials:24 - Trial = 19797/30000 | Max number of steps (20) reached
2022-01-26 14:18:01.996 | DEBUG    | __main__:trials:29 - Trial = 19797/30000 | Total reward = 52.13
2022-01-26 14:18:02.000 | DEBUG    | __main__:trials:24 - Trial = 19798/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.002 | DEBUG    | __main__:trials:29 - Trial = 19798/30000 | Total reward = 47.30
2022-01-26 14:18:02.006 | DEBUG    | __main__:trials:24 - Trial = 19799/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.007 | DEBUG    | __main__:trials:29 - Trial = 19799/30000 | Total reward = 53.44
2022-01-26 14:18:02.011 | DEBUG    | __main__:trials:24 - Trial = 19800/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.013 | DEBUG    | __main__:trials:29 - Trial = 19800/30000 | Total reward = 52.13
2022-01-26 14:18:02.015 | DEBUG    | __main__:trials:24 - Trial = 19801/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.017 | DEBUG    | __main__:trials:29 - Trial = 19801/30000 | Total reward = 53.42
2022-01-26 14:18:02.021 | DEBUG    | __main__:trials:24 - Trial = 19802/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.023 | DEBUG    | __main__:trials:29 - Trial = 19802/30000 | Total reward = 52.79
2022-01-26 14:18:02.027 | DEBUG    | __main__:trials:24 - Trial = 19803/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.027 | DEBUG    | __main__:trials:29 - Trial = 19803/30000 | Total reward = 51.39
2022-01-26 14:18:02.032 | DEBUG    | __main__:trials:24 - Trial = 19804/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.034 | DEBUG    | __main__:trials:29 - Trial = 19804/30000 | Total reward = 49.15
2022-01-26 14:18:02.036 | DEBUG    | __main__:trials:26 - Trial = 19805/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.037 | DEBUG    | __main__:trials:29 - Trial = 19805/30000 | Total reward = 7.12
2022-01-26 14:18:02.040 | DEBUG    | __main__:trials:26 - Trial = 19806/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.041 | DEBUG    | __main__:trials:29 - Trial = 19806/30000 | Total reward = 7.12
2022-01-26 14:18:02.044 | DEBUG    | __main__:trials:24 - Trial = 19807/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.045 | DEBUG    | __main__:trials:29 - Trial = 19807/30000 | Total reward = 52.27
2022-01-26 14:18:02.048 | DEBUG    | __main__:trials:24 - Trial = 19808/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.050 | DEBUG    | __main__:trials:29 - Trial = 19808/30000 | Total reward = 51.93
2022-01-26 14:18:02.053 | DEBUG    | __main__:trials:24 - Trial = 19809/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.054 | DEBUG    | __main__:trials:29 - Trial = 19809/30000 | Total reward = 51.87
2022-01-26 14:18:02.057 | DEBUG    | __main__:trials:24 - Trial = 19810/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.058 | DEBUG    | __main__:trials:29 - Trial = 19810/30000 | Total reward = 53.09
2022-01-26 14:18:02.062 | DEBUG    | __main__:trials:24 - Trial = 19811/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.062 | DEBUG    | __main__:trials:29 - Trial = 19811/30000 | Total reward = 48.14
2022-01-26 14:18:02.066 | DEBUG    | __main__:trials:24 - Trial = 19812/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.068 | DEBUG    | __main__:trials:29 - Trial = 19812/30000 | Total reward = 52.96
2022-01-26 14:18:02.072 | DEBUG    | __main__:trials:24 - Trial = 19813/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.074 | DEBUG    | __main__:trials:29 - Trial = 19813/30000 | Total reward = 52.11
2022-01-26 14:18:02.077 | DEBUG    | __main__:trials:24 - Trial = 19814/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.079 | DEBUG    | __main__:trials:29 - Trial = 19814/30000 | Total reward = 48.37
2022-01-26 14:18:02.083 | DEBUG    | __main__:trials:24 - Trial = 19815/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.084 | DEBUG    | __main__:trials:29 - Trial = 19815/30000 | Total reward = 51.21
2022-01-26 14:18:02.087 | DEBUG    | __main__:trials:24 - Trial = 19816/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.089 | DEBUG    | __main__:trials:29 - Trial = 19816/30000 | Total reward = 55.64
2022-01-26 14:18:02.093 | DEBUG    | __main__:trials:24 - Trial = 19817/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.094 | DEBUG    | __main__:trials:29 - Trial = 19817/30000 | Total reward = 50.67
2022-01-26 14:18:02.098 | DEBUG    | __main__:trials:24 - Trial = 19818/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.101 | DEBUG    | __main__:trials:29 - Trial = 19818/30000 | Total reward = 37.47
2022-01-26 14:18:02.104 | DEBUG    | __main__:trials:24 - Trial = 19819/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.106 | DEBUG    | __main__:trials:29 - Trial = 19819/30000 | Total reward = 50.48
2022-01-26 14:18:02.110 | DEBUG    | __main__:trials:24 - Trial = 19820/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.111 | DEBUG    | __main__:trials:29 - Trial = 19820/30000 | Total reward = 51.89
2022-01-26 14:18:02.114 | DEBUG    | __main__:trials:24 - Trial = 19821/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.116 | DEBUG    | __main__:trials:29 - Trial = 19821/30000 | Total reward = 52.79
2022-01-26 14:18:02.118 | DEBUG    | __main__:trials:26 - Trial = 19822/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.119 | DEBUG    | __main__:trials:29 - Trial = 19822/30000 | Total reward = 7.70
2022-01-26 14:18:02.123 | DEBUG    | __main__:trials:24 - Trial = 19823/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.125 | DEBUG    | __main__:trials:29 - Trial = 19823/30000 | Total reward = 52.53
2022-01-26 14:18:02.126 | DEBUG    | __main__:trials:26 - Trial = 19824/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.128 | DEBUG    | __main__:trials:29 - Trial = 19824/30000 | Total reward = 9.99
2022-01-26 14:18:02.131 | DEBUG    | __main__:trials:24 - Trial = 19825/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.133 | DEBUG    | __main__:trials:29 - Trial = 19825/30000 | Total reward = 59.71
2022-01-26 14:18:02.137 | DEBUG    | __main__:trials:24 - Trial = 19826/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.138 | DEBUG    | __main__:trials:29 - Trial = 19826/30000 | Total reward = 52.26
2022-01-26 14:18:02.141 | DEBUG    | __main__:trials:24 - Trial = 19827/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.143 | DEBUG    | __main__:trials:29 - Trial = 19827/30000 | Total reward = 51.58
2022-01-26 14:18:02.146 | DEBUG    | __main__:trials:24 - Trial = 19828/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.148 | DEBUG    | __main__:trials:29 - Trial = 19828/30000 | Total reward = 51.11
2022-01-26 14:18:02.152 | DEBUG    | __main__:trials:24 - Trial = 19829/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.153 | DEBUG    | __main__:trials:29 - Trial = 19829/30000 | Total reward = 52.28
2022-01-26 14:18:02.157 | DEBUG    | __main__:trials:24 - Trial = 19830/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.158 | DEBUG    | __main__:trials:29 - Trial = 19830/30000 | Total reward = 45.23
2022-01-26 14:18:02.163 | DEBUG    | __main__:trials:24 - Trial = 19831/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.163 | DEBUG    | __main__:trials:29 - Trial = 19831/30000 | Total reward = 61.06
2022-01-26 14:18:02.168 | DEBUG    | __main__:trials:24 - Trial = 19832/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.168 | DEBUG    | __main__:trials:29 - Trial = 19832/30000 | Total reward = 53.60
2022-01-26 14:18:02.172 | DEBUG    | __main__:trials:24 - Trial = 19833/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.173 | DEBUG    | __main__:trials:29 - Trial = 19833/30000 | Total reward = 47.43
2022-01-26 14:18:02.175 | DEBUG    | __main__:trials:26 - Trial = 19834/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.177 | DEBUG    | __main__:trials:29 - Trial = 19834/30000 | Total reward = 9.99
2022-01-26 14:18:02.181 | DEBUG    | __main__:trials:24 - Trial = 19835/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.182 | DEBUG    | __main__:trials:29 - Trial = 19835/30000 | Total reward = 51.01
2022-01-26 14:18:02.186 | DEBUG    | __main__:trials:24 - Trial = 19836/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.187 | DEBUG    | __main__:trials:29 - Trial = 19836/30000 | Total reward = 49.36
2022-01-26 14:18:02.191 | DEBUG    | __main__:trials:24 - Trial = 19837/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.191 | DEBUG    | __main__:trials:29 - Trial = 19837/30000 | Total reward = 53.39
2022-01-26 14:18:02.195 | DEBUG    | __main__:trials:24 - Trial = 19838/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.196 | DEBUG    | __main__:trials:29 - Trial = 19838/30000 | Total reward = 51.88
2022-01-26 14:18:02.200 | DEBUG    | __main__:trials:24 - Trial = 19839/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.201 | DEBUG    | __main__:trials:29 - Trial = 19839/30000 | Total reward = 53.29
2022-01-26 14:18:02.206 | DEBUG    | __main__:trials:24 - Trial = 19840/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.207 | DEBUG    | __main__:trials:29 - Trial = 19840/30000 | Total reward = 47.03
2022-01-26 14:18:02.211 | DEBUG    | __main__:trials:24 - Trial = 19841/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.212 | DEBUG    | __main__:trials:29 - Trial = 19841/30000 | Total reward = 55.46
2022-01-26 14:18:02.216 | DEBUG    | __main__:trials:26 - Trial = 19842/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.216 | DEBUG    | __main__:trials:29 - Trial = 19842/30000 | Total reward = 27.46
2022-01-26 14:18:02.221 | DEBUG    | __main__:trials:24 - Trial = 19843/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.222 | DEBUG    | __main__:trials:29 - Trial = 19843/30000 | Total reward = 52.30
2022-01-26 14:18:02.226 | DEBUG    | __main__:trials:24 - Trial = 19844/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.227 | DEBUG    | __main__:trials:29 - Trial = 19844/30000 | Total reward = 52.78
2022-01-26 14:18:02.231 | DEBUG    | __main__:trials:24 - Trial = 19845/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.232 | DEBUG    | __main__:trials:29 - Trial = 19845/30000 | Total reward = 51.76
2022-01-26 14:18:02.235 | DEBUG    | __main__:trials:24 - Trial = 19846/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.237 | DEBUG    | __main__:trials:29 - Trial = 19846/30000 | Total reward = 49.10
2022-01-26 14:18:02.241 | DEBUG    | __main__:trials:24 - Trial = 19847/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.242 | DEBUG    | __main__:trials:29 - Trial = 19847/30000 | Total reward = 52.01
2022-01-26 14:18:02.246 | DEBUG    | __main__:trials:24 - Trial = 19848/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.248 | DEBUG    | __main__:trials:29 - Trial = 19848/30000 | Total reward = 52.13
2022-01-26 14:18:02.251 | DEBUG    | __main__:trials:24 - Trial = 19849/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.253 | DEBUG    | __main__:trials:29 - Trial = 19849/30000 | Total reward = 45.74
2022-01-26 14:18:02.257 | DEBUG    | __main__:trials:24 - Trial = 19850/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.257 | DEBUG    | __main__:trials:29 - Trial = 19850/30000 | Total reward = 50.89
2022-01-26 14:18:02.261 | DEBUG    | __main__:trials:24 - Trial = 19851/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.263 | DEBUG    | __main__:trials:29 - Trial = 19851/30000 | Total reward = 45.65
2022-01-26 14:18:02.266 | DEBUG    | __main__:trials:24 - Trial = 19852/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.266 | DEBUG    | __main__:trials:29 - Trial = 19852/30000 | Total reward = 39.05
2022-01-26 14:18:02.270 | DEBUG    | __main__:trials:24 - Trial = 19853/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.272 | DEBUG    | __main__:trials:29 - Trial = 19853/30000 | Total reward = 48.93
2022-01-26 14:18:02.276 | DEBUG    | __main__:trials:24 - Trial = 19854/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.276 | DEBUG    | __main__:trials:29 - Trial = 19854/30000 | Total reward = 47.49
2022-01-26 14:18:02.281 | DEBUG    | __main__:trials:24 - Trial = 19855/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.282 | DEBUG    | __main__:trials:29 - Trial = 19855/30000 | Total reward = 43.78
2022-01-26 14:18:02.287 | DEBUG    | __main__:trials:24 - Trial = 19856/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.288 | DEBUG    | __main__:trials:29 - Trial = 19856/30000 | Total reward = 40.84
2022-01-26 14:18:02.292 | DEBUG    | __main__:trials:24 - Trial = 19857/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.293 | DEBUG    | __main__:trials:29 - Trial = 19857/30000 | Total reward = 51.36
2022-01-26 14:18:02.296 | DEBUG    | __main__:trials:24 - Trial = 19858/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.298 | DEBUG    | __main__:trials:29 - Trial = 19858/30000 | Total reward = 48.22
2022-01-26 14:18:02.302 | DEBUG    | __main__:trials:24 - Trial = 19859/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.303 | DEBUG    | __main__:trials:29 - Trial = 19859/30000 | Total reward = 39.36
2022-01-26 14:18:02.306 | DEBUG    | __main__:trials:24 - Trial = 19860/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.308 | DEBUG    | __main__:trials:29 - Trial = 19860/30000 | Total reward = 46.42
2022-01-26 14:18:02.312 | DEBUG    | __main__:trials:24 - Trial = 19861/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.314 | DEBUG    | __main__:trials:29 - Trial = 19861/30000 | Total reward = 52.19
2022-01-26 14:18:02.317 | DEBUG    | __main__:trials:24 - Trial = 19862/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.319 | DEBUG    | __main__:trials:29 - Trial = 19862/30000 | Total reward = 52.15
2022-01-26 14:18:02.323 | DEBUG    | __main__:trials:24 - Trial = 19863/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.324 | DEBUG    | __main__:trials:29 - Trial = 19863/30000 | Total reward = 52.13
2022-01-26 14:18:02.328 | DEBUG    | __main__:trials:24 - Trial = 19864/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.330 | DEBUG    | __main__:trials:29 - Trial = 19864/30000 | Total reward = 53.94
2022-01-26 14:18:02.333 | DEBUG    | __main__:trials:24 - Trial = 19865/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.335 | DEBUG    | __main__:trials:29 - Trial = 19865/30000 | Total reward = 52.97
2022-01-26 14:18:02.339 | DEBUG    | __main__:trials:24 - Trial = 19866/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.340 | DEBUG    | __main__:trials:29 - Trial = 19866/30000 | Total reward = 55.55
2022-01-26 14:18:02.344 | DEBUG    | __main__:trials:24 - Trial = 19867/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.345 | DEBUG    | __main__:trials:29 - Trial = 19867/30000 | Total reward = 52.17
2022-01-26 14:18:02.349 | DEBUG    | __main__:trials:24 - Trial = 19868/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.351 | DEBUG    | __main__:trials:29 - Trial = 19868/30000 | Total reward = 47.10
2022-01-26 14:18:02.355 | DEBUG    | __main__:trials:24 - Trial = 19869/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.355 | DEBUG    | __main__:trials:29 - Trial = 19869/30000 | Total reward = 51.72
2022-01-26 14:18:02.360 | DEBUG    | __main__:trials:24 - Trial = 19870/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.360 | DEBUG    | __main__:trials:29 - Trial = 19870/30000 | Total reward = 51.26
2022-01-26 14:18:02.365 | DEBUG    | __main__:trials:24 - Trial = 19871/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.366 | DEBUG    | __main__:trials:29 - Trial = 19871/30000 | Total reward = 47.34
2022-01-26 14:18:02.369 | DEBUG    | __main__:trials:24 - Trial = 19872/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.371 | DEBUG    | __main__:trials:29 - Trial = 19872/30000 | Total reward = 45.70
2022-01-26 14:18:02.374 | DEBUG    | __main__:trials:24 - Trial = 19873/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.376 | DEBUG    | __main__:trials:29 - Trial = 19873/30000 | Total reward = 49.38
2022-01-26 14:18:02.379 | DEBUG    | __main__:trials:24 - Trial = 19874/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.381 | DEBUG    | __main__:trials:29 - Trial = 19874/30000 | Total reward = 51.29
2022-01-26 14:18:02.385 | DEBUG    | __main__:trials:24 - Trial = 19875/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.386 | DEBUG    | __main__:trials:29 - Trial = 19875/30000 | Total reward = 51.77
2022-01-26 14:18:02.389 | DEBUG    | __main__:trials:24 - Trial = 19876/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.390 | DEBUG    | __main__:trials:29 - Trial = 19876/30000 | Total reward = 46.13
2022-01-26 14:18:02.394 | DEBUG    | __main__:trials:24 - Trial = 19877/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.396 | DEBUG    | __main__:trials:29 - Trial = 19877/30000 | Total reward = 52.13
2022-01-26 14:18:02.400 | DEBUG    | __main__:trials:24 - Trial = 19878/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.402 | DEBUG    | __main__:trials:29 - Trial = 19878/30000 | Total reward = 60.04
2022-01-26 14:18:02.406 | DEBUG    | __main__:trials:24 - Trial = 19879/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.406 | DEBUG    | __main__:trials:29 - Trial = 19879/30000 | Total reward = 50.04
2022-01-26 14:18:02.411 | DEBUG    | __main__:trials:24 - Trial = 19880/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.412 | DEBUG    | __main__:trials:29 - Trial = 19880/30000 | Total reward = 46.01
2022-01-26 14:18:02.416 | DEBUG    | __main__:trials:24 - Trial = 19881/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.417 | DEBUG    | __main__:trials:29 - Trial = 19881/30000 | Total reward = 45.01
2022-01-26 14:18:02.421 | DEBUG    | __main__:trials:24 - Trial = 19882/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.422 | DEBUG    | __main__:trials:29 - Trial = 19882/30000 | Total reward = 49.66
2022-01-26 14:18:02.425 | DEBUG    | __main__:trials:24 - Trial = 19883/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.426 | DEBUG    | __main__:trials:29 - Trial = 19883/30000 | Total reward = 53.71
2022-01-26 14:18:02.431 | DEBUG    | __main__:trials:24 - Trial = 19884/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.432 | DEBUG    | __main__:trials:29 - Trial = 19884/30000 | Total reward = 49.78
2022-01-26 14:18:02.436 | DEBUG    | __main__:trials:24 - Trial = 19885/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.437 | DEBUG    | __main__:trials:29 - Trial = 19885/30000 | Total reward = 45.99
2022-01-26 14:18:02.441 | DEBUG    | __main__:trials:24 - Trial = 19886/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.442 | DEBUG    | __main__:trials:29 - Trial = 19886/30000 | Total reward = 52.43
2022-01-26 14:18:02.446 | DEBUG    | __main__:trials:24 - Trial = 19887/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.448 | DEBUG    | __main__:trials:29 - Trial = 19887/30000 | Total reward = 45.09
2022-01-26 14:18:02.451 | DEBUG    | __main__:trials:24 - Trial = 19888/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.452 | DEBUG    | __main__:trials:29 - Trial = 19888/30000 | Total reward = 55.73
2022-01-26 14:18:02.456 | DEBUG    | __main__:trials:24 - Trial = 19889/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.457 | DEBUG    | __main__:trials:29 - Trial = 19889/30000 | Total reward = 51.69
2022-01-26 14:18:02.462 | DEBUG    | __main__:trials:24 - Trial = 19890/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.463 | DEBUG    | __main__:trials:29 - Trial = 19890/30000 | Total reward = 43.93
2022-01-26 14:18:02.467 | DEBUG    | __main__:trials:24 - Trial = 19891/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.468 | DEBUG    | __main__:trials:29 - Trial = 19891/30000 | Total reward = 43.72
2022-01-26 14:18:02.472 | DEBUG    | __main__:trials:24 - Trial = 19892/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.473 | DEBUG    | __main__:trials:29 - Trial = 19892/30000 | Total reward = 43.27
2022-01-26 14:18:02.477 | DEBUG    | __main__:trials:24 - Trial = 19893/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.479 | DEBUG    | __main__:trials:29 - Trial = 19893/30000 | Total reward = 47.91
2022-01-26 14:18:02.482 | DEBUG    | __main__:trials:24 - Trial = 19894/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.483 | DEBUG    | __main__:trials:29 - Trial = 19894/30000 | Total reward = 52.78
2022-01-26 14:18:02.488 | DEBUG    | __main__:trials:24 - Trial = 19895/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.488 | DEBUG    | __main__:trials:29 - Trial = 19895/30000 | Total reward = 44.07
2022-01-26 14:18:02.492 | DEBUG    | __main__:trials:24 - Trial = 19896/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.494 | DEBUG    | __main__:trials:29 - Trial = 19896/30000 | Total reward = 58.38
2022-01-26 14:18:02.497 | DEBUG    | __main__:trials:24 - Trial = 19897/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.498 | DEBUG    | __main__:trials:29 - Trial = 19897/30000 | Total reward = 51.04
2022-01-26 14:18:02.502 | DEBUG    | __main__:trials:24 - Trial = 19898/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.504 | DEBUG    | __main__:trials:29 - Trial = 19898/30000 | Total reward = 47.62
2022-01-26 14:18:02.507 | DEBUG    | __main__:trials:24 - Trial = 19899/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.509 | DEBUG    | __main__:trials:29 - Trial = 19899/30000 | Total reward = 51.78
2022-01-26 14:18:02.512 | DEBUG    | __main__:trials:24 - Trial = 19900/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.514 | DEBUG    | __main__:trials:29 - Trial = 19900/30000 | Total reward = 60.92
2022-01-26 14:18:02.518 | DEBUG    | __main__:trials:24 - Trial = 19901/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.519 | DEBUG    | __main__:trials:29 - Trial = 19901/30000 | Total reward = 49.59
2022-01-26 14:18:02.522 | DEBUG    | __main__:trials:24 - Trial = 19902/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.524 | DEBUG    | __main__:trials:29 - Trial = 19902/30000 | Total reward = 36.73
2022-01-26 14:18:02.528 | DEBUG    | __main__:trials:24 - Trial = 19903/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.529 | DEBUG    | __main__:trials:29 - Trial = 19903/30000 | Total reward = 51.64
2022-01-26 14:18:02.533 | DEBUG    | __main__:trials:24 - Trial = 19904/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.534 | DEBUG    | __main__:trials:29 - Trial = 19904/30000 | Total reward = 45.08
2022-01-26 14:18:02.538 | DEBUG    | __main__:trials:24 - Trial = 19905/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.539 | DEBUG    | __main__:trials:29 - Trial = 19905/30000 | Total reward = 47.97
2022-01-26 14:18:02.543 | DEBUG    | __main__:trials:24 - Trial = 19906/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.544 | DEBUG    | __main__:trials:29 - Trial = 19906/30000 | Total reward = 45.65
2022-01-26 14:18:02.547 | DEBUG    | __main__:trials:24 - Trial = 19907/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.549 | DEBUG    | __main__:trials:29 - Trial = 19907/30000 | Total reward = 37.33
2022-01-26 14:18:02.553 | DEBUG    | __main__:trials:24 - Trial = 19908/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.554 | DEBUG    | __main__:trials:29 - Trial = 19908/30000 | Total reward = 45.04
2022-01-26 14:18:02.557 | DEBUG    | __main__:trials:24 - Trial = 19909/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.559 | DEBUG    | __main__:trials:29 - Trial = 19909/30000 | Total reward = 53.00
2022-01-26 14:18:02.563 | DEBUG    | __main__:trials:24 - Trial = 19910/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.565 | DEBUG    | __main__:trials:29 - Trial = 19910/30000 | Total reward = 50.71
2022-01-26 14:18:02.568 | DEBUG    | __main__:trials:24 - Trial = 19911/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.570 | DEBUG    | __main__:trials:29 - Trial = 19911/30000 | Total reward = 52.23
2022-01-26 14:18:02.574 | DEBUG    | __main__:trials:24 - Trial = 19912/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.575 | DEBUG    | __main__:trials:29 - Trial = 19912/30000 | Total reward = 52.38
2022-01-26 14:18:02.579 | DEBUG    | __main__:trials:24 - Trial = 19913/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.581 | DEBUG    | __main__:trials:29 - Trial = 19913/30000 | Total reward = 37.05
2022-01-26 14:18:02.585 | DEBUG    | __main__:trials:26 - Trial = 19914/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.586 | DEBUG    | __main__:trials:29 - Trial = 19914/30000 | Total reward = 25.57
2022-01-26 14:18:02.590 | DEBUG    | __main__:trials:24 - Trial = 19915/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.592 | DEBUG    | __main__:trials:29 - Trial = 19915/30000 | Total reward = 48.66
2022-01-26 14:18:02.595 | DEBUG    | __main__:trials:24 - Trial = 19916/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.597 | DEBUG    | __main__:trials:29 - Trial = 19916/30000 | Total reward = 45.13
2022-01-26 14:18:02.600 | DEBUG    | __main__:trials:26 - Trial = 19917/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.601 | DEBUG    | __main__:trials:29 - Trial = 19917/30000 | Total reward = 32.92
2022-01-26 14:18:02.606 | DEBUG    | __main__:trials:24 - Trial = 19918/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.606 | DEBUG    | __main__:trials:29 - Trial = 19918/30000 | Total reward = 49.30
2022-01-26 14:18:02.611 | DEBUG    | __main__:trials:24 - Trial = 19919/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.611 | DEBUG    | __main__:trials:29 - Trial = 19919/30000 | Total reward = 47.99
2022-01-26 14:18:02.616 | DEBUG    | __main__:trials:24 - Trial = 19920/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.618 | DEBUG    | __main__:trials:29 - Trial = 19920/30000 | Total reward = 38.79
2022-01-26 14:18:02.621 | DEBUG    | __main__:trials:24 - Trial = 19921/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.623 | DEBUG    | __main__:trials:29 - Trial = 19921/30000 | Total reward = 48.22
2022-01-26 14:18:02.627 | DEBUG    | __main__:trials:24 - Trial = 19922/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.627 | DEBUG    | __main__:trials:29 - Trial = 19922/30000 | Total reward = 52.54
2022-01-26 14:18:02.632 | DEBUG    | __main__:trials:24 - Trial = 19923/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.633 | DEBUG    | __main__:trials:29 - Trial = 19923/30000 | Total reward = 48.04
2022-01-26 14:18:02.636 | DEBUG    | __main__:trials:24 - Trial = 19924/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.638 | DEBUG    | __main__:trials:29 - Trial = 19924/30000 | Total reward = 51.23
2022-01-26 14:18:02.641 | DEBUG    | __main__:trials:24 - Trial = 19925/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.642 | DEBUG    | __main__:trials:29 - Trial = 19925/30000 | Total reward = 50.66
2022-01-26 14:18:02.645 | DEBUG    | __main__:trials:24 - Trial = 19926/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.646 | DEBUG    | __main__:trials:29 - Trial = 19926/30000 | Total reward = 52.13
2022-01-26 14:18:02.649 | DEBUG    | __main__:trials:24 - Trial = 19927/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.650 | DEBUG    | __main__:trials:29 - Trial = 19927/30000 | Total reward = 51.13
2022-01-26 14:18:02.654 | DEBUG    | __main__:trials:24 - Trial = 19928/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.655 | DEBUG    | __main__:trials:29 - Trial = 19928/30000 | Total reward = 39.80
2022-01-26 14:18:02.658 | DEBUG    | __main__:trials:24 - Trial = 19929/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.660 | DEBUG    | __main__:trials:29 - Trial = 19929/30000 | Total reward = 53.44
2022-01-26 14:18:02.663 | DEBUG    | __main__:trials:24 - Trial = 19930/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.665 | DEBUG    | __main__:trials:29 - Trial = 19930/30000 | Total reward = 53.18
2022-01-26 14:18:02.668 | DEBUG    | __main__:trials:24 - Trial = 19931/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.670 | DEBUG    | __main__:trials:29 - Trial = 19931/30000 | Total reward = 52.78
2022-01-26 14:18:02.673 | DEBUG    | __main__:trials:24 - Trial = 19932/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.675 | DEBUG    | __main__:trials:29 - Trial = 19932/30000 | Total reward = 52.97
2022-01-26 14:18:02.679 | DEBUG    | __main__:trials:24 - Trial = 19933/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.681 | DEBUG    | __main__:trials:29 - Trial = 19933/30000 | Total reward = 52.13
2022-01-26 14:18:02.684 | DEBUG    | __main__:trials:26 - Trial = 19934/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.685 | DEBUG    | __main__:trials:29 - Trial = 19934/30000 | Total reward = 22.38
2022-01-26 14:18:02.689 | DEBUG    | __main__:trials:26 - Trial = 19935/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.690 | DEBUG    | __main__:trials:29 - Trial = 19935/30000 | Total reward = 30.92
2022-01-26 14:18:02.693 | DEBUG    | __main__:trials:26 - Trial = 19936/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.693 | DEBUG    | __main__:trials:29 - Trial = 19936/30000 | Total reward = 11.80
2022-01-26 14:18:02.698 | DEBUG    | __main__:trials:24 - Trial = 19937/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.698 | DEBUG    | __main__:trials:29 - Trial = 19937/30000 | Total reward = 51.11
2022-01-26 14:18:02.701 | DEBUG    | __main__:trials:26 - Trial = 19938/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.703 | DEBUG    | __main__:trials:29 - Trial = 19938/30000 | Total reward = 24.37
2022-01-26 14:18:02.707 | DEBUG    | __main__:trials:24 - Trial = 19939/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.708 | DEBUG    | __main__:trials:29 - Trial = 19939/30000 | Total reward = 51.34
2022-01-26 14:18:02.711 | DEBUG    | __main__:trials:24 - Trial = 19940/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.713 | DEBUG    | __main__:trials:29 - Trial = 19940/30000 | Total reward = 48.99
2022-01-26 14:18:02.717 | DEBUG    | __main__:trials:24 - Trial = 19941/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.718 | DEBUG    | __main__:trials:29 - Trial = 19941/30000 | Total reward = 52.13
2022-01-26 14:18:02.721 | DEBUG    | __main__:trials:24 - Trial = 19942/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.723 | DEBUG    | __main__:trials:29 - Trial = 19942/30000 | Total reward = 41.21
2022-01-26 14:18:02.726 | DEBUG    | __main__:trials:24 - Trial = 19943/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.726 | DEBUG    | __main__:trials:29 - Trial = 19943/30000 | Total reward = 51.94
2022-01-26 14:18:02.730 | DEBUG    | __main__:trials:24 - Trial = 19944/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.730 | DEBUG    | __main__:trials:29 - Trial = 19944/30000 | Total reward = 52.13
2022-01-26 14:18:02.734 | DEBUG    | __main__:trials:24 - Trial = 19945/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.736 | DEBUG    | __main__:trials:29 - Trial = 19945/30000 | Total reward = 42.75
2022-01-26 14:18:02.738 | DEBUG    | __main__:trials:26 - Trial = 19946/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.739 | DEBUG    | __main__:trials:29 - Trial = 19946/30000 | Total reward = 14.38
2022-01-26 14:18:02.743 | DEBUG    | __main__:trials:24 - Trial = 19947/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.744 | DEBUG    | __main__:trials:29 - Trial = 19947/30000 | Total reward = 53.49
2022-01-26 14:18:02.748 | DEBUG    | __main__:trials:26 - Trial = 19948/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.749 | DEBUG    | __main__:trials:29 - Trial = 19948/30000 | Total reward = 33.70
2022-01-26 14:18:02.753 | DEBUG    | __main__:trials:24 - Trial = 19949/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.755 | DEBUG    | __main__:trials:29 - Trial = 19949/30000 | Total reward = 46.27
2022-01-26 14:18:02.759 | DEBUG    | __main__:trials:24 - Trial = 19950/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.760 | DEBUG    | __main__:trials:29 - Trial = 19950/30000 | Total reward = 53.12
2022-01-26 14:18:02.764 | DEBUG    | __main__:trials:26 - Trial = 19951/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.765 | DEBUG    | __main__:trials:29 - Trial = 19951/30000 | Total reward = 41.44
2022-01-26 14:18:02.768 | DEBUG    | __main__:trials:26 - Trial = 19952/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.769 | DEBUG    | __main__:trials:29 - Trial = 19952/30000 | Total reward = 28.34
2022-01-26 14:18:02.773 | DEBUG    | __main__:trials:24 - Trial = 19953/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.773 | DEBUG    | __main__:trials:29 - Trial = 19953/30000 | Total reward = 53.70
2022-01-26 14:18:02.777 | DEBUG    | __main__:trials:24 - Trial = 19954/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.778 | DEBUG    | __main__:trials:29 - Trial = 19954/30000 | Total reward = 45.77
2022-01-26 14:18:02.782 | DEBUG    | __main__:trials:26 - Trial = 19955/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.783 | DEBUG    | __main__:trials:29 - Trial = 19955/30000 | Total reward = 31.04
2022-01-26 14:18:02.787 | DEBUG    | __main__:trials:24 - Trial = 19956/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.788 | DEBUG    | __main__:trials:29 - Trial = 19956/30000 | Total reward = 48.88
2022-01-26 14:18:02.791 | DEBUG    | __main__:trials:26 - Trial = 19957/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.793 | DEBUG    | __main__:trials:29 - Trial = 19957/30000 | Total reward = 17.90
2022-01-26 14:18:02.795 | DEBUG    | __main__:trials:26 - Trial = 19958/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.797 | DEBUG    | __main__:trials:29 - Trial = 19958/30000 | Total reward = 30.96
2022-01-26 14:18:02.800 | DEBUG    | __main__:trials:24 - Trial = 19959/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.802 | DEBUG    | __main__:trials:29 - Trial = 19959/30000 | Total reward = 42.63
2022-01-26 14:18:02.806 | DEBUG    | __main__:trials:24 - Trial = 19960/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.808 | DEBUG    | __main__:trials:29 - Trial = 19960/30000 | Total reward = 48.40
2022-01-26 14:18:02.811 | DEBUG    | __main__:trials:26 - Trial = 19961/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.813 | DEBUG    | __main__:trials:29 - Trial = 19961/30000 | Total reward = 31.04
2022-01-26 14:18:02.814 | DEBUG    | __main__:trials:26 - Trial = 19962/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.816 | DEBUG    | __main__:trials:29 - Trial = 19962/30000 | Total reward = 9.99
2022-01-26 14:18:02.819 | DEBUG    | __main__:trials:24 - Trial = 19963/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.821 | DEBUG    | __main__:trials:29 - Trial = 19963/30000 | Total reward = 47.22
2022-01-26 14:18:02.824 | DEBUG    | __main__:trials:24 - Trial = 19964/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.825 | DEBUG    | __main__:trials:29 - Trial = 19964/30000 | Total reward = 59.46
2022-01-26 14:18:02.830 | DEBUG    | __main__:trials:24 - Trial = 19965/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.830 | DEBUG    | __main__:trials:29 - Trial = 19965/30000 | Total reward = 62.05
2022-01-26 14:18:02.834 | DEBUG    | __main__:trials:26 - Trial = 19966/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.835 | DEBUG    | __main__:trials:29 - Trial = 19966/30000 | Total reward = 17.47
2022-01-26 14:18:02.839 | DEBUG    | __main__:trials:24 - Trial = 19967/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.840 | DEBUG    | __main__:trials:29 - Trial = 19967/30000 | Total reward = 58.78
2022-01-26 14:18:02.845 | DEBUG    | __main__:trials:24 - Trial = 19968/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.846 | DEBUG    | __main__:trials:29 - Trial = 19968/30000 | Total reward = 55.76
2022-01-26 14:18:02.850 | DEBUG    | __main__:trials:24 - Trial = 19969/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.851 | DEBUG    | __main__:trials:29 - Trial = 19969/30000 | Total reward = 54.90
2022-01-26 14:18:02.855 | DEBUG    | __main__:trials:24 - Trial = 19970/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.856 | DEBUG    | __main__:trials:29 - Trial = 19970/30000 | Total reward = 49.74
2022-01-26 14:18:02.861 | DEBUG    | __main__:trials:24 - Trial = 19971/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.861 | DEBUG    | __main__:trials:29 - Trial = 19971/30000 | Total reward = 53.47
2022-01-26 14:18:02.866 | DEBUG    | __main__:trials:24 - Trial = 19972/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.867 | DEBUG    | __main__:trials:29 - Trial = 19972/30000 | Total reward = 47.17
2022-01-26 14:18:02.871 | DEBUG    | __main__:trials:24 - Trial = 19973/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.872 | DEBUG    | __main__:trials:29 - Trial = 19973/30000 | Total reward = 50.90
2022-01-26 14:18:02.876 | DEBUG    | __main__:trials:24 - Trial = 19974/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.877 | DEBUG    | __main__:trials:29 - Trial = 19974/30000 | Total reward = 52.14
2022-01-26 14:18:02.881 | DEBUG    | __main__:trials:24 - Trial = 19975/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.883 | DEBUG    | __main__:trials:29 - Trial = 19975/30000 | Total reward = 58.31
2022-01-26 14:18:02.887 | DEBUG    | __main__:trials:24 - Trial = 19976/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.888 | DEBUG    | __main__:trials:29 - Trial = 19976/30000 | Total reward = 49.89
2022-01-26 14:18:02.892 | DEBUG    | __main__:trials:24 - Trial = 19977/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.893 | DEBUG    | __main__:trials:29 - Trial = 19977/30000 | Total reward = 47.30
2022-01-26 14:18:02.897 | DEBUG    | __main__:trials:24 - Trial = 19978/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.898 | DEBUG    | __main__:trials:29 - Trial = 19978/30000 | Total reward = 60.97
2022-01-26 14:18:02.902 | DEBUG    | __main__:trials:24 - Trial = 19979/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.904 | DEBUG    | __main__:trials:29 - Trial = 19979/30000 | Total reward = 60.38
2022-01-26 14:18:02.907 | DEBUG    | __main__:trials:24 - Trial = 19980/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.909 | DEBUG    | __main__:trials:29 - Trial = 19980/30000 | Total reward = 48.37
2022-01-26 14:18:02.912 | DEBUG    | __main__:trials:24 - Trial = 19981/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.914 | DEBUG    | __main__:trials:29 - Trial = 19981/30000 | Total reward = 47.16
2022-01-26 14:18:02.918 | DEBUG    | __main__:trials:24 - Trial = 19982/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.919 | DEBUG    | __main__:trials:29 - Trial = 19982/30000 | Total reward = 47.03
2022-01-26 14:18:02.922 | DEBUG    | __main__:trials:24 - Trial = 19983/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.924 | DEBUG    | __main__:trials:29 - Trial = 19983/30000 | Total reward = 45.27
2022-01-26 14:18:02.928 | DEBUG    | __main__:trials:24 - Trial = 19984/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.929 | DEBUG    | __main__:trials:29 - Trial = 19984/30000 | Total reward = 49.45
2022-01-26 14:18:02.933 | DEBUG    | __main__:trials:24 - Trial = 19985/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.935 | DEBUG    | __main__:trials:29 - Trial = 19985/30000 | Total reward = 53.38
2022-01-26 14:18:02.938 | DEBUG    | __main__:trials:26 - Trial = 19986/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.940 | DEBUG    | __main__:trials:29 - Trial = 19986/30000 | Total reward = 27.88
2022-01-26 14:18:02.943 | DEBUG    | __main__:trials:24 - Trial = 19987/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.944 | DEBUG    | __main__:trials:29 - Trial = 19987/30000 | Total reward = 49.64
2022-01-26 14:18:02.947 | DEBUG    | __main__:trials:24 - Trial = 19988/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.949 | DEBUG    | __main__:trials:29 - Trial = 19988/30000 | Total reward = 55.99
2022-01-26 14:18:02.952 | DEBUG    | __main__:trials:24 - Trial = 19989/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.954 | DEBUG    | __main__:trials:29 - Trial = 19989/30000 | Total reward = 59.00
2022-01-26 14:18:02.958 | DEBUG    | __main__:trials:24 - Trial = 19990/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.959 | DEBUG    | __main__:trials:29 - Trial = 19990/30000 | Total reward = 57.70
2022-01-26 14:18:02.962 | DEBUG    | __main__:trials:26 - Trial = 19991/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:02.964 | DEBUG    | __main__:trials:29 - Trial = 19991/30000 | Total reward = 8.84
2022-01-26 14:18:02.968 | DEBUG    | __main__:trials:24 - Trial = 19992/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.969 | DEBUG    | __main__:trials:29 - Trial = 19992/30000 | Total reward = 41.84
2022-01-26 14:18:02.973 | DEBUG    | __main__:trials:24 - Trial = 19993/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.974 | DEBUG    | __main__:trials:29 - Trial = 19993/30000 | Total reward = 62.23
2022-01-26 14:18:02.978 | DEBUG    | __main__:trials:24 - Trial = 19994/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.979 | DEBUG    | __main__:trials:29 - Trial = 19994/30000 | Total reward = 57.21
2022-01-26 14:18:02.983 | DEBUG    | __main__:trials:24 - Trial = 19995/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.985 | DEBUG    | __main__:trials:29 - Trial = 19995/30000 | Total reward = 48.62
2022-01-26 14:18:02.988 | DEBUG    | __main__:trials:24 - Trial = 19996/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.989 | DEBUG    | __main__:trials:29 - Trial = 19996/30000 | Total reward = 40.65
2022-01-26 14:18:02.993 | DEBUG    | __main__:trials:24 - Trial = 19997/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.995 | DEBUG    | __main__:trials:29 - Trial = 19997/30000 | Total reward = 49.07
2022-01-26 14:18:02.999 | DEBUG    | __main__:trials:24 - Trial = 19998/30000 | Max number of steps (20) reached
2022-01-26 14:18:02.999 | DEBUG    | __main__:trials:29 - Trial = 19998/30000 | Total reward = 45.39
2022-01-26 14:18:03.004 | DEBUG    | __main__:trials:24 - Trial = 19999/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.005 | DEBUG    | __main__:trials:29 - Trial = 19999/30000 | Total reward = 47.87
2022-01-26 14:18:03.008 | DEBUG    | __main__:trials:24 - Trial = 20000/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.010 | DEBUG    | __main__:trials:29 - Trial = 20000/30000 | Total reward = 51.50
2022-01-26 14:18:03.013 | DEBUG    | __main__:trials:24 - Trial = 20001/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.014 | DEBUG    | __main__:trials:29 - Trial = 20001/30000 | Total reward = 48.01
2022-01-26 14:18:03.017 | DEBUG    | __main__:trials:24 - Trial = 20002/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.018 | DEBUG    | __main__:trials:29 - Trial = 20002/30000 | Total reward = 45.56
2022-01-26 14:18:03.021 | DEBUG    | __main__:trials:24 - Trial = 20003/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.022 | DEBUG    | __main__:trials:29 - Trial = 20003/30000 | Total reward = 49.18
2022-01-26 14:18:03.026 | DEBUG    | __main__:trials:24 - Trial = 20004/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.028 | DEBUG    | __main__:trials:29 - Trial = 20004/30000 | Total reward = 46.67
2022-01-26 14:18:03.031 | DEBUG    | __main__:trials:24 - Trial = 20005/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.032 | DEBUG    | __main__:trials:29 - Trial = 20005/30000 | Total reward = 47.48
2022-01-26 14:18:03.036 | DEBUG    | __main__:trials:24 - Trial = 20006/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.038 | DEBUG    | __main__:trials:29 - Trial = 20006/30000 | Total reward = 46.85
2022-01-26 14:18:03.042 | DEBUG    | __main__:trials:24 - Trial = 20007/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.043 | DEBUG    | __main__:trials:29 - Trial = 20007/30000 | Total reward = 49.12
2022-01-26 14:18:03.046 | DEBUG    | __main__:trials:24 - Trial = 20008/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.048 | DEBUG    | __main__:trials:29 - Trial = 20008/30000 | Total reward = 38.93
2022-01-26 14:18:03.051 | DEBUG    | __main__:trials:24 - Trial = 20009/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.052 | DEBUG    | __main__:trials:29 - Trial = 20009/30000 | Total reward = 37.94
2022-01-26 14:18:03.056 | DEBUG    | __main__:trials:24 - Trial = 20010/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.058 | DEBUG    | __main__:trials:29 - Trial = 20010/30000 | Total reward = 38.54
2022-01-26 14:18:03.061 | DEBUG    | __main__:trials:24 - Trial = 20011/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.063 | DEBUG    | __main__:trials:29 - Trial = 20011/30000 | Total reward = 36.27
2022-01-26 14:18:03.066 | DEBUG    | __main__:trials:24 - Trial = 20012/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.068 | DEBUG    | __main__:trials:29 - Trial = 20012/30000 | Total reward = 40.25
2022-01-26 14:18:03.071 | DEBUG    | __main__:trials:24 - Trial = 20013/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.072 | DEBUG    | __main__:trials:29 - Trial = 20013/30000 | Total reward = 48.42
2022-01-26 14:18:03.076 | DEBUG    | __main__:trials:24 - Trial = 20014/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.078 | DEBUG    | __main__:trials:29 - Trial = 20014/30000 | Total reward = 38.41
2022-01-26 14:18:03.081 | DEBUG    | __main__:trials:24 - Trial = 20015/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.083 | DEBUG    | __main__:trials:29 - Trial = 20015/30000 | Total reward = 29.90
2022-01-26 14:18:03.087 | DEBUG    | __main__:trials:24 - Trial = 20016/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.087 | DEBUG    | __main__:trials:29 - Trial = 20016/30000 | Total reward = 36.27
2022-01-26 14:18:03.092 | DEBUG    | __main__:trials:24 - Trial = 20017/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.093 | DEBUG    | __main__:trials:29 - Trial = 20017/30000 | Total reward = 42.36
2022-01-26 14:18:03.097 | DEBUG    | __main__:trials:24 - Trial = 20018/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.098 | DEBUG    | __main__:trials:29 - Trial = 20018/30000 | Total reward = 63.57
2022-01-26 14:18:03.102 | DEBUG    | __main__:trials:24 - Trial = 20019/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.103 | DEBUG    | __main__:trials:29 - Trial = 20019/30000 | Total reward = 39.88
2022-01-26 14:18:03.106 | DEBUG    | __main__:trials:24 - Trial = 20020/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.108 | DEBUG    | __main__:trials:29 - Trial = 20020/30000 | Total reward = 38.33
2022-01-26 14:18:03.112 | DEBUG    | __main__:trials:24 - Trial = 20021/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.112 | DEBUG    | __main__:trials:29 - Trial = 20021/30000 | Total reward = 41.83
2022-01-26 14:18:03.116 | DEBUG    | __main__:trials:24 - Trial = 20022/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.118 | DEBUG    | __main__:trials:29 - Trial = 20022/30000 | Total reward = 43.46
2022-01-26 14:18:03.122 | DEBUG    | __main__:trials:24 - Trial = 20023/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.123 | DEBUG    | __main__:trials:29 - Trial = 20023/30000 | Total reward = 39.12
2022-01-26 14:18:03.127 | DEBUG    | __main__:trials:24 - Trial = 20024/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.128 | DEBUG    | __main__:trials:29 - Trial = 20024/30000 | Total reward = 42.95
2022-01-26 14:18:03.132 | DEBUG    | __main__:trials:24 - Trial = 20025/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.134 | DEBUG    | __main__:trials:29 - Trial = 20025/30000 | Total reward = 37.34
2022-01-26 14:18:03.138 | DEBUG    | __main__:trials:24 - Trial = 20026/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.139 | DEBUG    | __main__:trials:29 - Trial = 20026/30000 | Total reward = 37.61
2022-01-26 14:18:03.143 | DEBUG    | __main__:trials:24 - Trial = 20027/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.144 | DEBUG    | __main__:trials:29 - Trial = 20027/30000 | Total reward = 40.25
2022-01-26 14:18:03.148 | DEBUG    | __main__:trials:24 - Trial = 20028/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.149 | DEBUG    | __main__:trials:29 - Trial = 20028/30000 | Total reward = 38.60
2022-01-26 14:18:03.154 | DEBUG    | __main__:trials:24 - Trial = 20029/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.155 | DEBUG    | __main__:trials:29 - Trial = 20029/30000 | Total reward = 40.50
2022-01-26 14:18:03.158 | DEBUG    | __main__:trials:24 - Trial = 20030/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.160 | DEBUG    | __main__:trials:29 - Trial = 20030/30000 | Total reward = 41.93
2022-01-26 14:18:03.164 | DEBUG    | __main__:trials:24 - Trial = 20031/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.165 | DEBUG    | __main__:trials:29 - Trial = 20031/30000 | Total reward = 33.39
2022-01-26 14:18:03.169 | DEBUG    | __main__:trials:24 - Trial = 20032/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.170 | DEBUG    | __main__:trials:29 - Trial = 20032/30000 | Total reward = 40.04
2022-01-26 14:18:03.174 | DEBUG    | __main__:trials:24 - Trial = 20033/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.174 | DEBUG    | __main__:trials:29 - Trial = 20033/30000 | Total reward = 50.66
2022-01-26 14:18:03.179 | DEBUG    | __main__:trials:24 - Trial = 20034/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.181 | DEBUG    | __main__:trials:29 - Trial = 20034/30000 | Total reward = 46.48
2022-01-26 14:18:03.184 | DEBUG    | __main__:trials:24 - Trial = 20035/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.185 | DEBUG    | __main__:trials:29 - Trial = 20035/30000 | Total reward = 42.26
2022-01-26 14:18:03.189 | DEBUG    | __main__:trials:26 - Trial = 20036/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:03.190 | DEBUG    | __main__:trials:29 - Trial = 20036/30000 | Total reward = 28.06
2022-01-26 14:18:03.193 | DEBUG    | __main__:trials:24 - Trial = 20037/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.194 | DEBUG    | __main__:trials:29 - Trial = 20037/30000 | Total reward = 37.82
2022-01-26 14:18:03.199 | DEBUG    | __main__:trials:24 - Trial = 20038/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.200 | DEBUG    | __main__:trials:29 - Trial = 20038/30000 | Total reward = 48.58
2022-01-26 14:18:03.204 | DEBUG    | __main__:trials:24 - Trial = 20039/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.205 | DEBUG    | __main__:trials:29 - Trial = 20039/30000 | Total reward = 50.02
2022-01-26 14:18:03.209 | DEBUG    | __main__:trials:24 - Trial = 20040/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.211 | DEBUG    | __main__:trials:29 - Trial = 20040/30000 | Total reward = 38.41
2022-01-26 14:18:03.214 | DEBUG    | __main__:trials:24 - Trial = 20041/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.215 | DEBUG    | __main__:trials:29 - Trial = 20041/30000 | Total reward = 36.08
2022-01-26 14:18:03.218 | DEBUG    | __main__:trials:24 - Trial = 20042/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.220 | DEBUG    | __main__:trials:29 - Trial = 20042/30000 | Total reward = 48.77
2022-01-26 14:18:03.223 | DEBUG    | __main__:trials:24 - Trial = 20043/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.225 | DEBUG    | __main__:trials:29 - Trial = 20043/30000 | Total reward = 38.64
2022-01-26 14:18:03.228 | DEBUG    | __main__:trials:24 - Trial = 20044/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.230 | DEBUG    | __main__:trials:29 - Trial = 20044/30000 | Total reward = 44.70
2022-01-26 14:18:03.234 | DEBUG    | __main__:trials:24 - Trial = 20045/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.235 | DEBUG    | __main__:trials:29 - Trial = 20045/30000 | Total reward = 40.53
2022-01-26 14:18:03.239 | DEBUG    | __main__:trials:24 - Trial = 20046/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.241 | DEBUG    | __main__:trials:29 - Trial = 20046/30000 | Total reward = 62.19
2022-01-26 14:18:03.244 | DEBUG    | __main__:trials:24 - Trial = 20047/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.245 | DEBUG    | __main__:trials:29 - Trial = 20047/30000 | Total reward = 19.82
2022-01-26 14:18:03.249 | DEBUG    | __main__:trials:24 - Trial = 20048/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.250 | DEBUG    | __main__:trials:29 - Trial = 20048/30000 | Total reward = 64.51
2022-01-26 14:18:03.254 | DEBUG    | __main__:trials:24 - Trial = 20049/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.255 | DEBUG    | __main__:trials:29 - Trial = 20049/30000 | Total reward = 47.39
2022-01-26 14:18:03.259 | DEBUG    | __main__:trials:24 - Trial = 20050/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.260 | DEBUG    | __main__:trials:29 - Trial = 20050/30000 | Total reward = 38.41
2022-01-26 14:18:03.264 | DEBUG    | __main__:trials:24 - Trial = 20051/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.266 | DEBUG    | __main__:trials:29 - Trial = 20051/30000 | Total reward = 37.71
2022-01-26 14:18:03.270 | DEBUG    | __main__:trials:24 - Trial = 20052/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.271 | DEBUG    | __main__:trials:29 - Trial = 20052/30000 | Total reward = 48.45
2022-01-26 14:18:03.275 | DEBUG    | __main__:trials:24 - Trial = 20053/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.277 | DEBUG    | __main__:trials:29 - Trial = 20053/30000 | Total reward = 28.17
2022-01-26 14:18:03.281 | DEBUG    | __main__:trials:24 - Trial = 20054/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.282 | DEBUG    | __main__:trials:29 - Trial = 20054/30000 | Total reward = 36.49
2022-01-26 14:18:03.286 | DEBUG    | __main__:trials:24 - Trial = 20055/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.286 | DEBUG    | __main__:trials:29 - Trial = 20055/30000 | Total reward = 35.43
2022-01-26 14:18:03.290 | DEBUG    | __main__:trials:24 - Trial = 20056/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.292 | DEBUG    | __main__:trials:29 - Trial = 20056/30000 | Total reward = 45.07
2022-01-26 14:18:03.296 | DEBUG    | __main__:trials:24 - Trial = 20057/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.296 | DEBUG    | __main__:trials:29 - Trial = 20057/30000 | Total reward = 36.69
2022-01-26 14:18:03.301 | DEBUG    | __main__:trials:24 - Trial = 20058/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.302 | DEBUG    | __main__:trials:29 - Trial = 20058/30000 | Total reward = 45.14
2022-01-26 14:18:03.306 | DEBUG    | __main__:trials:24 - Trial = 20059/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.308 | DEBUG    | __main__:trials:29 - Trial = 20059/30000 | Total reward = 53.97
2022-01-26 14:18:03.311 | DEBUG    | __main__:trials:24 - Trial = 20060/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.312 | DEBUG    | __main__:trials:29 - Trial = 20060/30000 | Total reward = 36.04
2022-01-26 14:18:03.316 | DEBUG    | __main__:trials:24 - Trial = 20061/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.318 | DEBUG    | __main__:trials:29 - Trial = 20061/30000 | Total reward = 44.90
2022-01-26 14:18:03.321 | DEBUG    | __main__:trials:24 - Trial = 20062/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.323 | DEBUG    | __main__:trials:29 - Trial = 20062/30000 | Total reward = 38.46
2022-01-26 14:18:03.325 | DEBUG    | __main__:trials:24 - Trial = 20063/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.327 | DEBUG    | __main__:trials:29 - Trial = 20063/30000 | Total reward = 48.69
2022-01-26 14:18:03.331 | DEBUG    | __main__:trials:24 - Trial = 20064/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.333 | DEBUG    | __main__:trials:29 - Trial = 20064/30000 | Total reward = 46.11
2022-01-26 14:18:03.336 | DEBUG    | __main__:trials:24 - Trial = 20065/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.337 | DEBUG    | __main__:trials:29 - Trial = 20065/30000 | Total reward = 40.49
2022-01-26 14:18:03.341 | DEBUG    | __main__:trials:24 - Trial = 20066/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.342 | DEBUG    | __main__:trials:29 - Trial = 20066/30000 | Total reward = 45.15
2022-01-26 14:18:03.346 | DEBUG    | __main__:trials:24 - Trial = 20067/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.347 | DEBUG    | __main__:trials:29 - Trial = 20067/30000 | Total reward = 50.26
2022-01-26 14:18:03.351 | DEBUG    | __main__:trials:26 - Trial = 20068/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:03.352 | DEBUG    | __main__:trials:29 - Trial = 20068/30000 | Total reward = 31.64
2022-01-26 14:18:03.356 | DEBUG    | __main__:trials:24 - Trial = 20069/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.357 | DEBUG    | __main__:trials:29 - Trial = 20069/30000 | Total reward = 49.67
2022-01-26 14:18:03.361 | DEBUG    | __main__:trials:24 - Trial = 20070/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.363 | DEBUG    | __main__:trials:29 - Trial = 20070/30000 | Total reward = 37.36
2022-01-26 14:18:03.367 | DEBUG    | __main__:trials:24 - Trial = 20071/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.369 | DEBUG    | __main__:trials:29 - Trial = 20071/30000 | Total reward = 37.44
2022-01-26 14:18:03.372 | DEBUG    | __main__:trials:24 - Trial = 20072/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.374 | DEBUG    | __main__:trials:29 - Trial = 20072/30000 | Total reward = 49.86
2022-01-26 14:18:03.378 | DEBUG    | __main__:trials:24 - Trial = 20073/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.378 | DEBUG    | __main__:trials:29 - Trial = 20073/30000 | Total reward = 43.81
2022-01-26 14:18:03.382 | DEBUG    | __main__:trials:24 - Trial = 20074/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.384 | DEBUG    | __main__:trials:29 - Trial = 20074/30000 | Total reward = 36.55
2022-01-26 14:18:03.388 | DEBUG    | __main__:trials:24 - Trial = 20075/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.389 | DEBUG    | __main__:trials:29 - Trial = 20075/30000 | Total reward = 36.26
2022-01-26 14:18:03.393 | DEBUG    | __main__:trials:24 - Trial = 20076/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.395 | DEBUG    | __main__:trials:29 - Trial = 20076/30000 | Total reward = 50.27
2022-01-26 14:18:03.398 | DEBUG    | __main__:trials:24 - Trial = 20077/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.400 | DEBUG    | __main__:trials:29 - Trial = 20077/30000 | Total reward = 36.19
2022-01-26 14:18:03.403 | DEBUG    | __main__:trials:24 - Trial = 20078/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.404 | DEBUG    | __main__:trials:29 - Trial = 20078/30000 | Total reward = 39.71
2022-01-26 14:18:03.408 | DEBUG    | __main__:trials:24 - Trial = 20079/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.409 | DEBUG    | __main__:trials:29 - Trial = 20079/30000 | Total reward = 47.03
2022-01-26 14:18:03.414 | DEBUG    | __main__:trials:24 - Trial = 20080/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.414 | DEBUG    | __main__:trials:29 - Trial = 20080/30000 | Total reward = 40.33
2022-01-26 14:18:03.419 | DEBUG    | __main__:trials:24 - Trial = 20081/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.420 | DEBUG    | __main__:trials:29 - Trial = 20081/30000 | Total reward = 38.34
2022-01-26 14:18:03.424 | DEBUG    | __main__:trials:24 - Trial = 20082/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.425 | DEBUG    | __main__:trials:29 - Trial = 20082/30000 | Total reward = 39.21
2022-01-26 14:18:03.429 | DEBUG    | __main__:trials:24 - Trial = 20083/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.431 | DEBUG    | __main__:trials:29 - Trial = 20083/30000 | Total reward = 60.40
2022-01-26 14:18:03.435 | DEBUG    | __main__:trials:24 - Trial = 20084/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.436 | DEBUG    | __main__:trials:29 - Trial = 20084/30000 | Total reward = 59.52
2022-01-26 14:18:03.440 | DEBUG    | __main__:trials:24 - Trial = 20085/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.441 | DEBUG    | __main__:trials:29 - Trial = 20085/30000 | Total reward = 54.49
2022-01-26 14:18:03.446 | DEBUG    | __main__:trials:24 - Trial = 20086/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.447 | DEBUG    | __main__:trials:29 - Trial = 20086/30000 | Total reward = 43.29
2022-01-26 14:18:03.451 | DEBUG    | __main__:trials:24 - Trial = 20087/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.452 | DEBUG    | __main__:trials:29 - Trial = 20087/30000 | Total reward = 60.92
2022-01-26 14:18:03.456 | DEBUG    | __main__:trials:24 - Trial = 20088/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.458 | DEBUG    | __main__:trials:29 - Trial = 20088/30000 | Total reward = 38.19
2022-01-26 14:18:03.462 | DEBUG    | __main__:trials:24 - Trial = 20089/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.463 | DEBUG    | __main__:trials:29 - Trial = 20089/30000 | Total reward = 60.91
2022-01-26 14:18:03.466 | DEBUG    | __main__:trials:24 - Trial = 20090/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.468 | DEBUG    | __main__:trials:29 - Trial = 20090/30000 | Total reward = 38.47
2022-01-26 14:18:03.471 | DEBUG    | __main__:trials:24 - Trial = 20091/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.473 | DEBUG    | __main__:trials:29 - Trial = 20091/30000 | Total reward = 48.01
2022-01-26 14:18:03.477 | DEBUG    | __main__:trials:24 - Trial = 20092/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.477 | DEBUG    | __main__:trials:29 - Trial = 20092/30000 | Total reward = 52.48
2022-01-26 14:18:03.482 | DEBUG    | __main__:trials:24 - Trial = 20093/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.483 | DEBUG    | __main__:trials:29 - Trial = 20093/30000 | Total reward = 42.54
2022-01-26 14:18:03.487 | DEBUG    | __main__:trials:24 - Trial = 20094/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.489 | DEBUG    | __main__:trials:29 - Trial = 20094/30000 | Total reward = 49.58
2022-01-26 14:18:03.492 | DEBUG    | __main__:trials:24 - Trial = 20095/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.493 | DEBUG    | __main__:trials:29 - Trial = 20095/30000 | Total reward = 53.61
2022-01-26 14:18:03.496 | DEBUG    | __main__:trials:24 - Trial = 20096/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.498 | DEBUG    | __main__:trials:29 - Trial = 20096/30000 | Total reward = 60.82
2022-01-26 14:18:03.502 | DEBUG    | __main__:trials:24 - Trial = 20097/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.504 | DEBUG    | __main__:trials:29 - Trial = 20097/30000 | Total reward = 36.17
2022-01-26 14:18:03.508 | DEBUG    | __main__:trials:24 - Trial = 20098/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.509 | DEBUG    | __main__:trials:29 - Trial = 20098/30000 | Total reward = 51.68
2022-01-26 14:18:03.514 | DEBUG    | __main__:trials:24 - Trial = 20099/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.515 | DEBUG    | __main__:trials:29 - Trial = 20099/30000 | Total reward = 34.94
2022-01-26 14:18:03.519 | DEBUG    | __main__:trials:24 - Trial = 20100/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.521 | DEBUG    | __main__:trials:29 - Trial = 20100/30000 | Total reward = 58.52
2022-01-26 14:18:03.524 | DEBUG    | __main__:trials:24 - Trial = 20101/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.526 | DEBUG    | __main__:trials:29 - Trial = 20101/30000 | Total reward = 46.89
2022-01-26 14:18:03.530 | DEBUG    | __main__:trials:24 - Trial = 20102/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.531 | DEBUG    | __main__:trials:29 - Trial = 20102/30000 | Total reward = 49.85
2022-01-26 14:18:03.535 | DEBUG    | __main__:trials:24 - Trial = 20103/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.536 | DEBUG    | __main__:trials:29 - Trial = 20103/30000 | Total reward = 48.33
2022-01-26 14:18:03.540 | DEBUG    | __main__:trials:24 - Trial = 20104/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.542 | DEBUG    | __main__:trials:29 - Trial = 20104/30000 | Total reward = 51.51
2022-01-26 14:18:03.546 | DEBUG    | __main__:trials:24 - Trial = 20105/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.547 | DEBUG    | __main__:trials:29 - Trial = 20105/30000 | Total reward = 42.55
2022-01-26 14:18:03.551 | DEBUG    | __main__:trials:24 - Trial = 20106/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.553 | DEBUG    | __main__:trials:29 - Trial = 20106/30000 | Total reward = 55.43
2022-01-26 14:18:03.556 | DEBUG    | __main__:trials:24 - Trial = 20107/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.558 | DEBUG    | __main__:trials:29 - Trial = 20107/30000 | Total reward = 49.17
2022-01-26 14:18:03.562 | DEBUG    | __main__:trials:24 - Trial = 20108/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.563 | DEBUG    | __main__:trials:29 - Trial = 20108/30000 | Total reward = 52.05
2022-01-26 14:18:03.567 | DEBUG    | __main__:trials:24 - Trial = 20109/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.569 | DEBUG    | __main__:trials:29 - Trial = 20109/30000 | Total reward = 34.93
2022-01-26 14:18:03.572 | DEBUG    | __main__:trials:24 - Trial = 20110/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.574 | DEBUG    | __main__:trials:29 - Trial = 20110/30000 | Total reward = 61.61
2022-01-26 14:18:03.578 | DEBUG    | __main__:trials:24 - Trial = 20111/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.580 | DEBUG    | __main__:trials:29 - Trial = 20111/30000 | Total reward = 53.22
2022-01-26 14:18:03.582 | DEBUG    | __main__:trials:26 - Trial = 20112/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:03.584 | DEBUG    | __main__:trials:29 - Trial = 20112/30000 | Total reward = 24.31
2022-01-26 14:18:03.587 | DEBUG    | __main__:trials:24 - Trial = 20113/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.588 | DEBUG    | __main__:trials:29 - Trial = 20113/30000 | Total reward = 56.69
2022-01-26 14:18:03.592 | DEBUG    | __main__:trials:24 - Trial = 20114/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.593 | DEBUG    | __main__:trials:29 - Trial = 20114/30000 | Total reward = 49.39
2022-01-26 14:18:03.598 | DEBUG    | __main__:trials:24 - Trial = 20115/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.599 | DEBUG    | __main__:trials:29 - Trial = 20115/30000 | Total reward = 45.41
2022-01-26 14:18:03.603 | DEBUG    | __main__:trials:24 - Trial = 20116/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.604 | DEBUG    | __main__:trials:29 - Trial = 20116/30000 | Total reward = 58.93
2022-01-26 14:18:03.609 | DEBUG    | __main__:trials:24 - Trial = 20117/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.610 | DEBUG    | __main__:trials:29 - Trial = 20117/30000 | Total reward = 48.21
2022-01-26 14:18:03.613 | DEBUG    | __main__:trials:24 - Trial = 20118/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.614 | DEBUG    | __main__:trials:29 - Trial = 20118/30000 | Total reward = 58.68
2022-01-26 14:18:03.617 | DEBUG    | __main__:trials:24 - Trial = 20119/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.619 | DEBUG    | __main__:trials:29 - Trial = 20119/30000 | Total reward = 39.57
2022-01-26 14:18:03.622 | DEBUG    | __main__:trials:24 - Trial = 20120/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.624 | DEBUG    | __main__:trials:29 - Trial = 20120/30000 | Total reward = 44.60
2022-01-26 14:18:03.628 | DEBUG    | __main__:trials:24 - Trial = 20121/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.629 | DEBUG    | __main__:trials:29 - Trial = 20121/30000 | Total reward = 43.28
2022-01-26 14:18:03.633 | DEBUG    | __main__:trials:24 - Trial = 20122/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.635 | DEBUG    | __main__:trials:29 - Trial = 20122/30000 | Total reward = 52.66
2022-01-26 14:18:03.639 | DEBUG    | __main__:trials:24 - Trial = 20123/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.640 | DEBUG    | __main__:trials:29 - Trial = 20123/30000 | Total reward = 52.66
2022-01-26 14:18:03.644 | DEBUG    | __main__:trials:24 - Trial = 20124/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.646 | DEBUG    | __main__:trials:29 - Trial = 20124/30000 | Total reward = 47.48
2022-01-26 14:18:03.650 | DEBUG    | __main__:trials:24 - Trial = 20125/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.650 | DEBUG    | __main__:trials:29 - Trial = 20125/30000 | Total reward = 52.05
2022-01-26 14:18:03.655 | DEBUG    | __main__:trials:24 - Trial = 20126/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.656 | DEBUG    | __main__:trials:29 - Trial = 20126/30000 | Total reward = 58.21
2022-01-26 14:18:03.660 | DEBUG    | __main__:trials:24 - Trial = 20127/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.661 | DEBUG    | __main__:trials:29 - Trial = 20127/30000 | Total reward = 35.75
2022-01-26 14:18:03.665 | DEBUG    | __main__:trials:24 - Trial = 20128/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.667 | DEBUG    | __main__:trials:29 - Trial = 20128/30000 | Total reward = 46.31
2022-01-26 14:18:03.671 | DEBUG    | __main__:trials:24 - Trial = 20129/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.671 | DEBUG    | __main__:trials:29 - Trial = 20129/30000 | Total reward = 55.38
2022-01-26 14:18:03.675 | DEBUG    | __main__:trials:24 - Trial = 20130/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.677 | DEBUG    | __main__:trials:29 - Trial = 20130/30000 | Total reward = 61.03
2022-01-26 14:18:03.680 | DEBUG    | __main__:trials:24 - Trial = 20131/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.682 | DEBUG    | __main__:trials:29 - Trial = 20131/30000 | Total reward = 43.00
2022-01-26 14:18:03.686 | DEBUG    | __main__:trials:24 - Trial = 20132/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.688 | DEBUG    | __main__:trials:29 - Trial = 20132/30000 | Total reward = 47.51
2022-01-26 14:18:03.691 | DEBUG    | __main__:trials:24 - Trial = 20133/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.692 | DEBUG    | __main__:trials:29 - Trial = 20133/30000 | Total reward = 52.38
2022-01-26 14:18:03.697 | DEBUG    | __main__:trials:24 - Trial = 20134/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.698 | DEBUG    | __main__:trials:29 - Trial = 20134/30000 | Total reward = 52.13
2022-01-26 14:18:03.702 | DEBUG    | __main__:trials:24 - Trial = 20135/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.703 | DEBUG    | __main__:trials:29 - Trial = 20135/30000 | Total reward = 52.99
2022-01-26 14:18:03.707 | DEBUG    | __main__:trials:24 - Trial = 20136/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.708 | DEBUG    | __main__:trials:29 - Trial = 20136/30000 | Total reward = 48.53
2022-01-26 14:18:03.713 | DEBUG    | __main__:trials:24 - Trial = 20137/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.713 | DEBUG    | __main__:trials:29 - Trial = 20137/30000 | Total reward = 49.38
2022-01-26 14:18:03.718 | DEBUG    | __main__:trials:24 - Trial = 20138/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.719 | DEBUG    | __main__:trials:29 - Trial = 20138/30000 | Total reward = 39.57
2022-01-26 14:18:03.722 | DEBUG    | __main__:trials:24 - Trial = 20139/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.724 | DEBUG    | __main__:trials:29 - Trial = 20139/30000 | Total reward = 45.57
2022-01-26 14:18:03.727 | DEBUG    | __main__:trials:24 - Trial = 20140/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.729 | DEBUG    | __main__:trials:29 - Trial = 20140/30000 | Total reward = 57.20
2022-01-26 14:18:03.732 | DEBUG    | __main__:trials:24 - Trial = 20141/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.733 | DEBUG    | __main__:trials:29 - Trial = 20141/30000 | Total reward = 45.16
2022-01-26 14:18:03.738 | DEBUG    | __main__:trials:24 - Trial = 20142/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.738 | DEBUG    | __main__:trials:29 - Trial = 20142/30000 | Total reward = 60.35
2022-01-26 14:18:03.743 | DEBUG    | __main__:trials:24 - Trial = 20143/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.744 | DEBUG    | __main__:trials:29 - Trial = 20143/30000 | Total reward = 45.63
2022-01-26 14:18:03.748 | DEBUG    | __main__:trials:24 - Trial = 20144/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.750 | DEBUG    | __main__:trials:29 - Trial = 20144/30000 | Total reward = 49.71
2022-01-26 14:18:03.754 | DEBUG    | __main__:trials:24 - Trial = 20145/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.754 | DEBUG    | __main__:trials:29 - Trial = 20145/30000 | Total reward = 41.23
2022-01-26 14:18:03.758 | DEBUG    | __main__:trials:24 - Trial = 20146/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.760 | DEBUG    | __main__:trials:29 - Trial = 20146/30000 | Total reward = 50.75
2022-01-26 14:18:03.763 | DEBUG    | __main__:trials:24 - Trial = 20147/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.765 | DEBUG    | __main__:trials:29 - Trial = 20147/30000 | Total reward = 46.58
2022-01-26 14:18:03.769 | DEBUG    | __main__:trials:24 - Trial = 20148/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.770 | DEBUG    | __main__:trials:29 - Trial = 20148/30000 | Total reward = 36.52
2022-01-26 14:18:03.773 | DEBUG    | __main__:trials:24 - Trial = 20149/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.774 | DEBUG    | __main__:trials:29 - Trial = 20149/30000 | Total reward = 38.60
2022-01-26 14:18:03.777 | DEBUG    | __main__:trials:24 - Trial = 20150/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.778 | DEBUG    | __main__:trials:29 - Trial = 20150/30000 | Total reward = 34.20
2022-01-26 14:18:03.781 | DEBUG    | __main__:trials:24 - Trial = 20151/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.782 | DEBUG    | __main__:trials:29 - Trial = 20151/30000 | Total reward = 36.62
2022-01-26 14:18:03.785 | DEBUG    | __main__:trials:24 - Trial = 20152/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.786 | DEBUG    | __main__:trials:29 - Trial = 20152/30000 | Total reward = 49.47
2022-01-26 14:18:03.790 | DEBUG    | __main__:trials:24 - Trial = 20153/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.791 | DEBUG    | __main__:trials:29 - Trial = 20153/30000 | Total reward = 45.14
2022-01-26 14:18:03.795 | DEBUG    | __main__:trials:24 - Trial = 20154/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.796 | DEBUG    | __main__:trials:29 - Trial = 20154/30000 | Total reward = 46.33
2022-01-26 14:18:03.800 | DEBUG    | __main__:trials:24 - Trial = 20155/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.802 | DEBUG    | __main__:trials:29 - Trial = 20155/30000 | Total reward = 37.36
2022-01-26 14:18:03.806 | DEBUG    | __main__:trials:24 - Trial = 20156/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.806 | DEBUG    | __main__:trials:29 - Trial = 20156/30000 | Total reward = 39.33
2022-01-26 14:18:03.811 | DEBUG    | __main__:trials:24 - Trial = 20157/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.812 | DEBUG    | __main__:trials:29 - Trial = 20157/30000 | Total reward = 44.06
2022-01-26 14:18:03.816 | DEBUG    | __main__:trials:24 - Trial = 20158/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.817 | DEBUG    | __main__:trials:29 - Trial = 20158/30000 | Total reward = 55.09
2022-01-26 14:18:03.821 | DEBUG    | __main__:trials:24 - Trial = 20159/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.822 | DEBUG    | __main__:trials:29 - Trial = 20159/30000 | Total reward = 46.28
2022-01-26 14:18:03.826 | DEBUG    | __main__:trials:24 - Trial = 20160/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.827 | DEBUG    | __main__:trials:29 - Trial = 20160/30000 | Total reward = 42.32
2022-01-26 14:18:03.831 | DEBUG    | __main__:trials:24 - Trial = 20161/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.832 | DEBUG    | __main__:trials:29 - Trial = 20161/30000 | Total reward = 46.29
2022-01-26 14:18:03.836 | DEBUG    | __main__:trials:24 - Trial = 20162/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.837 | DEBUG    | __main__:trials:29 - Trial = 20162/30000 | Total reward = 45.67
2022-01-26 14:18:03.841 | DEBUG    | __main__:trials:24 - Trial = 20163/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.842 | DEBUG    | __main__:trials:29 - Trial = 20163/30000 | Total reward = 27.01
2022-01-26 14:18:03.846 | DEBUG    | __main__:trials:24 - Trial = 20164/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.847 | DEBUG    | __main__:trials:29 - Trial = 20164/30000 | Total reward = 40.41
2022-01-26 14:18:03.850 | DEBUG    | __main__:trials:24 - Trial = 20165/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.852 | DEBUG    | __main__:trials:29 - Trial = 20165/30000 | Total reward = 40.25
2022-01-26 14:18:03.856 | DEBUG    | __main__:trials:24 - Trial = 20166/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.857 | DEBUG    | __main__:trials:29 - Trial = 20166/30000 | Total reward = 55.69
2022-01-26 14:18:03.860 | DEBUG    | __main__:trials:24 - Trial = 20167/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.862 | DEBUG    | __main__:trials:29 - Trial = 20167/30000 | Total reward = 36.39
2022-01-26 14:18:03.866 | DEBUG    | __main__:trials:24 - Trial = 20168/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.867 | DEBUG    | __main__:trials:29 - Trial = 20168/30000 | Total reward = 41.99
2022-01-26 14:18:03.871 | DEBUG    | __main__:trials:24 - Trial = 20169/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.872 | DEBUG    | __main__:trials:29 - Trial = 20169/30000 | Total reward = 49.42
2022-01-26 14:18:03.876 | DEBUG    | __main__:trials:24 - Trial = 20170/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.877 | DEBUG    | __main__:trials:29 - Trial = 20170/30000 | Total reward = 36.74
2022-01-26 14:18:03.881 | DEBUG    | __main__:trials:26 - Trial = 20171/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:03.883 | DEBUG    | __main__:trials:29 - Trial = 20171/30000 | Total reward = 18.78
2022-01-26 14:18:03.886 | DEBUG    | __main__:trials:24 - Trial = 20172/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.888 | DEBUG    | __main__:trials:29 - Trial = 20172/30000 | Total reward = 37.20
2022-01-26 14:18:03.892 | DEBUG    | __main__:trials:24 - Trial = 20173/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.893 | DEBUG    | __main__:trials:29 - Trial = 20173/30000 | Total reward = 38.63
2022-01-26 14:18:03.896 | DEBUG    | __main__:trials:24 - Trial = 20174/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.899 | DEBUG    | __main__:trials:29 - Trial = 20174/30000 | Total reward = 46.75
2022-01-26 14:18:03.902 | DEBUG    | __main__:trials:24 - Trial = 20175/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.903 | DEBUG    | __main__:trials:29 - Trial = 20175/30000 | Total reward = 42.96
2022-01-26 14:18:03.907 | DEBUG    | __main__:trials:26 - Trial = 20176/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:03.909 | DEBUG    | __main__:trials:29 - Trial = 20176/30000 | Total reward = 21.58
2022-01-26 14:18:03.913 | DEBUG    | __main__:trials:24 - Trial = 20177/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.914 | DEBUG    | __main__:trials:29 - Trial = 20177/30000 | Total reward = 37.79
2022-01-26 14:18:03.917 | DEBUG    | __main__:trials:24 - Trial = 20178/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.918 | DEBUG    | __main__:trials:29 - Trial = 20178/30000 | Total reward = 36.26
2022-01-26 14:18:03.921 | DEBUG    | __main__:trials:24 - Trial = 20179/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.923 | DEBUG    | __main__:trials:29 - Trial = 20179/30000 | Total reward = 55.49
2022-01-26 14:18:03.926 | DEBUG    | __main__:trials:24 - Trial = 20180/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.927 | DEBUG    | __main__:trials:29 - Trial = 20180/30000 | Total reward = 50.36
2022-01-26 14:18:03.931 | DEBUG    | __main__:trials:24 - Trial = 20181/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.931 | DEBUG    | __main__:trials:29 - Trial = 20181/30000 | Total reward = 45.99
2022-01-26 14:18:03.935 | DEBUG    | __main__:trials:24 - Trial = 20182/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.935 | DEBUG    | __main__:trials:29 - Trial = 20182/30000 | Total reward = 47.49
2022-01-26 14:18:03.939 | DEBUG    | __main__:trials:24 - Trial = 20183/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.940 | DEBUG    | __main__:trials:29 - Trial = 20183/30000 | Total reward = 43.60
2022-01-26 14:18:03.943 | DEBUG    | __main__:trials:24 - Trial = 20184/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.945 | DEBUG    | __main__:trials:29 - Trial = 20184/30000 | Total reward = 36.55
2022-01-26 14:18:03.949 | DEBUG    | __main__:trials:24 - Trial = 20185/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.950 | DEBUG    | __main__:trials:29 - Trial = 20185/30000 | Total reward = 45.82
2022-01-26 14:18:03.953 | DEBUG    | __main__:trials:24 - Trial = 20186/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.954 | DEBUG    | __main__:trials:29 - Trial = 20186/30000 | Total reward = 48.99
2022-01-26 14:18:03.957 | DEBUG    | __main__:trials:24 - Trial = 20187/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.959 | DEBUG    | __main__:trials:29 - Trial = 20187/30000 | Total reward = 39.48
2022-01-26 14:18:03.963 | DEBUG    | __main__:trials:26 - Trial = 20188/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:03.964 | DEBUG    | __main__:trials:29 - Trial = 20188/30000 | Total reward = 26.61
2022-01-26 14:18:03.968 | DEBUG    | __main__:trials:24 - Trial = 20189/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.970 | DEBUG    | __main__:trials:29 - Trial = 20189/30000 | Total reward = 38.35
2022-01-26 14:18:03.974 | DEBUG    | __main__:trials:24 - Trial = 20190/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.976 | DEBUG    | __main__:trials:29 - Trial = 20190/30000 | Total reward = 39.72
2022-01-26 14:18:03.980 | DEBUG    | __main__:trials:24 - Trial = 20191/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.981 | DEBUG    | __main__:trials:29 - Trial = 20191/30000 | Total reward = 43.92
2022-01-26 14:18:03.984 | DEBUG    | __main__:trials:24 - Trial = 20192/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.986 | DEBUG    | __main__:trials:29 - Trial = 20192/30000 | Total reward = 53.03
2022-01-26 14:18:03.990 | DEBUG    | __main__:trials:24 - Trial = 20193/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.991 | DEBUG    | __main__:trials:29 - Trial = 20193/30000 | Total reward = 38.72
2022-01-26 14:18:03.994 | DEBUG    | __main__:trials:24 - Trial = 20194/30000 | Max number of steps (20) reached
2022-01-26 14:18:03.996 | DEBUG    | __main__:trials:29 - Trial = 20194/30000 | Total reward = 48.17
2022-01-26 14:18:04.000 | DEBUG    | __main__:trials:24 - Trial = 20195/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.001 | DEBUG    | __main__:trials:29 - Trial = 20195/30000 | Total reward = 41.38
2022-01-26 14:18:04.005 | DEBUG    | __main__:trials:24 - Trial = 20196/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.005 | DEBUG    | __main__:trials:29 - Trial = 20196/30000 | Total reward = 41.82
2022-01-26 14:18:04.010 | DEBUG    | __main__:trials:24 - Trial = 20197/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.010 | DEBUG    | __main__:trials:29 - Trial = 20197/30000 | Total reward = 49.63
2022-01-26 14:18:04.014 | DEBUG    | __main__:trials:24 - Trial = 20198/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.015 | DEBUG    | __main__:trials:29 - Trial = 20198/30000 | Total reward = 40.25
2022-01-26 14:18:04.020 | DEBUG    | __main__:trials:24 - Trial = 20199/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.021 | DEBUG    | __main__:trials:29 - Trial = 20199/30000 | Total reward = 37.32
2022-01-26 14:18:04.025 | DEBUG    | __main__:trials:24 - Trial = 20200/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.027 | DEBUG    | __main__:trials:29 - Trial = 20200/30000 | Total reward = 31.53
2022-01-26 14:18:04.030 | DEBUG    | __main__:trials:24 - Trial = 20201/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.032 | DEBUG    | __main__:trials:29 - Trial = 20201/30000 | Total reward = 33.10
2022-01-26 14:18:04.035 | DEBUG    | __main__:trials:24 - Trial = 20202/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.036 | DEBUG    | __main__:trials:29 - Trial = 20202/30000 | Total reward = 37.57
2022-01-26 14:18:04.040 | DEBUG    | __main__:trials:24 - Trial = 20203/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.041 | DEBUG    | __main__:trials:29 - Trial = 20203/30000 | Total reward = 36.85
2022-01-26 14:18:04.045 | DEBUG    | __main__:trials:26 - Trial = 20204/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.046 | DEBUG    | __main__:trials:29 - Trial = 20204/30000 | Total reward = 25.87
2022-01-26 14:18:04.050 | DEBUG    | __main__:trials:24 - Trial = 20205/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.051 | DEBUG    | __main__:trials:29 - Trial = 20205/30000 | Total reward = 50.23
2022-01-26 14:18:04.055 | DEBUG    | __main__:trials:24 - Trial = 20206/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.057 | DEBUG    | __main__:trials:29 - Trial = 20206/30000 | Total reward = 50.71
2022-01-26 14:18:04.061 | DEBUG    | __main__:trials:24 - Trial = 20207/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.062 | DEBUG    | __main__:trials:29 - Trial = 20207/30000 | Total reward = 37.73
2022-01-26 14:18:04.065 | DEBUG    | __main__:trials:24 - Trial = 20208/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.066 | DEBUG    | __main__:trials:29 - Trial = 20208/30000 | Total reward = 38.19
2022-01-26 14:18:04.069 | DEBUG    | __main__:trials:26 - Trial = 20209/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.071 | DEBUG    | __main__:trials:29 - Trial = 20209/30000 | Total reward = 31.89
2022-01-26 14:18:04.074 | DEBUG    | __main__:trials:24 - Trial = 20210/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.074 | DEBUG    | __main__:trials:29 - Trial = 20210/30000 | Total reward = 40.60
2022-01-26 14:18:04.077 | DEBUG    | __main__:trials:26 - Trial = 20211/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.078 | DEBUG    | __main__:trials:29 - Trial = 20211/30000 | Total reward = 18.28
2022-01-26 14:18:04.081 | DEBUG    | __main__:trials:24 - Trial = 20212/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.083 | DEBUG    | __main__:trials:29 - Trial = 20212/30000 | Total reward = 44.25
2022-01-26 14:18:04.087 | DEBUG    | __main__:trials:24 - Trial = 20213/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.089 | DEBUG    | __main__:trials:29 - Trial = 20213/30000 | Total reward = 45.04
2022-01-26 14:18:04.092 | DEBUG    | __main__:trials:24 - Trial = 20214/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.093 | DEBUG    | __main__:trials:29 - Trial = 20214/30000 | Total reward = 40.11
2022-01-26 14:18:04.097 | DEBUG    | __main__:trials:24 - Trial = 20215/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.098 | DEBUG    | __main__:trials:29 - Trial = 20215/30000 | Total reward = 50.09
2022-01-26 14:18:04.101 | DEBUG    | __main__:trials:24 - Trial = 20216/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.103 | DEBUG    | __main__:trials:29 - Trial = 20216/30000 | Total reward = 38.64
2022-01-26 14:18:04.106 | DEBUG    | __main__:trials:24 - Trial = 20217/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.108 | DEBUG    | __main__:trials:29 - Trial = 20217/30000 | Total reward = 49.66
2022-01-26 14:18:04.111 | DEBUG    | __main__:trials:26 - Trial = 20218/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.111 | DEBUG    | __main__:trials:29 - Trial = 20218/30000 | Total reward = 11.25
2022-01-26 14:18:04.115 | DEBUG    | __main__:trials:24 - Trial = 20219/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.117 | DEBUG    | __main__:trials:29 - Trial = 20219/30000 | Total reward = 36.78
2022-01-26 14:18:04.120 | DEBUG    | __main__:trials:24 - Trial = 20220/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.122 | DEBUG    | __main__:trials:29 - Trial = 20220/30000 | Total reward = 41.28
2022-01-26 14:18:04.125 | DEBUG    | __main__:trials:26 - Trial = 20221/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.126 | DEBUG    | __main__:trials:29 - Trial = 20221/30000 | Total reward = 16.16
2022-01-26 14:18:04.130 | DEBUG    | __main__:trials:24 - Trial = 20222/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.132 | DEBUG    | __main__:trials:29 - Trial = 20222/30000 | Total reward = 37.87
2022-01-26 14:18:04.135 | DEBUG    | __main__:trials:24 - Trial = 20223/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.137 | DEBUG    | __main__:trials:29 - Trial = 20223/30000 | Total reward = 36.58
2022-01-26 14:18:04.140 | DEBUG    | __main__:trials:24 - Trial = 20224/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.142 | DEBUG    | __main__:trials:29 - Trial = 20224/30000 | Total reward = 41.03
2022-01-26 14:18:04.146 | DEBUG    | __main__:trials:24 - Trial = 20225/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.147 | DEBUG    | __main__:trials:29 - Trial = 20225/30000 | Total reward = 40.66
2022-01-26 14:18:04.150 | DEBUG    | __main__:trials:26 - Trial = 20226/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.151 | DEBUG    | __main__:trials:29 - Trial = 20226/30000 | Total reward = 11.38
2022-01-26 14:18:04.155 | DEBUG    | __main__:trials:24 - Trial = 20227/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.156 | DEBUG    | __main__:trials:29 - Trial = 20227/30000 | Total reward = 38.53
2022-01-26 14:18:04.159 | DEBUG    | __main__:trials:24 - Trial = 20228/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.161 | DEBUG    | __main__:trials:29 - Trial = 20228/30000 | Total reward = 34.68
2022-01-26 14:18:04.164 | DEBUG    | __main__:trials:24 - Trial = 20229/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.166 | DEBUG    | __main__:trials:29 - Trial = 20229/30000 | Total reward = 49.42
2022-01-26 14:18:04.169 | DEBUG    | __main__:trials:24 - Trial = 20230/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.170 | DEBUG    | __main__:trials:29 - Trial = 20230/30000 | Total reward = 38.62
2022-01-26 14:18:04.173 | DEBUG    | __main__:trials:24 - Trial = 20231/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.175 | DEBUG    | __main__:trials:29 - Trial = 20231/30000 | Total reward = 29.16
2022-01-26 14:18:04.178 | DEBUG    | __main__:trials:24 - Trial = 20232/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.178 | DEBUG    | __main__:trials:29 - Trial = 20232/30000 | Total reward = 47.28
2022-01-26 14:18:04.182 | DEBUG    | __main__:trials:24 - Trial = 20233/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.184 | DEBUG    | __main__:trials:29 - Trial = 20233/30000 | Total reward = 40.99
2022-01-26 14:18:04.187 | DEBUG    | __main__:trials:24 - Trial = 20234/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.189 | DEBUG    | __main__:trials:29 - Trial = 20234/30000 | Total reward = 31.82
2022-01-26 14:18:04.193 | DEBUG    | __main__:trials:24 - Trial = 20235/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.194 | DEBUG    | __main__:trials:29 - Trial = 20235/30000 | Total reward = 41.50
2022-01-26 14:18:04.197 | DEBUG    | __main__:trials:26 - Trial = 20236/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.199 | DEBUG    | __main__:trials:29 - Trial = 20236/30000 | Total reward = 30.50
2022-01-26 14:18:04.203 | DEBUG    | __main__:trials:24 - Trial = 20237/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.204 | DEBUG    | __main__:trials:29 - Trial = 20237/30000 | Total reward = 34.57
2022-01-26 14:18:04.207 | DEBUG    | __main__:trials:24 - Trial = 20238/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.209 | DEBUG    | __main__:trials:29 - Trial = 20238/30000 | Total reward = 41.04
2022-01-26 14:18:04.212 | DEBUG    | __main__:trials:24 - Trial = 20239/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.214 | DEBUG    | __main__:trials:29 - Trial = 20239/30000 | Total reward = 39.65
2022-01-26 14:18:04.218 | DEBUG    | __main__:trials:24 - Trial = 20240/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.219 | DEBUG    | __main__:trials:29 - Trial = 20240/30000 | Total reward = 46.99
2022-01-26 14:18:04.223 | DEBUG    | __main__:trials:24 - Trial = 20241/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.224 | DEBUG    | __main__:trials:29 - Trial = 20241/30000 | Total reward = 46.26
2022-01-26 14:18:04.228 | DEBUG    | __main__:trials:24 - Trial = 20242/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.229 | DEBUG    | __main__:trials:29 - Trial = 20242/30000 | Total reward = 47.32
2022-01-26 14:18:04.233 | DEBUG    | __main__:trials:24 - Trial = 20243/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.234 | DEBUG    | __main__:trials:29 - Trial = 20243/30000 | Total reward = 38.11
2022-01-26 14:18:04.237 | DEBUG    | __main__:trials:24 - Trial = 20244/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.239 | DEBUG    | __main__:trials:29 - Trial = 20244/30000 | Total reward = 33.29
2022-01-26 14:18:04.242 | DEBUG    | __main__:trials:24 - Trial = 20245/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.243 | DEBUG    | __main__:trials:29 - Trial = 20245/30000 | Total reward = 46.23
2022-01-26 14:18:04.247 | DEBUG    | __main__:trials:24 - Trial = 20246/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.249 | DEBUG    | __main__:trials:29 - Trial = 20246/30000 | Total reward = 47.08
2022-01-26 14:18:04.252 | DEBUG    | __main__:trials:24 - Trial = 20247/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.253 | DEBUG    | __main__:trials:29 - Trial = 20247/30000 | Total reward = 32.34
2022-01-26 14:18:04.256 | DEBUG    | __main__:trials:24 - Trial = 20248/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.258 | DEBUG    | __main__:trials:29 - Trial = 20248/30000 | Total reward = 38.21
2022-01-26 14:18:04.261 | DEBUG    | __main__:trials:24 - Trial = 20249/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.263 | DEBUG    | __main__:trials:29 - Trial = 20249/30000 | Total reward = 38.10
2022-01-26 14:18:04.266 | DEBUG    | __main__:trials:24 - Trial = 20250/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.266 | DEBUG    | __main__:trials:29 - Trial = 20250/30000 | Total reward = 37.94
2022-01-26 14:18:04.270 | DEBUG    | __main__:trials:24 - Trial = 20251/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.272 | DEBUG    | __main__:trials:29 - Trial = 20251/30000 | Total reward = 50.52
2022-01-26 14:18:04.276 | DEBUG    | __main__:trials:24 - Trial = 20252/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.277 | DEBUG    | __main__:trials:29 - Trial = 20252/30000 | Total reward = 27.70
2022-01-26 14:18:04.281 | DEBUG    | __main__:trials:24 - Trial = 20253/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.282 | DEBUG    | __main__:trials:29 - Trial = 20253/30000 | Total reward = 44.79
2022-01-26 14:18:04.286 | DEBUG    | __main__:trials:24 - Trial = 20254/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.287 | DEBUG    | __main__:trials:29 - Trial = 20254/30000 | Total reward = 43.94
2022-01-26 14:18:04.291 | DEBUG    | __main__:trials:24 - Trial = 20255/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.293 | DEBUG    | __main__:trials:29 - Trial = 20255/30000 | Total reward = 46.31
2022-01-26 14:18:04.296 | DEBUG    | __main__:trials:24 - Trial = 20256/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.297 | DEBUG    | __main__:trials:29 - Trial = 20256/30000 | Total reward = 35.12
2022-01-26 14:18:04.301 | DEBUG    | __main__:trials:24 - Trial = 20257/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.302 | DEBUG    | __main__:trials:29 - Trial = 20257/30000 | Total reward = 34.46
2022-01-26 14:18:04.306 | DEBUG    | __main__:trials:24 - Trial = 20258/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.307 | DEBUG    | __main__:trials:29 - Trial = 20258/30000 | Total reward = 37.66
2022-01-26 14:18:04.311 | DEBUG    | __main__:trials:26 - Trial = 20259/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.312 | DEBUG    | __main__:trials:29 - Trial = 20259/30000 | Total reward = 17.90
2022-01-26 14:18:04.316 | DEBUG    | __main__:trials:24 - Trial = 20260/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.318 | DEBUG    | __main__:trials:29 - Trial = 20260/30000 | Total reward = 44.92
2022-01-26 14:18:04.322 | DEBUG    | __main__:trials:24 - Trial = 20261/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.323 | DEBUG    | __main__:trials:29 - Trial = 20261/30000 | Total reward = 48.94
2022-01-26 14:18:04.326 | DEBUG    | __main__:trials:24 - Trial = 20262/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.328 | DEBUG    | __main__:trials:29 - Trial = 20262/30000 | Total reward = 34.91
2022-01-26 14:18:04.332 | DEBUG    | __main__:trials:24 - Trial = 20263/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.334 | DEBUG    | __main__:trials:29 - Trial = 20263/30000 | Total reward = 40.03
2022-01-26 14:18:04.338 | DEBUG    | __main__:trials:24 - Trial = 20264/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.339 | DEBUG    | __main__:trials:29 - Trial = 20264/30000 | Total reward = 43.35
2022-01-26 14:18:04.343 | DEBUG    | __main__:trials:24 - Trial = 20265/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.344 | DEBUG    | __main__:trials:29 - Trial = 20265/30000 | Total reward = 39.60
2022-01-26 14:18:04.348 | DEBUG    | __main__:trials:24 - Trial = 20266/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.349 | DEBUG    | __main__:trials:29 - Trial = 20266/30000 | Total reward = 48.58
2022-01-26 14:18:04.354 | DEBUG    | __main__:trials:24 - Trial = 20267/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.355 | DEBUG    | __main__:trials:29 - Trial = 20267/30000 | Total reward = 33.57
2022-01-26 14:18:04.359 | DEBUG    | __main__:trials:24 - Trial = 20268/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.360 | DEBUG    | __main__:trials:29 - Trial = 20268/30000 | Total reward = 37.95
2022-01-26 14:18:04.364 | DEBUG    | __main__:trials:24 - Trial = 20269/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.365 | DEBUG    | __main__:trials:29 - Trial = 20269/30000 | Total reward = 44.01
2022-01-26 14:18:04.370 | DEBUG    | __main__:trials:24 - Trial = 20270/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.371 | DEBUG    | __main__:trials:29 - Trial = 20270/30000 | Total reward = 38.26
2022-01-26 14:18:04.375 | DEBUG    | __main__:trials:24 - Trial = 20271/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.377 | DEBUG    | __main__:trials:29 - Trial = 20271/30000 | Total reward = 44.88
2022-01-26 14:18:04.380 | DEBUG    | __main__:trials:24 - Trial = 20272/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.382 | DEBUG    | __main__:trials:29 - Trial = 20272/30000 | Total reward = 41.54
2022-01-26 14:18:04.386 | DEBUG    | __main__:trials:24 - Trial = 20273/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.387 | DEBUG    | __main__:trials:29 - Trial = 20273/30000 | Total reward = 34.01
2022-01-26 14:18:04.391 | DEBUG    | __main__:trials:24 - Trial = 20274/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.392 | DEBUG    | __main__:trials:29 - Trial = 20274/30000 | Total reward = 54.31
2022-01-26 14:18:04.396 | DEBUG    | __main__:trials:24 - Trial = 20275/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.398 | DEBUG    | __main__:trials:29 - Trial = 20275/30000 | Total reward = 39.39
2022-01-26 14:18:04.401 | DEBUG    | __main__:trials:24 - Trial = 20276/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.403 | DEBUG    | __main__:trials:29 - Trial = 20276/30000 | Total reward = 36.72
2022-01-26 14:18:04.406 | DEBUG    | __main__:trials:24 - Trial = 20277/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.407 | DEBUG    | __main__:trials:29 - Trial = 20277/30000 | Total reward = 40.61
2022-01-26 14:18:04.411 | DEBUG    | __main__:trials:24 - Trial = 20278/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.413 | DEBUG    | __main__:trials:29 - Trial = 20278/30000 | Total reward = 37.43
2022-01-26 14:18:04.416 | DEBUG    | __main__:trials:24 - Trial = 20279/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.418 | DEBUG    | __main__:trials:29 - Trial = 20279/30000 | Total reward = 40.25
2022-01-26 14:18:04.422 | DEBUG    | __main__:trials:24 - Trial = 20280/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.423 | DEBUG    | __main__:trials:29 - Trial = 20280/30000 | Total reward = 43.97
2022-01-26 14:18:04.427 | DEBUG    | __main__:trials:24 - Trial = 20281/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.429 | DEBUG    | __main__:trials:29 - Trial = 20281/30000 | Total reward = 32.51
2022-01-26 14:18:04.433 | DEBUG    | __main__:trials:24 - Trial = 20282/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.434 | DEBUG    | __main__:trials:29 - Trial = 20282/30000 | Total reward = 32.91
2022-01-26 14:18:04.437 | DEBUG    | __main__:trials:24 - Trial = 20283/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.438 | DEBUG    | __main__:trials:29 - Trial = 20283/30000 | Total reward = 35.00
2022-01-26 14:18:04.443 | DEBUG    | __main__:trials:26 - Trial = 20284/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.445 | DEBUG    | __main__:trials:29 - Trial = 20284/30000 | Total reward = 34.52
2022-01-26 14:18:04.448 | DEBUG    | __main__:trials:24 - Trial = 20285/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.449 | DEBUG    | __main__:trials:29 - Trial = 20285/30000 | Total reward = 38.08
2022-01-26 14:18:04.453 | DEBUG    | __main__:trials:24 - Trial = 20286/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.453 | DEBUG    | __main__:trials:29 - Trial = 20286/30000 | Total reward = 47.32
2022-01-26 14:18:04.457 | DEBUG    | __main__:trials:24 - Trial = 20287/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.458 | DEBUG    | __main__:trials:29 - Trial = 20287/30000 | Total reward = 37.87
2022-01-26 14:18:04.462 | DEBUG    | __main__:trials:24 - Trial = 20288/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.463 | DEBUG    | __main__:trials:29 - Trial = 20288/30000 | Total reward = 38.21
2022-01-26 14:18:04.467 | DEBUG    | __main__:trials:24 - Trial = 20289/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.468 | DEBUG    | __main__:trials:29 - Trial = 20289/30000 | Total reward = 36.48
2022-01-26 14:18:04.472 | DEBUG    | __main__:trials:24 - Trial = 20290/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.473 | DEBUG    | __main__:trials:29 - Trial = 20290/30000 | Total reward = 45.49
2022-01-26 14:18:04.477 | DEBUG    | __main__:trials:24 - Trial = 20291/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.478 | DEBUG    | __main__:trials:29 - Trial = 20291/30000 | Total reward = 40.41
2022-01-26 14:18:04.482 | DEBUG    | __main__:trials:24 - Trial = 20292/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.483 | DEBUG    | __main__:trials:29 - Trial = 20292/30000 | Total reward = 41.76
2022-01-26 14:18:04.487 | DEBUG    | __main__:trials:24 - Trial = 20293/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.489 | DEBUG    | __main__:trials:29 - Trial = 20293/30000 | Total reward = 37.00
2022-01-26 14:18:04.492 | DEBUG    | __main__:trials:24 - Trial = 20294/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.494 | DEBUG    | __main__:trials:29 - Trial = 20294/30000 | Total reward = 35.55
2022-01-26 14:18:04.498 | DEBUG    | __main__:trials:24 - Trial = 20295/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.498 | DEBUG    | __main__:trials:29 - Trial = 20295/30000 | Total reward = 41.48
2022-01-26 14:18:04.503 | DEBUG    | __main__:trials:24 - Trial = 20296/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.504 | DEBUG    | __main__:trials:29 - Trial = 20296/30000 | Total reward = 37.23
2022-01-26 14:18:04.508 | DEBUG    | __main__:trials:24 - Trial = 20297/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.508 | DEBUG    | __main__:trials:29 - Trial = 20297/30000 | Total reward = 51.23
2022-01-26 14:18:04.513 | DEBUG    | __main__:trials:24 - Trial = 20298/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.515 | DEBUG    | __main__:trials:29 - Trial = 20298/30000 | Total reward = 40.25
2022-01-26 14:18:04.519 | DEBUG    | __main__:trials:24 - Trial = 20299/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.520 | DEBUG    | __main__:trials:29 - Trial = 20299/30000 | Total reward = 44.33
2022-01-26 14:18:04.524 | DEBUG    | __main__:trials:24 - Trial = 20300/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.525 | DEBUG    | __main__:trials:29 - Trial = 20300/30000 | Total reward = 40.49
2022-01-26 14:18:04.529 | DEBUG    | __main__:trials:24 - Trial = 20301/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.530 | DEBUG    | __main__:trials:29 - Trial = 20301/30000 | Total reward = 53.59
2022-01-26 14:18:04.533 | DEBUG    | __main__:trials:24 - Trial = 20302/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.534 | DEBUG    | __main__:trials:29 - Trial = 20302/30000 | Total reward = 40.84
2022-01-26 14:18:04.537 | DEBUG    | __main__:trials:24 - Trial = 20303/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.538 | DEBUG    | __main__:trials:29 - Trial = 20303/30000 | Total reward = 40.49
2022-01-26 14:18:04.542 | DEBUG    | __main__:trials:24 - Trial = 20304/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.544 | DEBUG    | __main__:trials:29 - Trial = 20304/30000 | Total reward = 40.25
2022-01-26 14:18:04.548 | DEBUG    | __main__:trials:24 - Trial = 20305/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.549 | DEBUG    | __main__:trials:29 - Trial = 20305/30000 | Total reward = 46.58
2022-01-26 14:18:04.553 | DEBUG    | __main__:trials:24 - Trial = 20306/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.554 | DEBUG    | __main__:trials:29 - Trial = 20306/30000 | Total reward = 44.56
2022-01-26 14:18:04.557 | DEBUG    | __main__:trials:24 - Trial = 20307/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.559 | DEBUG    | __main__:trials:29 - Trial = 20307/30000 | Total reward = 37.77
2022-01-26 14:18:04.563 | DEBUG    | __main__:trials:24 - Trial = 20308/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.563 | DEBUG    | __main__:trials:29 - Trial = 20308/30000 | Total reward = 38.34
2022-01-26 14:18:04.567 | DEBUG    | __main__:trials:24 - Trial = 20309/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.569 | DEBUG    | __main__:trials:29 - Trial = 20309/30000 | Total reward = 46.95
2022-01-26 14:18:04.573 | DEBUG    | __main__:trials:24 - Trial = 20310/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.574 | DEBUG    | __main__:trials:29 - Trial = 20310/30000 | Total reward = 32.19
2022-01-26 14:18:04.577 | DEBUG    | __main__:trials:24 - Trial = 20311/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.578 | DEBUG    | __main__:trials:29 - Trial = 20311/30000 | Total reward = 42.58
2022-01-26 14:18:04.581 | DEBUG    | __main__:trials:24 - Trial = 20312/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.583 | DEBUG    | __main__:trials:29 - Trial = 20312/30000 | Total reward = 32.69
2022-01-26 14:18:04.587 | DEBUG    | __main__:trials:24 - Trial = 20313/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.588 | DEBUG    | __main__:trials:29 - Trial = 20313/30000 | Total reward = 40.02
2022-01-26 14:18:04.592 | DEBUG    | __main__:trials:24 - Trial = 20314/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.594 | DEBUG    | __main__:trials:29 - Trial = 20314/30000 | Total reward = 49.76
2022-01-26 14:18:04.597 | DEBUG    | __main__:trials:24 - Trial = 20315/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.598 | DEBUG    | __main__:trials:29 - Trial = 20315/30000 | Total reward = 33.88
2022-01-26 14:18:04.602 | DEBUG    | __main__:trials:24 - Trial = 20316/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.603 | DEBUG    | __main__:trials:29 - Trial = 20316/30000 | Total reward = 38.61
2022-01-26 14:18:04.608 | DEBUG    | __main__:trials:24 - Trial = 20317/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.608 | DEBUG    | __main__:trials:29 - Trial = 20317/30000 | Total reward = 37.88
2022-01-26 14:18:04.613 | DEBUG    | __main__:trials:24 - Trial = 20318/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.615 | DEBUG    | __main__:trials:29 - Trial = 20318/30000 | Total reward = 42.58
2022-01-26 14:18:04.619 | DEBUG    | __main__:trials:24 - Trial = 20319/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.620 | DEBUG    | __main__:trials:29 - Trial = 20319/30000 | Total reward = 40.49
2022-01-26 14:18:04.623 | DEBUG    | __main__:trials:24 - Trial = 20320/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.625 | DEBUG    | __main__:trials:29 - Trial = 20320/30000 | Total reward = 40.97
2022-01-26 14:18:04.628 | DEBUG    | __main__:trials:24 - Trial = 20321/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.630 | DEBUG    | __main__:trials:29 - Trial = 20321/30000 | Total reward = 40.59
2022-01-26 14:18:04.634 | DEBUG    | __main__:trials:24 - Trial = 20322/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.635 | DEBUG    | __main__:trials:29 - Trial = 20322/30000 | Total reward = 36.94
2022-01-26 14:18:04.639 | DEBUG    | __main__:trials:24 - Trial = 20323/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.640 | DEBUG    | __main__:trials:29 - Trial = 20323/30000 | Total reward = 27.15
2022-01-26 14:18:04.644 | DEBUG    | __main__:trials:24 - Trial = 20324/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.645 | DEBUG    | __main__:trials:29 - Trial = 20324/30000 | Total reward = 51.47
2022-01-26 14:18:04.649 | DEBUG    | __main__:trials:24 - Trial = 20325/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.650 | DEBUG    | __main__:trials:29 - Trial = 20325/30000 | Total reward = 54.45
2022-01-26 14:18:04.654 | DEBUG    | __main__:trials:24 - Trial = 20326/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.656 | DEBUG    | __main__:trials:29 - Trial = 20326/30000 | Total reward = 43.70
2022-01-26 14:18:04.660 | DEBUG    | __main__:trials:24 - Trial = 20327/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.662 | DEBUG    | __main__:trials:29 - Trial = 20327/30000 | Total reward = 37.53
2022-01-26 14:18:04.665 | DEBUG    | __main__:trials:24 - Trial = 20328/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.666 | DEBUG    | __main__:trials:29 - Trial = 20328/30000 | Total reward = 25.03
2022-01-26 14:18:04.670 | DEBUG    | __main__:trials:24 - Trial = 20329/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.672 | DEBUG    | __main__:trials:29 - Trial = 20329/30000 | Total reward = 32.61
2022-01-26 14:18:04.675 | DEBUG    | __main__:trials:24 - Trial = 20330/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.677 | DEBUG    | __main__:trials:29 - Trial = 20330/30000 | Total reward = 46.29
2022-01-26 14:18:04.680 | DEBUG    | __main__:trials:24 - Trial = 20331/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.682 | DEBUG    | __main__:trials:29 - Trial = 20331/30000 | Total reward = 39.22
2022-01-26 14:18:04.685 | DEBUG    | __main__:trials:26 - Trial = 20332/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.687 | DEBUG    | __main__:trials:29 - Trial = 20332/30000 | Total reward = 24.75
2022-01-26 14:18:04.690 | DEBUG    | __main__:trials:24 - Trial = 20333/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.692 | DEBUG    | __main__:trials:29 - Trial = 20333/30000 | Total reward = 40.25
2022-01-26 14:18:04.695 | DEBUG    | __main__:trials:24 - Trial = 20334/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.697 | DEBUG    | __main__:trials:29 - Trial = 20334/30000 | Total reward = 40.18
2022-01-26 14:18:04.700 | DEBUG    | __main__:trials:24 - Trial = 20335/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.702 | DEBUG    | __main__:trials:29 - Trial = 20335/30000 | Total reward = 37.58
2022-01-26 14:18:04.705 | DEBUG    | __main__:trials:24 - Trial = 20336/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.706 | DEBUG    | __main__:trials:29 - Trial = 20336/30000 | Total reward = 23.28
2022-01-26 14:18:04.710 | DEBUG    | __main__:trials:24 - Trial = 20337/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.711 | DEBUG    | __main__:trials:29 - Trial = 20337/30000 | Total reward = 44.73
2022-01-26 14:18:04.715 | DEBUG    | __main__:trials:24 - Trial = 20338/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.717 | DEBUG    | __main__:trials:29 - Trial = 20338/30000 | Total reward = 40.25
2022-01-26 14:18:04.721 | DEBUG    | __main__:trials:24 - Trial = 20339/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.721 | DEBUG    | __main__:trials:29 - Trial = 20339/30000 | Total reward = 52.03
2022-01-26 14:18:04.725 | DEBUG    | __main__:trials:26 - Trial = 20340/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:04.725 | DEBUG    | __main__:trials:29 - Trial = 20340/30000 | Total reward = 15.90
2022-01-26 14:18:04.729 | DEBUG    | __main__:trials:24 - Trial = 20341/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.730 | DEBUG    | __main__:trials:29 - Trial = 20341/30000 | Total reward = 44.94
2022-01-26 14:18:04.734 | DEBUG    | __main__:trials:24 - Trial = 20342/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.736 | DEBUG    | __main__:trials:29 - Trial = 20342/30000 | Total reward = 44.12
2022-01-26 14:18:04.739 | DEBUG    | __main__:trials:24 - Trial = 20343/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.740 | DEBUG    | __main__:trials:29 - Trial = 20343/30000 | Total reward = 34.77
2022-01-26 14:18:04.745 | DEBUG    | __main__:trials:24 - Trial = 20344/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.746 | DEBUG    | __main__:trials:29 - Trial = 20344/30000 | Total reward = 40.02
2022-01-26 14:18:04.750 | DEBUG    | __main__:trials:24 - Trial = 20345/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.752 | DEBUG    | __main__:trials:29 - Trial = 20345/30000 | Total reward = 44.30
2022-01-26 14:18:04.755 | DEBUG    | __main__:trials:24 - Trial = 20346/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.756 | DEBUG    | __main__:trials:29 - Trial = 20346/30000 | Total reward = 40.25
2022-01-26 14:18:04.760 | DEBUG    | __main__:trials:24 - Trial = 20347/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.762 | DEBUG    | __main__:trials:29 - Trial = 20347/30000 | Total reward = 32.91
2022-01-26 14:18:04.765 | DEBUG    | __main__:trials:24 - Trial = 20348/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.767 | DEBUG    | __main__:trials:29 - Trial = 20348/30000 | Total reward = 37.33
2022-01-26 14:18:04.771 | DEBUG    | __main__:trials:24 - Trial = 20349/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.772 | DEBUG    | __main__:trials:29 - Trial = 20349/30000 | Total reward = 43.20
2022-01-26 14:18:04.776 | DEBUG    | __main__:trials:24 - Trial = 20350/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.778 | DEBUG    | __main__:trials:29 - Trial = 20350/30000 | Total reward = 29.97
2022-01-26 14:18:04.781 | DEBUG    | __main__:trials:24 - Trial = 20351/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.782 | DEBUG    | __main__:trials:29 - Trial = 20351/30000 | Total reward = 35.04
2022-01-26 14:18:04.786 | DEBUG    | __main__:trials:24 - Trial = 20352/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.787 | DEBUG    | __main__:trials:29 - Trial = 20352/30000 | Total reward = 47.16
2022-01-26 14:18:04.791 | DEBUG    | __main__:trials:24 - Trial = 20353/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.793 | DEBUG    | __main__:trials:29 - Trial = 20353/30000 | Total reward = 54.85
2022-01-26 14:18:04.796 | DEBUG    | __main__:trials:24 - Trial = 20354/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.798 | DEBUG    | __main__:trials:29 - Trial = 20354/30000 | Total reward = 36.03
2022-01-26 14:18:04.801 | DEBUG    | __main__:trials:24 - Trial = 20355/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.803 | DEBUG    | __main__:trials:29 - Trial = 20355/30000 | Total reward = 46.74
2022-01-26 14:18:04.806 | DEBUG    | __main__:trials:24 - Trial = 20356/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.807 | DEBUG    | __main__:trials:29 - Trial = 20356/30000 | Total reward = 33.20
2022-01-26 14:18:04.810 | DEBUG    | __main__:trials:24 - Trial = 20357/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.811 | DEBUG    | __main__:trials:29 - Trial = 20357/30000 | Total reward = 37.62
2022-01-26 14:18:04.814 | DEBUG    | __main__:trials:24 - Trial = 20358/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.816 | DEBUG    | __main__:trials:29 - Trial = 20358/30000 | Total reward = 37.54
2022-01-26 14:18:04.820 | DEBUG    | __main__:trials:24 - Trial = 20359/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.821 | DEBUG    | __main__:trials:29 - Trial = 20359/30000 | Total reward = 32.52
2022-01-26 14:18:04.825 | DEBUG    | __main__:trials:24 - Trial = 20360/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.827 | DEBUG    | __main__:trials:29 - Trial = 20360/30000 | Total reward = 43.30
2022-01-26 14:18:04.831 | DEBUG    | __main__:trials:24 - Trial = 20361/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.832 | DEBUG    | __main__:trials:29 - Trial = 20361/30000 | Total reward = 31.45
2022-01-26 14:18:04.836 | DEBUG    | __main__:trials:24 - Trial = 20362/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.838 | DEBUG    | __main__:trials:29 - Trial = 20362/30000 | Total reward = 43.66
2022-01-26 14:18:04.842 | DEBUG    | __main__:trials:24 - Trial = 20363/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.843 | DEBUG    | __main__:trials:29 - Trial = 20363/30000 | Total reward = 39.01
2022-01-26 14:18:04.847 | DEBUG    | __main__:trials:24 - Trial = 20364/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.848 | DEBUG    | __main__:trials:29 - Trial = 20364/30000 | Total reward = 38.80
2022-01-26 14:18:04.852 | DEBUG    | __main__:trials:24 - Trial = 20365/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.853 | DEBUG    | __main__:trials:29 - Trial = 20365/30000 | Total reward = 46.21
2022-01-26 14:18:04.857 | DEBUG    | __main__:trials:24 - Trial = 20366/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.858 | DEBUG    | __main__:trials:29 - Trial = 20366/30000 | Total reward = 37.69
2022-01-26 14:18:04.861 | DEBUG    | __main__:trials:24 - Trial = 20367/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.862 | DEBUG    | __main__:trials:29 - Trial = 20367/30000 | Total reward = 37.64
2022-01-26 14:18:04.865 | DEBUG    | __main__:trials:24 - Trial = 20368/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.867 | DEBUG    | __main__:trials:29 - Trial = 20368/30000 | Total reward = 48.19
2022-01-26 14:18:04.870 | DEBUG    | __main__:trials:24 - Trial = 20369/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.871 | DEBUG    | __main__:trials:29 - Trial = 20369/30000 | Total reward = 38.22
2022-01-26 14:18:04.874 | DEBUG    | __main__:trials:24 - Trial = 20370/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.876 | DEBUG    | __main__:trials:29 - Trial = 20370/30000 | Total reward = 38.30
2022-01-26 14:18:04.880 | DEBUG    | __main__:trials:24 - Trial = 20371/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.881 | DEBUG    | __main__:trials:29 - Trial = 20371/30000 | Total reward = 37.11
2022-01-26 14:18:04.886 | DEBUG    | __main__:trials:24 - Trial = 20372/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.886 | DEBUG    | __main__:trials:29 - Trial = 20372/30000 | Total reward = 16.16
2022-01-26 14:18:04.891 | DEBUG    | __main__:trials:24 - Trial = 20373/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.892 | DEBUG    | __main__:trials:29 - Trial = 20373/30000 | Total reward = 40.92
2022-01-26 14:18:04.896 | DEBUG    | __main__:trials:24 - Trial = 20374/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.898 | DEBUG    | __main__:trials:29 - Trial = 20374/30000 | Total reward = 38.17
2022-01-26 14:18:04.901 | DEBUG    | __main__:trials:24 - Trial = 20375/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.902 | DEBUG    | __main__:trials:29 - Trial = 20375/30000 | Total reward = 53.58
2022-01-26 14:18:04.906 | DEBUG    | __main__:trials:24 - Trial = 20376/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.907 | DEBUG    | __main__:trials:29 - Trial = 20376/30000 | Total reward = 40.25
2022-01-26 14:18:04.911 | DEBUG    | __main__:trials:24 - Trial = 20377/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.912 | DEBUG    | __main__:trials:29 - Trial = 20377/30000 | Total reward = 40.25
2022-01-26 14:18:04.915 | DEBUG    | __main__:trials:24 - Trial = 20378/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.917 | DEBUG    | __main__:trials:29 - Trial = 20378/30000 | Total reward = 44.96
2022-01-26 14:18:04.921 | DEBUG    | __main__:trials:24 - Trial = 20379/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.921 | DEBUG    | __main__:trials:29 - Trial = 20379/30000 | Total reward = 35.80
2022-01-26 14:18:04.926 | DEBUG    | __main__:trials:24 - Trial = 20380/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.927 | DEBUG    | __main__:trials:29 - Trial = 20380/30000 | Total reward = 24.33
2022-01-26 14:18:04.930 | DEBUG    | __main__:trials:24 - Trial = 20381/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.932 | DEBUG    | __main__:trials:29 - Trial = 20381/30000 | Total reward = 45.57
2022-01-26 14:18:04.935 | DEBUG    | __main__:trials:24 - Trial = 20382/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.937 | DEBUG    | __main__:trials:29 - Trial = 20382/30000 | Total reward = 40.34
2022-01-26 14:18:04.940 | DEBUG    | __main__:trials:24 - Trial = 20383/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.942 | DEBUG    | __main__:trials:29 - Trial = 20383/30000 | Total reward = 45.56
2022-01-26 14:18:04.945 | DEBUG    | __main__:trials:24 - Trial = 20384/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.946 | DEBUG    | __main__:trials:29 - Trial = 20384/30000 | Total reward = 46.64
2022-01-26 14:18:04.951 | DEBUG    | __main__:trials:24 - Trial = 20385/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.952 | DEBUG    | __main__:trials:29 - Trial = 20385/30000 | Total reward = 40.49
2022-01-26 14:18:04.955 | DEBUG    | __main__:trials:24 - Trial = 20386/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.957 | DEBUG    | __main__:trials:29 - Trial = 20386/30000 | Total reward = 43.56
2022-01-26 14:18:04.961 | DEBUG    | __main__:trials:24 - Trial = 20387/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.962 | DEBUG    | __main__:trials:29 - Trial = 20387/30000 | Total reward = 48.60
2022-01-26 14:18:04.966 | DEBUG    | __main__:trials:24 - Trial = 20388/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.968 | DEBUG    | __main__:trials:29 - Trial = 20388/30000 | Total reward = 31.74
2022-01-26 14:18:04.971 | DEBUG    | __main__:trials:24 - Trial = 20389/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.973 | DEBUG    | __main__:trials:29 - Trial = 20389/30000 | Total reward = 40.49
2022-01-26 14:18:04.977 | DEBUG    | __main__:trials:24 - Trial = 20390/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.977 | DEBUG    | __main__:trials:29 - Trial = 20390/30000 | Total reward = 30.67
2022-01-26 14:18:04.982 | DEBUG    | __main__:trials:24 - Trial = 20391/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.982 | DEBUG    | __main__:trials:29 - Trial = 20391/30000 | Total reward = 40.25
2022-01-26 14:18:04.987 | DEBUG    | __main__:trials:24 - Trial = 20392/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.988 | DEBUG    | __main__:trials:29 - Trial = 20392/30000 | Total reward = 47.99
2022-01-26 14:18:04.992 | DEBUG    | __main__:trials:24 - Trial = 20393/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.993 | DEBUG    | __main__:trials:29 - Trial = 20393/30000 | Total reward = 48.39
2022-01-26 14:18:04.997 | DEBUG    | __main__:trials:24 - Trial = 20394/30000 | Max number of steps (20) reached
2022-01-26 14:18:04.998 | DEBUG    | __main__:trials:29 - Trial = 20394/30000 | Total reward = 39.23
2022-01-26 14:18:05.002 | DEBUG    | __main__:trials:24 - Trial = 20395/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.003 | DEBUG    | __main__:trials:29 - Trial = 20395/30000 | Total reward = 46.44
2022-01-26 14:18:05.007 | DEBUG    | __main__:trials:24 - Trial = 20396/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.008 | DEBUG    | __main__:trials:29 - Trial = 20396/30000 | Total reward = 37.54
2022-01-26 14:18:05.011 | DEBUG    | __main__:trials:26 - Trial = 20397/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.012 | DEBUG    | __main__:trials:29 - Trial = 20397/30000 | Total reward = 16.21
2022-01-26 14:18:05.015 | DEBUG    | __main__:trials:26 - Trial = 20398/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.017 | DEBUG    | __main__:trials:29 - Trial = 20398/30000 | Total reward = 15.92
2022-01-26 14:18:05.020 | DEBUG    | __main__:trials:24 - Trial = 20399/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.021 | DEBUG    | __main__:trials:29 - Trial = 20399/30000 | Total reward = 44.61
2022-01-26 14:18:05.026 | DEBUG    | __main__:trials:24 - Trial = 20400/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.026 | DEBUG    | __main__:trials:29 - Trial = 20400/30000 | Total reward = 49.21
2022-01-26 14:18:05.031 | DEBUG    | __main__:trials:24 - Trial = 20401/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.032 | DEBUG    | __main__:trials:29 - Trial = 20401/30000 | Total reward = 41.96
2022-01-26 14:18:05.036 | DEBUG    | __main__:trials:24 - Trial = 20402/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.038 | DEBUG    | __main__:trials:29 - Trial = 20402/30000 | Total reward = 36.57
2022-01-26 14:18:05.042 | DEBUG    | __main__:trials:24 - Trial = 20403/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.043 | DEBUG    | __main__:trials:29 - Trial = 20403/30000 | Total reward = 41.85
2022-01-26 14:18:05.047 | DEBUG    | __main__:trials:24 - Trial = 20404/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.048 | DEBUG    | __main__:trials:29 - Trial = 20404/30000 | Total reward = 39.85
2022-01-26 14:18:05.052 | DEBUG    | __main__:trials:24 - Trial = 20405/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.054 | DEBUG    | __main__:trials:29 - Trial = 20405/30000 | Total reward = 43.91
2022-01-26 14:18:05.057 | DEBUG    | __main__:trials:24 - Trial = 20406/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.059 | DEBUG    | __main__:trials:29 - Trial = 20406/30000 | Total reward = 45.26
2022-01-26 14:18:05.062 | DEBUG    | __main__:trials:24 - Trial = 20407/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.064 | DEBUG    | __main__:trials:29 - Trial = 20407/30000 | Total reward = 58.03
2022-01-26 14:18:05.068 | DEBUG    | __main__:trials:24 - Trial = 20408/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.069 | DEBUG    | __main__:trials:29 - Trial = 20408/30000 | Total reward = 49.41
2022-01-26 14:18:05.073 | DEBUG    | __main__:trials:24 - Trial = 20409/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.075 | DEBUG    | __main__:trials:29 - Trial = 20409/30000 | Total reward = 39.39
2022-01-26 14:18:05.079 | DEBUG    | __main__:trials:24 - Trial = 20410/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.079 | DEBUG    | __main__:trials:29 - Trial = 20410/30000 | Total reward = 39.69
2022-01-26 14:18:05.083 | DEBUG    | __main__:trials:24 - Trial = 20411/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.084 | DEBUG    | __main__:trials:29 - Trial = 20411/30000 | Total reward = 46.67
2022-01-26 14:18:05.088 | DEBUG    | __main__:trials:24 - Trial = 20412/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.090 | DEBUG    | __main__:trials:29 - Trial = 20412/30000 | Total reward = 44.21
2022-01-26 14:18:05.093 | DEBUG    | __main__:trials:24 - Trial = 20413/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.095 | DEBUG    | __main__:trials:29 - Trial = 20413/30000 | Total reward = 39.52
2022-01-26 14:18:05.099 | DEBUG    | __main__:trials:24 - Trial = 20414/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.099 | DEBUG    | __main__:trials:29 - Trial = 20414/30000 | Total reward = 44.93
2022-01-26 14:18:05.104 | DEBUG    | __main__:trials:24 - Trial = 20415/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.106 | DEBUG    | __main__:trials:29 - Trial = 20415/30000 | Total reward = 39.57
2022-01-26 14:18:05.109 | DEBUG    | __main__:trials:24 - Trial = 20416/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.110 | DEBUG    | __main__:trials:29 - Trial = 20416/30000 | Total reward = 36.73
2022-01-26 14:18:05.114 | DEBUG    | __main__:trials:24 - Trial = 20417/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.116 | DEBUG    | __main__:trials:29 - Trial = 20417/30000 | Total reward = 37.52
2022-01-26 14:18:05.119 | DEBUG    | __main__:trials:24 - Trial = 20418/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.121 | DEBUG    | __main__:trials:29 - Trial = 20418/30000 | Total reward = 44.16
2022-01-26 14:18:05.124 | DEBUG    | __main__:trials:24 - Trial = 20419/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.126 | DEBUG    | __main__:trials:29 - Trial = 20419/30000 | Total reward = 37.80
2022-01-26 14:18:05.129 | DEBUG    | __main__:trials:24 - Trial = 20420/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.131 | DEBUG    | __main__:trials:29 - Trial = 20420/30000 | Total reward = 48.03
2022-01-26 14:18:05.134 | DEBUG    | __main__:trials:24 - Trial = 20421/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.136 | DEBUG    | __main__:trials:29 - Trial = 20421/30000 | Total reward = 40.05
2022-01-26 14:18:05.140 | DEBUG    | __main__:trials:24 - Trial = 20422/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.141 | DEBUG    | __main__:trials:29 - Trial = 20422/30000 | Total reward = 51.62
2022-01-26 14:18:05.145 | DEBUG    | __main__:trials:24 - Trial = 20423/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.146 | DEBUG    | __main__:trials:29 - Trial = 20423/30000 | Total reward = 28.91
2022-01-26 14:18:05.150 | DEBUG    | __main__:trials:24 - Trial = 20424/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.151 | DEBUG    | __main__:trials:29 - Trial = 20424/30000 | Total reward = 26.53
2022-01-26 14:18:05.156 | DEBUG    | __main__:trials:24 - Trial = 20425/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.156 | DEBUG    | __main__:trials:29 - Trial = 20425/30000 | Total reward = 52.99
2022-01-26 14:18:05.161 | DEBUG    | __main__:trials:24 - Trial = 20426/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.161 | DEBUG    | __main__:trials:29 - Trial = 20426/30000 | Total reward = 52.93
2022-01-26 14:18:05.165 | DEBUG    | __main__:trials:24 - Trial = 20427/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.166 | DEBUG    | __main__:trials:29 - Trial = 20427/30000 | Total reward = 38.83
2022-01-26 14:18:05.169 | DEBUG    | __main__:trials:24 - Trial = 20428/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.171 | DEBUG    | __main__:trials:29 - Trial = 20428/30000 | Total reward = 51.16
2022-01-26 14:18:05.175 | DEBUG    | __main__:trials:24 - Trial = 20429/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.175 | DEBUG    | __main__:trials:29 - Trial = 20429/30000 | Total reward = 46.80
2022-01-26 14:18:05.180 | DEBUG    | __main__:trials:24 - Trial = 20430/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.181 | DEBUG    | __main__:trials:29 - Trial = 20430/30000 | Total reward = 39.57
2022-01-26 14:18:05.185 | DEBUG    | __main__:trials:24 - Trial = 20431/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.186 | DEBUG    | __main__:trials:29 - Trial = 20431/30000 | Total reward = 37.55
2022-01-26 14:18:05.189 | DEBUG    | __main__:trials:24 - Trial = 20432/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.190 | DEBUG    | __main__:trials:29 - Trial = 20432/30000 | Total reward = 40.64
2022-01-26 14:18:05.193 | DEBUG    | __main__:trials:24 - Trial = 20433/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.195 | DEBUG    | __main__:trials:29 - Trial = 20433/30000 | Total reward = 31.14
2022-01-26 14:18:05.198 | DEBUG    | __main__:trials:24 - Trial = 20434/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.200 | DEBUG    | __main__:trials:29 - Trial = 20434/30000 | Total reward = 46.80
2022-01-26 14:18:05.204 | DEBUG    | __main__:trials:24 - Trial = 20435/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.204 | DEBUG    | __main__:trials:29 - Trial = 20435/30000 | Total reward = 35.03
2022-01-26 14:18:05.209 | DEBUG    | __main__:trials:24 - Trial = 20436/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.211 | DEBUG    | __main__:trials:29 - Trial = 20436/30000 | Total reward = 31.52
2022-01-26 14:18:05.214 | DEBUG    | __main__:trials:24 - Trial = 20437/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.215 | DEBUG    | __main__:trials:29 - Trial = 20437/30000 | Total reward = 40.42
2022-01-26 14:18:05.218 | DEBUG    | __main__:trials:24 - Trial = 20438/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.220 | DEBUG    | __main__:trials:29 - Trial = 20438/30000 | Total reward = 60.43
2022-01-26 14:18:05.224 | DEBUG    | __main__:trials:24 - Trial = 20439/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.225 | DEBUG    | __main__:trials:29 - Trial = 20439/30000 | Total reward = 42.44
2022-01-26 14:18:05.228 | DEBUG    | __main__:trials:24 - Trial = 20440/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.230 | DEBUG    | __main__:trials:29 - Trial = 20440/30000 | Total reward = 48.70
2022-01-26 14:18:05.234 | DEBUG    | __main__:trials:24 - Trial = 20441/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.235 | DEBUG    | __main__:trials:29 - Trial = 20441/30000 | Total reward = 39.57
2022-01-26 14:18:05.239 | DEBUG    | __main__:trials:24 - Trial = 20442/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.241 | DEBUG    | __main__:trials:29 - Trial = 20442/30000 | Total reward = 24.52
2022-01-26 14:18:05.244 | DEBUG    | __main__:trials:26 - Trial = 20443/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.245 | DEBUG    | __main__:trials:29 - Trial = 20443/30000 | Total reward = 25.52
2022-01-26 14:18:05.249 | DEBUG    | __main__:trials:24 - Trial = 20444/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.250 | DEBUG    | __main__:trials:29 - Trial = 20444/30000 | Total reward = 36.62
2022-01-26 14:18:05.254 | DEBUG    | __main__:trials:24 - Trial = 20445/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.256 | DEBUG    | __main__:trials:29 - Trial = 20445/30000 | Total reward = 38.37
2022-01-26 14:18:05.259 | DEBUG    | __main__:trials:24 - Trial = 20446/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.261 | DEBUG    | __main__:trials:29 - Trial = 20446/30000 | Total reward = 40.92
2022-01-26 14:18:05.264 | DEBUG    | __main__:trials:24 - Trial = 20447/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.266 | DEBUG    | __main__:trials:29 - Trial = 20447/30000 | Total reward = 37.43
2022-01-26 14:18:05.269 | DEBUG    | __main__:trials:24 - Trial = 20448/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.270 | DEBUG    | __main__:trials:29 - Trial = 20448/30000 | Total reward = 53.08
2022-01-26 14:18:05.274 | DEBUG    | __main__:trials:26 - Trial = 20449/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.276 | DEBUG    | __main__:trials:29 - Trial = 20449/30000 | Total reward = 40.42
2022-01-26 14:18:05.279 | DEBUG    | __main__:trials:26 - Trial = 20450/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.280 | DEBUG    | __main__:trials:29 - Trial = 20450/30000 | Total reward = 31.83
2022-01-26 14:18:05.284 | DEBUG    | __main__:trials:24 - Trial = 20451/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.285 | DEBUG    | __main__:trials:29 - Trial = 20451/30000 | Total reward = 37.67
2022-01-26 14:18:05.288 | DEBUG    | __main__:trials:24 - Trial = 20452/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.289 | DEBUG    | __main__:trials:29 - Trial = 20452/30000 | Total reward = 36.75
2022-01-26 14:18:05.293 | DEBUG    | __main__:trials:24 - Trial = 20453/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.294 | DEBUG    | __main__:trials:29 - Trial = 20453/30000 | Total reward = 52.91
2022-01-26 14:18:05.298 | DEBUG    | __main__:trials:24 - Trial = 20454/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.299 | DEBUG    | __main__:trials:29 - Trial = 20454/30000 | Total reward = 35.69
2022-01-26 14:18:05.302 | DEBUG    | __main__:trials:24 - Trial = 20455/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.304 | DEBUG    | __main__:trials:29 - Trial = 20455/30000 | Total reward = 37.20
2022-01-26 14:18:05.308 | DEBUG    | __main__:trials:24 - Trial = 20456/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.309 | DEBUG    | __main__:trials:29 - Trial = 20456/30000 | Total reward = 38.74
2022-01-26 14:18:05.313 | DEBUG    | __main__:trials:24 - Trial = 20457/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.315 | DEBUG    | __main__:trials:29 - Trial = 20457/30000 | Total reward = 49.32
2022-01-26 14:18:05.318 | DEBUG    | __main__:trials:24 - Trial = 20458/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.320 | DEBUG    | __main__:trials:29 - Trial = 20458/30000 | Total reward = 36.96
2022-01-26 14:18:05.323 | DEBUG    | __main__:trials:24 - Trial = 20459/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.324 | DEBUG    | __main__:trials:29 - Trial = 20459/30000 | Total reward = 50.88
2022-01-26 14:18:05.328 | DEBUG    | __main__:trials:24 - Trial = 20460/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.330 | DEBUG    | __main__:trials:29 - Trial = 20460/30000 | Total reward = 43.62
2022-01-26 14:18:05.334 | DEBUG    | __main__:trials:24 - Trial = 20461/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.334 | DEBUG    | __main__:trials:29 - Trial = 20461/30000 | Total reward = 41.37
2022-01-26 14:18:05.338 | DEBUG    | __main__:trials:24 - Trial = 20462/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.340 | DEBUG    | __main__:trials:29 - Trial = 20462/30000 | Total reward = 33.70
2022-01-26 14:18:05.343 | DEBUG    | __main__:trials:24 - Trial = 20463/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.345 | DEBUG    | __main__:trials:29 - Trial = 20463/30000 | Total reward = 50.28
2022-01-26 14:18:05.348 | DEBUG    | __main__:trials:24 - Trial = 20464/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.349 | DEBUG    | __main__:trials:29 - Trial = 20464/30000 | Total reward = 23.51
2022-01-26 14:18:05.353 | DEBUG    | __main__:trials:24 - Trial = 20465/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.355 | DEBUG    | __main__:trials:29 - Trial = 20465/30000 | Total reward = 36.20
2022-01-26 14:18:05.359 | DEBUG    | __main__:trials:24 - Trial = 20466/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.360 | DEBUG    | __main__:trials:29 - Trial = 20466/30000 | Total reward = 44.27
2022-01-26 14:18:05.363 | DEBUG    | __main__:trials:24 - Trial = 20467/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.365 | DEBUG    | __main__:trials:29 - Trial = 20467/30000 | Total reward = 38.26
2022-01-26 14:18:05.369 | DEBUG    | __main__:trials:24 - Trial = 20468/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.371 | DEBUG    | __main__:trials:29 - Trial = 20468/30000 | Total reward = 37.27
2022-01-26 14:18:05.374 | DEBUG    | __main__:trials:24 - Trial = 20469/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.376 | DEBUG    | __main__:trials:29 - Trial = 20469/30000 | Total reward = 34.99
2022-01-26 14:18:05.379 | DEBUG    | __main__:trials:24 - Trial = 20470/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.380 | DEBUG    | __main__:trials:29 - Trial = 20470/30000 | Total reward = 51.30
2022-01-26 14:18:05.385 | DEBUG    | __main__:trials:24 - Trial = 20471/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.387 | DEBUG    | __main__:trials:29 - Trial = 20471/30000 | Total reward = 44.35
2022-01-26 14:18:05.390 | DEBUG    | __main__:trials:24 - Trial = 20472/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.392 | DEBUG    | __main__:trials:29 - Trial = 20472/30000 | Total reward = 37.47
2022-01-26 14:18:05.396 | DEBUG    | __main__:trials:24 - Trial = 20473/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.396 | DEBUG    | __main__:trials:29 - Trial = 20473/30000 | Total reward = 53.64
2022-01-26 14:18:05.400 | DEBUG    | __main__:trials:24 - Trial = 20474/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.402 | DEBUG    | __main__:trials:29 - Trial = 20474/30000 | Total reward = 39.42
2022-01-26 14:18:05.406 | DEBUG    | __main__:trials:24 - Trial = 20475/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.406 | DEBUG    | __main__:trials:29 - Trial = 20475/30000 | Total reward = 54.60
2022-01-26 14:18:05.411 | DEBUG    | __main__:trials:24 - Trial = 20476/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.412 | DEBUG    | __main__:trials:29 - Trial = 20476/30000 | Total reward = 49.34
2022-01-26 14:18:05.416 | DEBUG    | __main__:trials:24 - Trial = 20477/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.417 | DEBUG    | __main__:trials:29 - Trial = 20477/30000 | Total reward = 39.77
2022-01-26 14:18:05.421 | DEBUG    | __main__:trials:24 - Trial = 20478/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.423 | DEBUG    | __main__:trials:29 - Trial = 20478/30000 | Total reward = 37.25
2022-01-26 14:18:05.426 | DEBUG    | __main__:trials:24 - Trial = 20479/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.428 | DEBUG    | __main__:trials:29 - Trial = 20479/30000 | Total reward = 41.00
2022-01-26 14:18:05.431 | DEBUG    | __main__:trials:24 - Trial = 20480/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.433 | DEBUG    | __main__:trials:29 - Trial = 20480/30000 | Total reward = 45.84
2022-01-26 14:18:05.436 | DEBUG    | __main__:trials:24 - Trial = 20481/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.438 | DEBUG    | __main__:trials:29 - Trial = 20481/30000 | Total reward = 43.81
2022-01-26 14:18:05.442 | DEBUG    | __main__:trials:24 - Trial = 20482/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.442 | DEBUG    | __main__:trials:29 - Trial = 20482/30000 | Total reward = 43.55
2022-01-26 14:18:05.446 | DEBUG    | __main__:trials:24 - Trial = 20483/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.447 | DEBUG    | __main__:trials:29 - Trial = 20483/30000 | Total reward = 55.34
2022-01-26 14:18:05.451 | DEBUG    | __main__:trials:24 - Trial = 20484/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.453 | DEBUG    | __main__:trials:29 - Trial = 20484/30000 | Total reward = 37.46
2022-01-26 14:18:05.455 | DEBUG    | __main__:trials:26 - Trial = 20485/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.457 | DEBUG    | __main__:trials:29 - Trial = 20485/30000 | Total reward = 31.01
2022-01-26 14:18:05.460 | DEBUG    | __main__:trials:24 - Trial = 20486/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.462 | DEBUG    | __main__:trials:29 - Trial = 20486/30000 | Total reward = 39.26
2022-01-26 14:18:05.466 | DEBUG    | __main__:trials:24 - Trial = 20487/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.466 | DEBUG    | __main__:trials:29 - Trial = 20487/30000 | Total reward = 44.50
2022-01-26 14:18:05.471 | DEBUG    | __main__:trials:24 - Trial = 20488/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.471 | DEBUG    | __main__:trials:29 - Trial = 20488/30000 | Total reward = 34.25
2022-01-26 14:18:05.475 | DEBUG    | __main__:trials:24 - Trial = 20489/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.476 | DEBUG    | __main__:trials:29 - Trial = 20489/30000 | Total reward = 55.26
2022-01-26 14:18:05.480 | DEBUG    | __main__:trials:24 - Trial = 20490/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.481 | DEBUG    | __main__:trials:29 - Trial = 20490/30000 | Total reward = 42.15
2022-01-26 14:18:05.484 | DEBUG    | __main__:trials:24 - Trial = 20491/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.485 | DEBUG    | __main__:trials:29 - Trial = 20491/30000 | Total reward = 36.98
2022-01-26 14:18:05.489 | DEBUG    | __main__:trials:24 - Trial = 20492/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.489 | DEBUG    | __main__:trials:29 - Trial = 20492/30000 | Total reward = 41.05
2022-01-26 14:18:05.493 | DEBUG    | __main__:trials:24 - Trial = 20493/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.494 | DEBUG    | __main__:trials:29 - Trial = 20493/30000 | Total reward = 38.01
2022-01-26 14:18:05.497 | DEBUG    | __main__:trials:24 - Trial = 20494/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.498 | DEBUG    | __main__:trials:29 - Trial = 20494/30000 | Total reward = 37.97
2022-01-26 14:18:05.501 | DEBUG    | __main__:trials:24 - Trial = 20495/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.502 | DEBUG    | __main__:trials:29 - Trial = 20495/30000 | Total reward = 41.68
2022-01-26 14:18:05.506 | DEBUG    | __main__:trials:24 - Trial = 20496/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.506 | DEBUG    | __main__:trials:29 - Trial = 20496/30000 | Total reward = 45.53
2022-01-26 14:18:05.510 | DEBUG    | __main__:trials:24 - Trial = 20497/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.511 | DEBUG    | __main__:trials:29 - Trial = 20497/30000 | Total reward = 43.27
2022-01-26 14:18:05.515 | DEBUG    | __main__:trials:24 - Trial = 20498/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.516 | DEBUG    | __main__:trials:29 - Trial = 20498/30000 | Total reward = 35.03
2022-01-26 14:18:05.519 | DEBUG    | __main__:trials:24 - Trial = 20499/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.521 | DEBUG    | __main__:trials:29 - Trial = 20499/30000 | Total reward = 38.69
2022-01-26 14:18:05.524 | DEBUG    | __main__:trials:24 - Trial = 20500/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.526 | DEBUG    | __main__:trials:29 - Trial = 20500/30000 | Total reward = 37.36
2022-01-26 14:18:05.529 | DEBUG    | __main__:trials:24 - Trial = 20501/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.530 | DEBUG    | __main__:trials:29 - Trial = 20501/30000 | Total reward = 37.20
2022-01-26 14:18:05.535 | DEBUG    | __main__:trials:24 - Trial = 20502/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.536 | DEBUG    | __main__:trials:29 - Trial = 20502/30000 | Total reward = 33.29
2022-01-26 14:18:05.540 | DEBUG    | __main__:trials:24 - Trial = 20503/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.541 | DEBUG    | __main__:trials:29 - Trial = 20503/30000 | Total reward = 46.76
2022-01-26 14:18:05.544 | DEBUG    | __main__:trials:24 - Trial = 20504/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.546 | DEBUG    | __main__:trials:29 - Trial = 20504/30000 | Total reward = 39.16
2022-01-26 14:18:05.549 | DEBUG    | __main__:trials:24 - Trial = 20505/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.551 | DEBUG    | __main__:trials:29 - Trial = 20505/30000 | Total reward = 45.86
2022-01-26 14:18:05.555 | DEBUG    | __main__:trials:24 - Trial = 20506/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.557 | DEBUG    | __main__:trials:29 - Trial = 20506/30000 | Total reward = 48.12
2022-01-26 14:18:05.560 | DEBUG    | __main__:trials:24 - Trial = 20507/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.562 | DEBUG    | __main__:trials:29 - Trial = 20507/30000 | Total reward = 51.64
2022-01-26 14:18:05.567 | DEBUG    | __main__:trials:24 - Trial = 20508/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.568 | DEBUG    | __main__:trials:29 - Trial = 20508/30000 | Total reward = 48.62
2022-01-26 14:18:05.572 | DEBUG    | __main__:trials:24 - Trial = 20509/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.573 | DEBUG    | __main__:trials:29 - Trial = 20509/30000 | Total reward = 42.51
2022-01-26 14:18:05.577 | DEBUG    | __main__:trials:24 - Trial = 20510/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.578 | DEBUG    | __main__:trials:29 - Trial = 20510/30000 | Total reward = 44.31
2022-01-26 14:18:05.581 | DEBUG    | __main__:trials:24 - Trial = 20511/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.583 | DEBUG    | __main__:trials:29 - Trial = 20511/30000 | Total reward = 38.03
2022-01-26 14:18:05.587 | DEBUG    | __main__:trials:24 - Trial = 20512/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.588 | DEBUG    | __main__:trials:29 - Trial = 20512/30000 | Total reward = 51.46
2022-01-26 14:18:05.591 | DEBUG    | __main__:trials:24 - Trial = 20513/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.593 | DEBUG    | __main__:trials:29 - Trial = 20513/30000 | Total reward = 39.40
2022-01-26 14:18:05.597 | DEBUG    | __main__:trials:24 - Trial = 20514/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.598 | DEBUG    | __main__:trials:29 - Trial = 20514/30000 | Total reward = 41.00
2022-01-26 14:18:05.603 | DEBUG    | __main__:trials:24 - Trial = 20515/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.604 | DEBUG    | __main__:trials:29 - Trial = 20515/30000 | Total reward = 38.38
2022-01-26 14:18:05.608 | DEBUG    | __main__:trials:24 - Trial = 20516/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.610 | DEBUG    | __main__:trials:29 - Trial = 20516/30000 | Total reward = 35.94
2022-01-26 14:18:05.613 | DEBUG    | __main__:trials:24 - Trial = 20517/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.614 | DEBUG    | __main__:trials:29 - Trial = 20517/30000 | Total reward = 51.51
2022-01-26 14:18:05.619 | DEBUG    | __main__:trials:24 - Trial = 20518/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.619 | DEBUG    | __main__:trials:29 - Trial = 20518/30000 | Total reward = 39.57
2022-01-26 14:18:05.624 | DEBUG    | __main__:trials:24 - Trial = 20519/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.625 | DEBUG    | __main__:trials:29 - Trial = 20519/30000 | Total reward = 40.61
2022-01-26 14:18:05.629 | DEBUG    | __main__:trials:24 - Trial = 20520/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.630 | DEBUG    | __main__:trials:29 - Trial = 20520/30000 | Total reward = 50.46
2022-01-26 14:18:05.633 | DEBUG    | __main__:trials:24 - Trial = 20521/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.634 | DEBUG    | __main__:trials:29 - Trial = 20521/30000 | Total reward = 34.27
2022-01-26 14:18:05.637 | DEBUG    | __main__:trials:24 - Trial = 20522/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.639 | DEBUG    | __main__:trials:29 - Trial = 20522/30000 | Total reward = 46.08
2022-01-26 14:18:05.642 | DEBUG    | __main__:trials:24 - Trial = 20523/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.643 | DEBUG    | __main__:trials:29 - Trial = 20523/30000 | Total reward = 39.30
2022-01-26 14:18:05.646 | DEBUG    | __main__:trials:26 - Trial = 20524/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.648 | DEBUG    | __main__:trials:29 - Trial = 20524/30000 | Total reward = 22.28
2022-01-26 14:18:05.652 | DEBUG    | __main__:trials:24 - Trial = 20525/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.652 | DEBUG    | __main__:trials:29 - Trial = 20525/30000 | Total reward = 32.58
2022-01-26 14:18:05.656 | DEBUG    | __main__:trials:24 - Trial = 20526/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.657 | DEBUG    | __main__:trials:29 - Trial = 20526/30000 | Total reward = 56.70
2022-01-26 14:18:05.661 | DEBUG    | __main__:trials:24 - Trial = 20527/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.661 | DEBUG    | __main__:trials:29 - Trial = 20527/30000 | Total reward = 43.81
2022-01-26 14:18:05.665 | DEBUG    | __main__:trials:24 - Trial = 20528/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.666 | DEBUG    | __main__:trials:29 - Trial = 20528/30000 | Total reward = 41.82
2022-01-26 14:18:05.669 | DEBUG    | __main__:trials:24 - Trial = 20529/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.670 | DEBUG    | __main__:trials:29 - Trial = 20529/30000 | Total reward = 34.96
2022-01-26 14:18:05.673 | DEBUG    | __main__:trials:26 - Trial = 20530/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.675 | DEBUG    | __main__:trials:29 - Trial = 20530/30000 | Total reward = 20.82
2022-01-26 14:18:05.679 | DEBUG    | __main__:trials:24 - Trial = 20531/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.680 | DEBUG    | __main__:trials:29 - Trial = 20531/30000 | Total reward = 36.25
2022-01-26 14:18:05.684 | DEBUG    | __main__:trials:24 - Trial = 20532/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.685 | DEBUG    | __main__:trials:29 - Trial = 20532/30000 | Total reward = 42.60
2022-01-26 14:18:05.689 | DEBUG    | __main__:trials:24 - Trial = 20533/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.690 | DEBUG    | __main__:trials:29 - Trial = 20533/30000 | Total reward = 51.06
2022-01-26 14:18:05.694 | DEBUG    | __main__:trials:24 - Trial = 20534/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.695 | DEBUG    | __main__:trials:29 - Trial = 20534/30000 | Total reward = 46.17
2022-01-26 14:18:05.700 | DEBUG    | __main__:trials:24 - Trial = 20535/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.701 | DEBUG    | __main__:trials:29 - Trial = 20535/30000 | Total reward = 37.41
2022-01-26 14:18:05.705 | DEBUG    | __main__:trials:24 - Trial = 20536/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.706 | DEBUG    | __main__:trials:29 - Trial = 20536/30000 | Total reward = 37.25
2022-01-26 14:18:05.709 | DEBUG    | __main__:trials:24 - Trial = 20537/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.711 | DEBUG    | __main__:trials:29 - Trial = 20537/30000 | Total reward = 37.54
2022-01-26 14:18:05.713 | DEBUG    | __main__:trials:24 - Trial = 20538/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.714 | DEBUG    | __main__:trials:29 - Trial = 20538/30000 | Total reward = 37.44
2022-01-26 14:18:05.717 | DEBUG    | __main__:trials:24 - Trial = 20539/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.719 | DEBUG    | __main__:trials:29 - Trial = 20539/30000 | Total reward = 39.21
2022-01-26 14:18:05.723 | DEBUG    | __main__:trials:24 - Trial = 20540/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.725 | DEBUG    | __main__:trials:29 - Trial = 20540/30000 | Total reward = 38.75
2022-01-26 14:18:05.728 | DEBUG    | __main__:trials:24 - Trial = 20541/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.729 | DEBUG    | __main__:trials:29 - Trial = 20541/30000 | Total reward = 35.52
2022-01-26 14:18:05.732 | DEBUG    | __main__:trials:24 - Trial = 20542/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.734 | DEBUG    | __main__:trials:29 - Trial = 20542/30000 | Total reward = 37.27
2022-01-26 14:18:05.737 | DEBUG    | __main__:trials:24 - Trial = 20543/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.738 | DEBUG    | __main__:trials:29 - Trial = 20543/30000 | Total reward = 41.24
2022-01-26 14:18:05.741 | DEBUG    | __main__:trials:24 - Trial = 20544/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.742 | DEBUG    | __main__:trials:29 - Trial = 20544/30000 | Total reward = 40.11
2022-01-26 14:18:05.745 | DEBUG    | __main__:trials:24 - Trial = 20545/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.746 | DEBUG    | __main__:trials:29 - Trial = 20545/30000 | Total reward = 41.86
2022-01-26 14:18:05.750 | DEBUG    | __main__:trials:24 - Trial = 20546/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.750 | DEBUG    | __main__:trials:29 - Trial = 20546/30000 | Total reward = 39.21
2022-01-26 14:18:05.754 | DEBUG    | __main__:trials:24 - Trial = 20547/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.754 | DEBUG    | __main__:trials:29 - Trial = 20547/30000 | Total reward = 52.60
2022-01-26 14:18:05.758 | DEBUG    | __main__:trials:24 - Trial = 20548/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.759 | DEBUG    | __main__:trials:29 - Trial = 20548/30000 | Total reward = 34.40
2022-01-26 14:18:05.762 | DEBUG    | __main__:trials:24 - Trial = 20549/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.764 | DEBUG    | __main__:trials:29 - Trial = 20549/30000 | Total reward = 45.28
2022-01-26 14:18:05.767 | DEBUG    | __main__:trials:24 - Trial = 20550/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.769 | DEBUG    | __main__:trials:29 - Trial = 20550/30000 | Total reward = 45.97
2022-01-26 14:18:05.772 | DEBUG    | __main__:trials:24 - Trial = 20551/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.773 | DEBUG    | __main__:trials:29 - Trial = 20551/30000 | Total reward = 33.56
2022-01-26 14:18:05.777 | DEBUG    | __main__:trials:24 - Trial = 20552/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.778 | DEBUG    | __main__:trials:29 - Trial = 20552/30000 | Total reward = 37.38
2022-01-26 14:18:05.782 | DEBUG    | __main__:trials:24 - Trial = 20553/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.784 | DEBUG    | __main__:trials:29 - Trial = 20553/30000 | Total reward = 41.62
2022-01-26 14:18:05.788 | DEBUG    | __main__:trials:24 - Trial = 20554/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.788 | DEBUG    | __main__:trials:29 - Trial = 20554/30000 | Total reward = 32.94
2022-01-26 14:18:05.792 | DEBUG    | __main__:trials:24 - Trial = 20555/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.794 | DEBUG    | __main__:trials:29 - Trial = 20555/30000 | Total reward = 36.68
2022-01-26 14:18:05.798 | DEBUG    | __main__:trials:24 - Trial = 20556/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.799 | DEBUG    | __main__:trials:29 - Trial = 20556/30000 | Total reward = 55.50
2022-01-26 14:18:05.803 | DEBUG    | __main__:trials:24 - Trial = 20557/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.804 | DEBUG    | __main__:trials:29 - Trial = 20557/30000 | Total reward = 45.26
2022-01-26 14:18:05.807 | DEBUG    | __main__:trials:24 - Trial = 20558/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.809 | DEBUG    | __main__:trials:29 - Trial = 20558/30000 | Total reward = 39.17
2022-01-26 14:18:05.812 | DEBUG    | __main__:trials:24 - Trial = 20559/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.814 | DEBUG    | __main__:trials:29 - Trial = 20559/30000 | Total reward = 36.35
2022-01-26 14:18:05.818 | DEBUG    | __main__:trials:24 - Trial = 20560/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.820 | DEBUG    | __main__:trials:29 - Trial = 20560/30000 | Total reward = 42.22
2022-01-26 14:18:05.823 | DEBUG    | __main__:trials:24 - Trial = 20561/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.825 | DEBUG    | __main__:trials:29 - Trial = 20561/30000 | Total reward = 50.00
2022-01-26 14:18:05.828 | DEBUG    | __main__:trials:24 - Trial = 20562/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.829 | DEBUG    | __main__:trials:29 - Trial = 20562/30000 | Total reward = 38.30
2022-01-26 14:18:05.833 | DEBUG    | __main__:trials:24 - Trial = 20563/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.834 | DEBUG    | __main__:trials:29 - Trial = 20563/30000 | Total reward = 45.71
2022-01-26 14:18:05.838 | DEBUG    | __main__:trials:24 - Trial = 20564/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.839 | DEBUG    | __main__:trials:29 - Trial = 20564/30000 | Total reward = 55.45
2022-01-26 14:18:05.843 | DEBUG    | __main__:trials:24 - Trial = 20565/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.845 | DEBUG    | __main__:trials:29 - Trial = 20565/30000 | Total reward = 51.57
2022-01-26 14:18:05.849 | DEBUG    | __main__:trials:24 - Trial = 20566/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.850 | DEBUG    | __main__:trials:29 - Trial = 20566/30000 | Total reward = 33.18
2022-01-26 14:18:05.854 | DEBUG    | __main__:trials:24 - Trial = 20567/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.855 | DEBUG    | __main__:trials:29 - Trial = 20567/30000 | Total reward = 37.55
2022-01-26 14:18:05.859 | DEBUG    | __main__:trials:24 - Trial = 20568/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.860 | DEBUG    | __main__:trials:29 - Trial = 20568/30000 | Total reward = 46.40
2022-01-26 14:18:05.864 | DEBUG    | __main__:trials:24 - Trial = 20569/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.865 | DEBUG    | __main__:trials:29 - Trial = 20569/30000 | Total reward = 53.01
2022-01-26 14:18:05.869 | DEBUG    | __main__:trials:24 - Trial = 20570/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.870 | DEBUG    | __main__:trials:29 - Trial = 20570/30000 | Total reward = 35.56
2022-01-26 14:18:05.873 | DEBUG    | __main__:trials:26 - Trial = 20571/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:05.874 | DEBUG    | __main__:trials:29 - Trial = 20571/30000 | Total reward = 13.67
2022-01-26 14:18:05.878 | DEBUG    | __main__:trials:24 - Trial = 20572/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.880 | DEBUG    | __main__:trials:29 - Trial = 20572/30000 | Total reward = 42.98
2022-01-26 14:18:05.883 | DEBUG    | __main__:trials:24 - Trial = 20573/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.884 | DEBUG    | __main__:trials:29 - Trial = 20573/30000 | Total reward = 58.83
2022-01-26 14:18:05.888 | DEBUG    | __main__:trials:24 - Trial = 20574/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.889 | DEBUG    | __main__:trials:29 - Trial = 20574/30000 | Total reward = 47.52
2022-01-26 14:18:05.894 | DEBUG    | __main__:trials:24 - Trial = 20575/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.894 | DEBUG    | __main__:trials:29 - Trial = 20575/30000 | Total reward = 59.50
2022-01-26 14:18:05.899 | DEBUG    | __main__:trials:24 - Trial = 20576/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.900 | DEBUG    | __main__:trials:29 - Trial = 20576/30000 | Total reward = 56.44
2022-01-26 14:18:05.904 | DEBUG    | __main__:trials:24 - Trial = 20577/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.906 | DEBUG    | __main__:trials:29 - Trial = 20577/30000 | Total reward = 47.79
2022-01-26 14:18:05.909 | DEBUG    | __main__:trials:24 - Trial = 20578/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.911 | DEBUG    | __main__:trials:29 - Trial = 20578/30000 | Total reward = 39.48
2022-01-26 14:18:05.914 | DEBUG    | __main__:trials:24 - Trial = 20579/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.916 | DEBUG    | __main__:trials:29 - Trial = 20579/30000 | Total reward = 55.01
2022-01-26 14:18:05.920 | DEBUG    | __main__:trials:24 - Trial = 20580/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.921 | DEBUG    | __main__:trials:29 - Trial = 20580/30000 | Total reward = 47.28
2022-01-26 14:18:05.925 | DEBUG    | __main__:trials:24 - Trial = 20581/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.926 | DEBUG    | __main__:trials:29 - Trial = 20581/30000 | Total reward = 47.07
2022-01-26 14:18:05.929 | DEBUG    | __main__:trials:24 - Trial = 20582/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.930 | DEBUG    | __main__:trials:29 - Trial = 20582/30000 | Total reward = 49.22
2022-01-26 14:18:05.933 | DEBUG    | __main__:trials:24 - Trial = 20583/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.935 | DEBUG    | __main__:trials:29 - Trial = 20583/30000 | Total reward = 38.80
2022-01-26 14:18:05.938 | DEBUG    | __main__:trials:24 - Trial = 20584/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.940 | DEBUG    | __main__:trials:29 - Trial = 20584/30000 | Total reward = 38.51
2022-01-26 14:18:05.944 | DEBUG    | __main__:trials:24 - Trial = 20585/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.945 | DEBUG    | __main__:trials:29 - Trial = 20585/30000 | Total reward = 33.57
2022-01-26 14:18:05.949 | DEBUG    | __main__:trials:24 - Trial = 20586/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.951 | DEBUG    | __main__:trials:29 - Trial = 20586/30000 | Total reward = 49.76
2022-01-26 14:18:05.955 | DEBUG    | __main__:trials:24 - Trial = 20587/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.956 | DEBUG    | __main__:trials:29 - Trial = 20587/30000 | Total reward = 45.39
2022-01-26 14:18:05.960 | DEBUG    | __main__:trials:24 - Trial = 20588/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.962 | DEBUG    | __main__:trials:29 - Trial = 20588/30000 | Total reward = 57.75
2022-01-26 14:18:05.965 | DEBUG    | __main__:trials:24 - Trial = 20589/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.967 | DEBUG    | __main__:trials:29 - Trial = 20589/30000 | Total reward = 47.01
2022-01-26 14:18:05.971 | DEBUG    | __main__:trials:24 - Trial = 20590/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.972 | DEBUG    | __main__:trials:29 - Trial = 20590/30000 | Total reward = 50.44
2022-01-26 14:18:05.976 | DEBUG    | __main__:trials:24 - Trial = 20591/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.977 | DEBUG    | __main__:trials:29 - Trial = 20591/30000 | Total reward = 53.18
2022-01-26 14:18:05.981 | DEBUG    | __main__:trials:24 - Trial = 20592/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.983 | DEBUG    | __main__:trials:29 - Trial = 20592/30000 | Total reward = 45.04
2022-01-26 14:18:05.987 | DEBUG    | __main__:trials:24 - Trial = 20593/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.988 | DEBUG    | __main__:trials:29 - Trial = 20593/30000 | Total reward = 46.73
2022-01-26 14:18:05.992 | DEBUG    | __main__:trials:24 - Trial = 20594/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.994 | DEBUG    | __main__:trials:29 - Trial = 20594/30000 | Total reward = 46.80
2022-01-26 14:18:05.997 | DEBUG    | __main__:trials:24 - Trial = 20595/30000 | Max number of steps (20) reached
2022-01-26 14:18:05.999 | DEBUG    | __main__:trials:29 - Trial = 20595/30000 | Total reward = 51.41
2022-01-26 14:18:06.003 | DEBUG    | __main__:trials:24 - Trial = 20596/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.004 | DEBUG    | __main__:trials:29 - Trial = 20596/30000 | Total reward = 47.35
2022-01-26 14:18:06.008 | DEBUG    | __main__:trials:24 - Trial = 20597/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.010 | DEBUG    | __main__:trials:29 - Trial = 20597/30000 | Total reward = 45.39
2022-01-26 14:18:06.014 | DEBUG    | __main__:trials:24 - Trial = 20598/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.015 | DEBUG    | __main__:trials:29 - Trial = 20598/30000 | Total reward = 43.52
2022-01-26 14:18:06.019 | DEBUG    | __main__:trials:24 - Trial = 20599/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.021 | DEBUG    | __main__:trials:29 - Trial = 20599/30000 | Total reward = 46.86
2022-01-26 14:18:06.024 | DEBUG    | __main__:trials:24 - Trial = 20600/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.026 | DEBUG    | __main__:trials:29 - Trial = 20600/30000 | Total reward = 37.20
2022-01-26 14:18:06.030 | DEBUG    | __main__:trials:24 - Trial = 20601/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.031 | DEBUG    | __main__:trials:29 - Trial = 20601/30000 | Total reward = 54.21
2022-01-26 14:18:06.034 | DEBUG    | __main__:trials:24 - Trial = 20602/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.036 | DEBUG    | __main__:trials:29 - Trial = 20602/30000 | Total reward = 39.41
2022-01-26 14:18:06.040 | DEBUG    | __main__:trials:24 - Trial = 20603/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.041 | DEBUG    | __main__:trials:29 - Trial = 20603/30000 | Total reward = 29.87
2022-01-26 14:18:06.044 | DEBUG    | __main__:trials:24 - Trial = 20604/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.046 | DEBUG    | __main__:trials:29 - Trial = 20604/30000 | Total reward = 38.77
2022-01-26 14:18:06.050 | DEBUG    | __main__:trials:24 - Trial = 20605/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.052 | DEBUG    | __main__:trials:29 - Trial = 20605/30000 | Total reward = 33.62
2022-01-26 14:18:06.055 | DEBUG    | __main__:trials:24 - Trial = 20606/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.057 | DEBUG    | __main__:trials:29 - Trial = 20606/30000 | Total reward = 51.91
2022-01-26 14:18:06.060 | DEBUG    | __main__:trials:24 - Trial = 20607/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.062 | DEBUG    | __main__:trials:29 - Trial = 20607/30000 | Total reward = 30.91
2022-01-26 14:18:06.066 | DEBUG    | __main__:trials:24 - Trial = 20608/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.067 | DEBUG    | __main__:trials:29 - Trial = 20608/30000 | Total reward = 37.72
2022-01-26 14:18:06.071 | DEBUG    | __main__:trials:26 - Trial = 20609/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:06.073 | DEBUG    | __main__:trials:29 - Trial = 20609/30000 | Total reward = 33.63
2022-01-26 14:18:06.076 | DEBUG    | __main__:trials:24 - Trial = 20610/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.078 | DEBUG    | __main__:trials:29 - Trial = 20610/30000 | Total reward = 39.57
2022-01-26 14:18:06.082 | DEBUG    | __main__:trials:24 - Trial = 20611/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.083 | DEBUG    | __main__:trials:29 - Trial = 20611/30000 | Total reward = 35.97
2022-01-26 14:18:06.086 | DEBUG    | __main__:trials:24 - Trial = 20612/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.088 | DEBUG    | __main__:trials:29 - Trial = 20612/30000 | Total reward = 37.97
2022-01-26 14:18:06.092 | DEBUG    | __main__:trials:24 - Trial = 20613/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.094 | DEBUG    | __main__:trials:29 - Trial = 20613/30000 | Total reward = 38.99
2022-01-26 14:18:06.098 | DEBUG    | __main__:trials:24 - Trial = 20614/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.099 | DEBUG    | __main__:trials:29 - Trial = 20614/30000 | Total reward = 37.80
2022-01-26 14:18:06.103 | DEBUG    | __main__:trials:24 - Trial = 20615/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.104 | DEBUG    | __main__:trials:29 - Trial = 20615/30000 | Total reward = 43.39
2022-01-26 14:18:06.108 | DEBUG    | __main__:trials:24 - Trial = 20616/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.110 | DEBUG    | __main__:trials:29 - Trial = 20616/30000 | Total reward = 39.57
2022-01-26 14:18:06.114 | DEBUG    | __main__:trials:24 - Trial = 20617/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.115 | DEBUG    | __main__:trials:29 - Trial = 20617/30000 | Total reward = 29.53
2022-01-26 14:18:06.119 | DEBUG    | __main__:trials:24 - Trial = 20618/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.120 | DEBUG    | __main__:trials:29 - Trial = 20618/30000 | Total reward = 30.33
2022-01-26 14:18:06.124 | DEBUG    | __main__:trials:24 - Trial = 20619/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.125 | DEBUG    | __main__:trials:29 - Trial = 20619/30000 | Total reward = 49.68
2022-01-26 14:18:06.129 | DEBUG    | __main__:trials:24 - Trial = 20620/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.131 | DEBUG    | __main__:trials:29 - Trial = 20620/30000 | Total reward = 30.72
2022-01-26 14:18:06.134 | DEBUG    | __main__:trials:24 - Trial = 20621/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.135 | DEBUG    | __main__:trials:29 - Trial = 20621/30000 | Total reward = 40.32
2022-01-26 14:18:06.139 | DEBUG    | __main__:trials:24 - Trial = 20622/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.141 | DEBUG    | __main__:trials:29 - Trial = 20622/30000 | Total reward = 39.37
2022-01-26 14:18:06.144 | DEBUG    | __main__:trials:24 - Trial = 20623/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.146 | DEBUG    | __main__:trials:29 - Trial = 20623/30000 | Total reward = 32.86
2022-01-26 14:18:06.149 | DEBUG    | __main__:trials:24 - Trial = 20624/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.150 | DEBUG    | __main__:trials:29 - Trial = 20624/30000 | Total reward = 33.90
2022-01-26 14:18:06.154 | DEBUG    | __main__:trials:24 - Trial = 20625/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.155 | DEBUG    | __main__:trials:29 - Trial = 20625/30000 | Total reward = 35.82
2022-01-26 14:18:06.159 | DEBUG    | __main__:trials:24 - Trial = 20626/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.161 | DEBUG    | __main__:trials:29 - Trial = 20626/30000 | Total reward = 40.85
2022-01-26 14:18:06.164 | DEBUG    | __main__:trials:24 - Trial = 20627/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.166 | DEBUG    | __main__:trials:29 - Trial = 20627/30000 | Total reward = 37.58
2022-01-26 14:18:06.169 | DEBUG    | __main__:trials:24 - Trial = 20628/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.171 | DEBUG    | __main__:trials:29 - Trial = 20628/30000 | Total reward = 42.80
2022-01-26 14:18:06.175 | DEBUG    | __main__:trials:24 - Trial = 20629/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.177 | DEBUG    | __main__:trials:29 - Trial = 20629/30000 | Total reward = 48.33
2022-01-26 14:18:06.180 | DEBUG    | __main__:trials:24 - Trial = 20630/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.181 | DEBUG    | __main__:trials:29 - Trial = 20630/30000 | Total reward = 33.03
2022-01-26 14:18:06.185 | DEBUG    | __main__:trials:24 - Trial = 20631/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.186 | DEBUG    | __main__:trials:29 - Trial = 20631/30000 | Total reward = 49.31
2022-01-26 14:18:06.189 | DEBUG    | __main__:trials:24 - Trial = 20632/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.190 | DEBUG    | __main__:trials:29 - Trial = 20632/30000 | Total reward = 44.12
2022-01-26 14:18:06.193 | DEBUG    | __main__:trials:24 - Trial = 20633/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.194 | DEBUG    | __main__:trials:29 - Trial = 20633/30000 | Total reward = 38.50
2022-01-26 14:18:06.197 | DEBUG    | __main__:trials:24 - Trial = 20634/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.198 | DEBUG    | __main__:trials:29 - Trial = 20634/30000 | Total reward = 42.97
2022-01-26 14:18:06.202 | DEBUG    | __main__:trials:24 - Trial = 20635/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.202 | DEBUG    | __main__:trials:29 - Trial = 20635/30000 | Total reward = 46.11
2022-01-26 14:18:06.206 | DEBUG    | __main__:trials:24 - Trial = 20636/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.208 | DEBUG    | __main__:trials:29 - Trial = 20636/30000 | Total reward = 54.73
2022-01-26 14:18:06.211 | DEBUG    | __main__:trials:24 - Trial = 20637/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.212 | DEBUG    | __main__:trials:29 - Trial = 20637/30000 | Total reward = 53.22
2022-01-26 14:18:06.216 | DEBUG    | __main__:trials:24 - Trial = 20638/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.217 | DEBUG    | __main__:trials:29 - Trial = 20638/30000 | Total reward = 36.37
2022-01-26 14:18:06.221 | DEBUG    | __main__:trials:24 - Trial = 20639/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.223 | DEBUG    | __main__:trials:29 - Trial = 20639/30000 | Total reward = 41.08
2022-01-26 14:18:06.226 | DEBUG    | __main__:trials:24 - Trial = 20640/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.228 | DEBUG    | __main__:trials:29 - Trial = 20640/30000 | Total reward = 36.99
2022-01-26 14:18:06.233 | DEBUG    | __main__:trials:24 - Trial = 20641/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.234 | DEBUG    | __main__:trials:29 - Trial = 20641/30000 | Total reward = 45.98
2022-01-26 14:18:06.238 | DEBUG    | __main__:trials:24 - Trial = 20642/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.239 | DEBUG    | __main__:trials:29 - Trial = 20642/30000 | Total reward = 37.96
2022-01-26 14:18:06.243 | DEBUG    | __main__:trials:24 - Trial = 20643/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.245 | DEBUG    | __main__:trials:29 - Trial = 20643/30000 | Total reward = 39.57
2022-01-26 14:18:06.249 | DEBUG    | __main__:trials:24 - Trial = 20644/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.249 | DEBUG    | __main__:trials:29 - Trial = 20644/30000 | Total reward = 36.60
2022-01-26 14:18:06.253 | DEBUG    | __main__:trials:24 - Trial = 20645/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.254 | DEBUG    | __main__:trials:29 - Trial = 20645/30000 | Total reward = 37.25
2022-01-26 14:18:06.258 | DEBUG    | __main__:trials:24 - Trial = 20646/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.259 | DEBUG    | __main__:trials:29 - Trial = 20646/30000 | Total reward = 44.84
2022-01-26 14:18:06.263 | DEBUG    | __main__:trials:24 - Trial = 20647/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.265 | DEBUG    | __main__:trials:29 - Trial = 20647/30000 | Total reward = 34.88
2022-01-26 14:18:06.268 | DEBUG    | __main__:trials:24 - Trial = 20648/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.270 | DEBUG    | __main__:trials:29 - Trial = 20648/30000 | Total reward = 40.05
2022-01-26 14:18:06.273 | DEBUG    | __main__:trials:24 - Trial = 20649/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.275 | DEBUG    | __main__:trials:29 - Trial = 20649/30000 | Total reward = 39.92
2022-01-26 14:18:06.279 | DEBUG    | __main__:trials:24 - Trial = 20650/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.280 | DEBUG    | __main__:trials:29 - Trial = 20650/30000 | Total reward = 41.02
2022-01-26 14:18:06.284 | DEBUG    | __main__:trials:24 - Trial = 20651/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.285 | DEBUG    | __main__:trials:29 - Trial = 20651/30000 | Total reward = 36.56
2022-01-26 14:18:06.289 | DEBUG    | __main__:trials:24 - Trial = 20652/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.290 | DEBUG    | __main__:trials:29 - Trial = 20652/30000 | Total reward = 39.57
2022-01-26 14:18:06.293 | DEBUG    | __main__:trials:24 - Trial = 20653/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.294 | DEBUG    | __main__:trials:29 - Trial = 20653/30000 | Total reward = 45.48
2022-01-26 14:18:06.297 | DEBUG    | __main__:trials:24 - Trial = 20654/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.297 | DEBUG    | __main__:trials:29 - Trial = 20654/30000 | Total reward = 47.12
2022-01-26 14:18:06.301 | DEBUG    | __main__:trials:24 - Trial = 20655/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.302 | DEBUG    | __main__:trials:29 - Trial = 20655/30000 | Total reward = 51.32
2022-01-26 14:18:06.306 | DEBUG    | __main__:trials:24 - Trial = 20656/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.307 | DEBUG    | __main__:trials:29 - Trial = 20656/30000 | Total reward = 53.13
2022-01-26 14:18:06.310 | DEBUG    | __main__:trials:24 - Trial = 20657/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.312 | DEBUG    | __main__:trials:29 - Trial = 20657/30000 | Total reward = 39.63
2022-01-26 14:18:06.315 | DEBUG    | __main__:trials:24 - Trial = 20658/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.316 | DEBUG    | __main__:trials:29 - Trial = 20658/30000 | Total reward = 36.64
2022-01-26 14:18:06.319 | DEBUG    | __main__:trials:24 - Trial = 20659/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.320 | DEBUG    | __main__:trials:29 - Trial = 20659/30000 | Total reward = 50.77
2022-01-26 14:18:06.324 | DEBUG    | __main__:trials:24 - Trial = 20660/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.325 | DEBUG    | __main__:trials:29 - Trial = 20660/30000 | Total reward = 48.44
2022-01-26 14:18:06.329 | DEBUG    | __main__:trials:24 - Trial = 20661/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.330 | DEBUG    | __main__:trials:29 - Trial = 20661/30000 | Total reward = 42.07
2022-01-26 14:18:06.333 | DEBUG    | __main__:trials:24 - Trial = 20662/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.334 | DEBUG    | __main__:trials:29 - Trial = 20662/30000 | Total reward = 59.99
2022-01-26 14:18:06.338 | DEBUG    | __main__:trials:24 - Trial = 20663/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.339 | DEBUG    | __main__:trials:29 - Trial = 20663/30000 | Total reward = 43.40
2022-01-26 14:18:06.343 | DEBUG    | __main__:trials:24 - Trial = 20664/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.344 | DEBUG    | __main__:trials:29 - Trial = 20664/30000 | Total reward = 53.66
2022-01-26 14:18:06.348 | DEBUG    | __main__:trials:24 - Trial = 20665/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.349 | DEBUG    | __main__:trials:29 - Trial = 20665/30000 | Total reward = 47.40
2022-01-26 14:18:06.353 | DEBUG    | __main__:trials:26 - Trial = 20666/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:06.353 | DEBUG    | __main__:trials:29 - Trial = 20666/30000 | Total reward = 34.81
2022-01-26 14:18:06.357 | DEBUG    | __main__:trials:24 - Trial = 20667/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.358 | DEBUG    | __main__:trials:29 - Trial = 20667/30000 | Total reward = 37.43
2022-01-26 14:18:06.362 | DEBUG    | __main__:trials:24 - Trial = 20668/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.362 | DEBUG    | __main__:trials:29 - Trial = 20668/30000 | Total reward = 46.79
2022-01-26 14:18:06.366 | DEBUG    | __main__:trials:24 - Trial = 20669/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.367 | DEBUG    | __main__:trials:29 - Trial = 20669/30000 | Total reward = 42.52
2022-01-26 14:18:06.371 | DEBUG    | __main__:trials:24 - Trial = 20670/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.372 | DEBUG    | __main__:trials:29 - Trial = 20670/30000 | Total reward = 57.01
2022-01-26 14:18:06.375 | DEBUG    | __main__:trials:24 - Trial = 20671/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.377 | DEBUG    | __main__:trials:29 - Trial = 20671/30000 | Total reward = 53.28
2022-01-26 14:18:06.380 | DEBUG    | __main__:trials:24 - Trial = 20672/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.381 | DEBUG    | __main__:trials:29 - Trial = 20672/30000 | Total reward = 43.63
2022-01-26 14:18:06.384 | DEBUG    | __main__:trials:24 - Trial = 20673/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.386 | DEBUG    | __main__:trials:29 - Trial = 20673/30000 | Total reward = 46.87
2022-01-26 14:18:06.390 | DEBUG    | __main__:trials:24 - Trial = 20674/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.391 | DEBUG    | __main__:trials:29 - Trial = 20674/30000 | Total reward = 52.32
2022-01-26 14:18:06.394 | DEBUG    | __main__:trials:24 - Trial = 20675/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.396 | DEBUG    | __main__:trials:29 - Trial = 20675/30000 | Total reward = 42.21
2022-01-26 14:18:06.400 | DEBUG    | __main__:trials:24 - Trial = 20676/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.402 | DEBUG    | __main__:trials:29 - Trial = 20676/30000 | Total reward = 53.02
2022-01-26 14:18:06.406 | DEBUG    | __main__:trials:24 - Trial = 20677/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.406 | DEBUG    | __main__:trials:29 - Trial = 20677/30000 | Total reward = 50.67
2022-01-26 14:18:06.410 | DEBUG    | __main__:trials:24 - Trial = 20678/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.412 | DEBUG    | __main__:trials:29 - Trial = 20678/30000 | Total reward = 40.73
2022-01-26 14:18:06.415 | DEBUG    | __main__:trials:24 - Trial = 20679/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.417 | DEBUG    | __main__:trials:29 - Trial = 20679/30000 | Total reward = 49.89
2022-01-26 14:18:06.420 | DEBUG    | __main__:trials:24 - Trial = 20680/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.422 | DEBUG    | __main__:trials:29 - Trial = 20680/30000 | Total reward = 53.28
2022-01-26 14:18:06.426 | DEBUG    | __main__:trials:24 - Trial = 20681/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.427 | DEBUG    | __main__:trials:29 - Trial = 20681/30000 | Total reward = 34.62
2022-01-26 14:18:06.431 | DEBUG    | __main__:trials:24 - Trial = 20682/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.433 | DEBUG    | __main__:trials:29 - Trial = 20682/30000 | Total reward = 53.04
2022-01-26 14:18:06.437 | DEBUG    | __main__:trials:24 - Trial = 20683/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.437 | DEBUG    | __main__:trials:29 - Trial = 20683/30000 | Total reward = 47.11
2022-01-26 14:18:06.441 | DEBUG    | __main__:trials:24 - Trial = 20684/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.442 | DEBUG    | __main__:trials:29 - Trial = 20684/30000 | Total reward = 41.64
2022-01-26 14:18:06.446 | DEBUG    | __main__:trials:24 - Trial = 20685/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.449 | DEBUG    | __main__:trials:29 - Trial = 20685/30000 | Total reward = 39.17
2022-01-26 14:18:06.452 | DEBUG    | __main__:trials:24 - Trial = 20686/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.453 | DEBUG    | __main__:trials:29 - Trial = 20686/30000 | Total reward = 32.17
2022-01-26 14:18:06.457 | DEBUG    | __main__:trials:24 - Trial = 20687/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.458 | DEBUG    | __main__:trials:29 - Trial = 20687/30000 | Total reward = 43.46
2022-01-26 14:18:06.462 | DEBUG    | __main__:trials:24 - Trial = 20688/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.463 | DEBUG    | __main__:trials:29 - Trial = 20688/30000 | Total reward = 32.17
2022-01-26 14:18:06.467 | DEBUG    | __main__:trials:24 - Trial = 20689/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.468 | DEBUG    | __main__:trials:29 - Trial = 20689/30000 | Total reward = 36.44
2022-01-26 14:18:06.472 | DEBUG    | __main__:trials:24 - Trial = 20690/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.473 | DEBUG    | __main__:trials:29 - Trial = 20690/30000 | Total reward = 39.62
2022-01-26 14:18:06.477 | DEBUG    | __main__:trials:24 - Trial = 20691/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.478 | DEBUG    | __main__:trials:29 - Trial = 20691/30000 | Total reward = 39.57
2022-01-26 14:18:06.482 | DEBUG    | __main__:trials:24 - Trial = 20692/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.484 | DEBUG    | __main__:trials:29 - Trial = 20692/30000 | Total reward = 52.14
2022-01-26 14:18:06.487 | DEBUG    | __main__:trials:24 - Trial = 20693/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.489 | DEBUG    | __main__:trials:29 - Trial = 20693/30000 | Total reward = 39.42
2022-01-26 14:18:06.493 | DEBUG    | __main__:trials:24 - Trial = 20694/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.494 | DEBUG    | __main__:trials:29 - Trial = 20694/30000 | Total reward = 41.27
2022-01-26 14:18:06.498 | DEBUG    | __main__:trials:24 - Trial = 20695/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.500 | DEBUG    | __main__:trials:29 - Trial = 20695/30000 | Total reward = 47.06
2022-01-26 14:18:06.504 | DEBUG    | __main__:trials:24 - Trial = 20696/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.505 | DEBUG    | __main__:trials:29 - Trial = 20696/30000 | Total reward = 38.23
2022-01-26 14:18:06.509 | DEBUG    | __main__:trials:24 - Trial = 20697/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.511 | DEBUG    | __main__:trials:29 - Trial = 20697/30000 | Total reward = 40.93
2022-01-26 14:18:06.515 | DEBUG    | __main__:trials:24 - Trial = 20698/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.516 | DEBUG    | __main__:trials:29 - Trial = 20698/30000 | Total reward = 34.65
2022-01-26 14:18:06.520 | DEBUG    | __main__:trials:24 - Trial = 20699/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.522 | DEBUG    | __main__:trials:29 - Trial = 20699/30000 | Total reward = 35.01
2022-01-26 14:18:06.526 | DEBUG    | __main__:trials:24 - Trial = 20700/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.527 | DEBUG    | __main__:trials:29 - Trial = 20700/30000 | Total reward = 39.80
2022-01-26 14:18:06.530 | DEBUG    | __main__:trials:24 - Trial = 20701/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.532 | DEBUG    | __main__:trials:29 - Trial = 20701/30000 | Total reward = 41.35
2022-01-26 14:18:06.536 | DEBUG    | __main__:trials:24 - Trial = 20702/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.538 | DEBUG    | __main__:trials:29 - Trial = 20702/30000 | Total reward = 34.73
2022-01-26 14:18:06.541 | DEBUG    | __main__:trials:26 - Trial = 20703/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:06.542 | DEBUG    | __main__:trials:29 - Trial = 20703/30000 | Total reward = 12.07
2022-01-26 14:18:06.546 | DEBUG    | __main__:trials:24 - Trial = 20704/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.547 | DEBUG    | __main__:trials:29 - Trial = 20704/30000 | Total reward = 47.33
2022-01-26 14:18:06.551 | DEBUG    | __main__:trials:24 - Trial = 20705/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.553 | DEBUG    | __main__:trials:29 - Trial = 20705/30000 | Total reward = 42.02
2022-01-26 14:18:06.556 | DEBUG    | __main__:trials:24 - Trial = 20706/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.558 | DEBUG    | __main__:trials:29 - Trial = 20706/30000 | Total reward = 40.22
2022-01-26 14:18:06.562 | DEBUG    | __main__:trials:24 - Trial = 20707/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.563 | DEBUG    | __main__:trials:29 - Trial = 20707/30000 | Total reward = 39.57
2022-01-26 14:18:06.567 | DEBUG    | __main__:trials:24 - Trial = 20708/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.569 | DEBUG    | __main__:trials:29 - Trial = 20708/30000 | Total reward = 42.72
2022-01-26 14:18:06.572 | DEBUG    | __main__:trials:24 - Trial = 20709/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.573 | DEBUG    | __main__:trials:29 - Trial = 20709/30000 | Total reward = 37.13
2022-01-26 14:18:06.577 | DEBUG    | __main__:trials:24 - Trial = 20710/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.578 | DEBUG    | __main__:trials:29 - Trial = 20710/30000 | Total reward = 47.23
2022-01-26 14:18:06.582 | DEBUG    | __main__:trials:24 - Trial = 20711/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.583 | DEBUG    | __main__:trials:29 - Trial = 20711/30000 | Total reward = 34.26
2022-01-26 14:18:06.587 | DEBUG    | __main__:trials:24 - Trial = 20712/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.588 | DEBUG    | __main__:trials:29 - Trial = 20712/30000 | Total reward = 38.82
2022-01-26 14:18:06.592 | DEBUG    | __main__:trials:24 - Trial = 20713/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.594 | DEBUG    | __main__:trials:29 - Trial = 20713/30000 | Total reward = 49.47
2022-01-26 14:18:06.598 | DEBUG    | __main__:trials:24 - Trial = 20714/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.599 | DEBUG    | __main__:trials:29 - Trial = 20714/30000 | Total reward = 39.88
2022-01-26 14:18:06.603 | DEBUG    | __main__:trials:24 - Trial = 20715/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.605 | DEBUG    | __main__:trials:29 - Trial = 20715/30000 | Total reward = 38.93
2022-01-26 14:18:06.608 | DEBUG    | __main__:trials:24 - Trial = 20716/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.609 | DEBUG    | __main__:trials:29 - Trial = 20716/30000 | Total reward = 39.57
2022-01-26 14:18:06.612 | DEBUG    | __main__:trials:24 - Trial = 20717/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.614 | DEBUG    | __main__:trials:29 - Trial = 20717/30000 | Total reward = 41.90
2022-01-26 14:18:06.618 | DEBUG    | __main__:trials:24 - Trial = 20718/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.620 | DEBUG    | __main__:trials:29 - Trial = 20718/30000 | Total reward = 47.17
2022-01-26 14:18:06.623 | DEBUG    | __main__:trials:24 - Trial = 20719/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.625 | DEBUG    | __main__:trials:29 - Trial = 20719/30000 | Total reward = 44.52
2022-01-26 14:18:06.628 | DEBUG    | __main__:trials:24 - Trial = 20720/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.630 | DEBUG    | __main__:trials:29 - Trial = 20720/30000 | Total reward = 49.71
2022-01-26 14:18:06.634 | DEBUG    | __main__:trials:24 - Trial = 20721/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.636 | DEBUG    | __main__:trials:29 - Trial = 20721/30000 | Total reward = 40.20
2022-01-26 14:18:06.639 | DEBUG    | __main__:trials:24 - Trial = 20722/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.639 | DEBUG    | __main__:trials:29 - Trial = 20722/30000 | Total reward = 52.69
2022-01-26 14:18:06.644 | DEBUG    | __main__:trials:24 - Trial = 20723/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.645 | DEBUG    | __main__:trials:29 - Trial = 20723/30000 | Total reward = 38.79
2022-01-26 14:18:06.649 | DEBUG    | __main__:trials:24 - Trial = 20724/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.651 | DEBUG    | __main__:trials:29 - Trial = 20724/30000 | Total reward = 39.12
2022-01-26 14:18:06.655 | DEBUG    | __main__:trials:24 - Trial = 20725/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.656 | DEBUG    | __main__:trials:29 - Trial = 20725/30000 | Total reward = 42.43
2022-01-26 14:18:06.660 | DEBUG    | __main__:trials:24 - Trial = 20726/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.662 | DEBUG    | __main__:trials:29 - Trial = 20726/30000 | Total reward = 32.93
2022-01-26 14:18:06.665 | DEBUG    | __main__:trials:24 - Trial = 20727/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.667 | DEBUG    | __main__:trials:29 - Trial = 20727/30000 | Total reward = 37.74
2022-01-26 14:18:06.671 | DEBUG    | __main__:trials:24 - Trial = 20728/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.672 | DEBUG    | __main__:trials:29 - Trial = 20728/30000 | Total reward = 45.00
2022-01-26 14:18:06.676 | DEBUG    | __main__:trials:26 - Trial = 20729/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:06.677 | DEBUG    | __main__:trials:29 - Trial = 20729/30000 | Total reward = 25.79
2022-01-26 14:18:06.681 | DEBUG    | __main__:trials:24 - Trial = 20730/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.682 | DEBUG    | __main__:trials:29 - Trial = 20730/30000 | Total reward = 35.33
2022-01-26 14:18:06.686 | DEBUG    | __main__:trials:24 - Trial = 20731/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.688 | DEBUG    | __main__:trials:29 - Trial = 20731/30000 | Total reward = 37.32
2022-01-26 14:18:06.692 | DEBUG    | __main__:trials:24 - Trial = 20732/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.692 | DEBUG    | __main__:trials:29 - Trial = 20732/30000 | Total reward = 35.90
2022-01-26 14:18:06.697 | DEBUG    | __main__:trials:24 - Trial = 20733/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.697 | DEBUG    | __main__:trials:29 - Trial = 20733/30000 | Total reward = 40.69
2022-01-26 14:18:06.702 | DEBUG    | __main__:trials:24 - Trial = 20734/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.703 | DEBUG    | __main__:trials:29 - Trial = 20734/30000 | Total reward = 32.24
2022-01-26 14:18:06.707 | DEBUG    | __main__:trials:24 - Trial = 20735/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.709 | DEBUG    | __main__:trials:29 - Trial = 20735/30000 | Total reward = 35.93
2022-01-26 14:18:06.713 | DEBUG    | __main__:trials:24 - Trial = 20736/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.714 | DEBUG    | __main__:trials:29 - Trial = 20736/30000 | Total reward = 37.35
2022-01-26 14:18:06.717 | DEBUG    | __main__:trials:24 - Trial = 20737/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.718 | DEBUG    | __main__:trials:29 - Trial = 20737/30000 | Total reward = 38.39
2022-01-26 14:18:06.721 | DEBUG    | __main__:trials:24 - Trial = 20738/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.722 | DEBUG    | __main__:trials:29 - Trial = 20738/30000 | Total reward = 39.57
2022-01-26 14:18:06.726 | DEBUG    | __main__:trials:24 - Trial = 20739/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.727 | DEBUG    | __main__:trials:29 - Trial = 20739/30000 | Total reward = 34.24
2022-01-26 14:18:06.730 | DEBUG    | __main__:trials:24 - Trial = 20740/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.732 | DEBUG    | __main__:trials:29 - Trial = 20740/30000 | Total reward = 46.37
2022-01-26 14:18:06.735 | DEBUG    | __main__:trials:24 - Trial = 20741/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.737 | DEBUG    | __main__:trials:29 - Trial = 20741/30000 | Total reward = 40.50
2022-01-26 14:18:06.741 | DEBUG    | __main__:trials:24 - Trial = 20742/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.742 | DEBUG    | __main__:trials:29 - Trial = 20742/30000 | Total reward = 63.18
2022-01-26 14:18:06.746 | DEBUG    | __main__:trials:24 - Trial = 20743/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.747 | DEBUG    | __main__:trials:29 - Trial = 20743/30000 | Total reward = 33.53
2022-01-26 14:18:06.750 | DEBUG    | __main__:trials:24 - Trial = 20744/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.752 | DEBUG    | __main__:trials:29 - Trial = 20744/30000 | Total reward = 39.83
2022-01-26 14:18:06.756 | DEBUG    | __main__:trials:24 - Trial = 20745/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.757 | DEBUG    | __main__:trials:29 - Trial = 20745/30000 | Total reward = 28.71
2022-01-26 14:18:06.761 | DEBUG    | __main__:trials:24 - Trial = 20746/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.762 | DEBUG    | __main__:trials:29 - Trial = 20746/30000 | Total reward = 49.26
2022-01-26 14:18:06.766 | DEBUG    | __main__:trials:24 - Trial = 20747/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.768 | DEBUG    | __main__:trials:29 - Trial = 20747/30000 | Total reward = 48.55
2022-01-26 14:18:06.771 | DEBUG    | __main__:trials:24 - Trial = 20748/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.773 | DEBUG    | __main__:trials:29 - Trial = 20748/30000 | Total reward = 45.79
2022-01-26 14:18:06.777 | DEBUG    | __main__:trials:24 - Trial = 20749/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.779 | DEBUG    | __main__:trials:29 - Trial = 20749/30000 | Total reward = 38.92
2022-01-26 14:18:06.783 | DEBUG    | __main__:trials:24 - Trial = 20750/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.784 | DEBUG    | __main__:trials:29 - Trial = 20750/30000 | Total reward = 27.31
2022-01-26 14:18:06.787 | DEBUG    | __main__:trials:24 - Trial = 20751/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.789 | DEBUG    | __main__:trials:29 - Trial = 20751/30000 | Total reward = 42.08
2022-01-26 14:18:06.793 | DEBUG    | __main__:trials:24 - Trial = 20752/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.794 | DEBUG    | __main__:trials:29 - Trial = 20752/30000 | Total reward = 38.69
2022-01-26 14:18:06.798 | DEBUG    | __main__:trials:24 - Trial = 20753/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.799 | DEBUG    | __main__:trials:29 - Trial = 20753/30000 | Total reward = 37.50
2022-01-26 14:18:06.802 | DEBUG    | __main__:trials:26 - Trial = 20754/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:06.803 | DEBUG    | __main__:trials:29 - Trial = 20754/30000 | Total reward = 22.94
2022-01-26 14:18:06.807 | DEBUG    | __main__:trials:24 - Trial = 20755/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.809 | DEBUG    | __main__:trials:29 - Trial = 20755/30000 | Total reward = 37.68
2022-01-26 14:18:06.812 | DEBUG    | __main__:trials:24 - Trial = 20756/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.813 | DEBUG    | __main__:trials:29 - Trial = 20756/30000 | Total reward = 40.58
2022-01-26 14:18:06.817 | DEBUG    | __main__:trials:24 - Trial = 20757/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.819 | DEBUG    | __main__:trials:29 - Trial = 20757/30000 | Total reward = 42.07
2022-01-26 14:18:06.822 | DEBUG    | __main__:trials:24 - Trial = 20758/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.822 | DEBUG    | __main__:trials:29 - Trial = 20758/30000 | Total reward = 37.38
2022-01-26 14:18:06.827 | DEBUG    | __main__:trials:24 - Trial = 20759/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.828 | DEBUG    | __main__:trials:29 - Trial = 20759/30000 | Total reward = 39.57
2022-01-26 14:18:06.832 | DEBUG    | __main__:trials:24 - Trial = 20760/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.833 | DEBUG    | __main__:trials:29 - Trial = 20760/30000 | Total reward = 38.01
2022-01-26 14:18:06.837 | DEBUG    | __main__:trials:24 - Trial = 20761/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.839 | DEBUG    | __main__:trials:29 - Trial = 20761/30000 | Total reward = 40.99
2022-01-26 14:18:06.843 | DEBUG    | __main__:trials:24 - Trial = 20762/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.844 | DEBUG    | __main__:trials:29 - Trial = 20762/30000 | Total reward = 49.32
2022-01-26 14:18:06.847 | DEBUG    | __main__:trials:24 - Trial = 20763/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.849 | DEBUG    | __main__:trials:29 - Trial = 20763/30000 | Total reward = 43.34
2022-01-26 14:18:06.852 | DEBUG    | __main__:trials:24 - Trial = 20764/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.854 | DEBUG    | __main__:trials:29 - Trial = 20764/30000 | Total reward = 36.53
2022-01-26 14:18:06.858 | DEBUG    | __main__:trials:24 - Trial = 20765/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.859 | DEBUG    | __main__:trials:29 - Trial = 20765/30000 | Total reward = 41.62
2022-01-26 14:18:06.864 | DEBUG    | __main__:trials:24 - Trial = 20766/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.866 | DEBUG    | __main__:trials:29 - Trial = 20766/30000 | Total reward = 41.14
2022-01-26 14:18:06.869 | DEBUG    | __main__:trials:24 - Trial = 20767/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.870 | DEBUG    | __main__:trials:29 - Trial = 20767/30000 | Total reward = 39.58
2022-01-26 14:18:06.875 | DEBUG    | __main__:trials:24 - Trial = 20768/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.877 | DEBUG    | __main__:trials:29 - Trial = 20768/30000 | Total reward = 43.59
2022-01-26 14:18:06.880 | DEBUG    | __main__:trials:24 - Trial = 20769/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.882 | DEBUG    | __main__:trials:29 - Trial = 20769/30000 | Total reward = 44.04
2022-01-26 14:18:06.885 | DEBUG    | __main__:trials:24 - Trial = 20770/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.886 | DEBUG    | __main__:trials:29 - Trial = 20770/30000 | Total reward = 39.57
2022-01-26 14:18:06.891 | DEBUG    | __main__:trials:24 - Trial = 20771/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.892 | DEBUG    | __main__:trials:29 - Trial = 20771/30000 | Total reward = 49.32
2022-01-26 14:18:06.896 | DEBUG    | __main__:trials:24 - Trial = 20772/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.897 | DEBUG    | __main__:trials:29 - Trial = 20772/30000 | Total reward = 50.05
2022-01-26 14:18:06.901 | DEBUG    | __main__:trials:26 - Trial = 20773/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:06.903 | DEBUG    | __main__:trials:29 - Trial = 20773/30000 | Total reward = 26.80
2022-01-26 14:18:06.907 | DEBUG    | __main__:trials:24 - Trial = 20774/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.909 | DEBUG    | __main__:trials:29 - Trial = 20774/30000 | Total reward = 42.99
2022-01-26 14:18:06.912 | DEBUG    | __main__:trials:24 - Trial = 20775/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.913 | DEBUG    | __main__:trials:29 - Trial = 20775/30000 | Total reward = 40.11
2022-01-26 14:18:06.917 | DEBUG    | __main__:trials:24 - Trial = 20776/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.918 | DEBUG    | __main__:trials:29 - Trial = 20776/30000 | Total reward = 46.63
2022-01-26 14:18:06.921 | DEBUG    | __main__:trials:24 - Trial = 20777/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.923 | DEBUG    | __main__:trials:29 - Trial = 20777/30000 | Total reward = 40.03
2022-01-26 14:18:06.926 | DEBUG    | __main__:trials:24 - Trial = 20778/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.927 | DEBUG    | __main__:trials:29 - Trial = 20778/30000 | Total reward = 38.56
2022-01-26 14:18:06.932 | DEBUG    | __main__:trials:24 - Trial = 20779/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.933 | DEBUG    | __main__:trials:29 - Trial = 20779/30000 | Total reward = 46.15
2022-01-26 14:18:06.937 | DEBUG    | __main__:trials:24 - Trial = 20780/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.939 | DEBUG    | __main__:trials:29 - Trial = 20780/30000 | Total reward = 42.84
2022-01-26 14:18:06.942 | DEBUG    | __main__:trials:24 - Trial = 20781/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.944 | DEBUG    | __main__:trials:29 - Trial = 20781/30000 | Total reward = 32.33
2022-01-26 14:18:06.948 | DEBUG    | __main__:trials:24 - Trial = 20782/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.950 | DEBUG    | __main__:trials:29 - Trial = 20782/30000 | Total reward = 46.82
2022-01-26 14:18:06.954 | DEBUG    | __main__:trials:24 - Trial = 20783/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.955 | DEBUG    | __main__:trials:29 - Trial = 20783/30000 | Total reward = 49.46
2022-01-26 14:18:06.959 | DEBUG    | __main__:trials:24 - Trial = 20784/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.960 | DEBUG    | __main__:trials:29 - Trial = 20784/30000 | Total reward = 36.75
2022-01-26 14:18:06.964 | DEBUG    | __main__:trials:24 - Trial = 20785/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.965 | DEBUG    | __main__:trials:29 - Trial = 20785/30000 | Total reward = 43.85
2022-01-26 14:18:06.969 | DEBUG    | __main__:trials:24 - Trial = 20786/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.971 | DEBUG    | __main__:trials:29 - Trial = 20786/30000 | Total reward = 48.35
2022-01-26 14:18:06.975 | DEBUG    | __main__:trials:24 - Trial = 20787/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.975 | DEBUG    | __main__:trials:29 - Trial = 20787/30000 | Total reward = 35.21
2022-01-26 14:18:06.979 | DEBUG    | __main__:trials:24 - Trial = 20788/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.981 | DEBUG    | __main__:trials:29 - Trial = 20788/30000 | Total reward = 26.53
2022-01-26 14:18:06.985 | DEBUG    | __main__:trials:24 - Trial = 20789/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.985 | DEBUG    | __main__:trials:29 - Trial = 20789/30000 | Total reward = 37.48
2022-01-26 14:18:06.989 | DEBUG    | __main__:trials:24 - Trial = 20790/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.990 | DEBUG    | __main__:trials:29 - Trial = 20790/30000 | Total reward = 36.91
2022-01-26 14:18:06.993 | DEBUG    | __main__:trials:24 - Trial = 20791/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.994 | DEBUG    | __main__:trials:29 - Trial = 20791/30000 | Total reward = 47.96
2022-01-26 14:18:06.998 | DEBUG    | __main__:trials:24 - Trial = 20792/30000 | Max number of steps (20) reached
2022-01-26 14:18:06.998 | DEBUG    | __main__:trials:29 - Trial = 20792/30000 | Total reward = 40.60
2022-01-26 14:18:07.002 | DEBUG    | __main__:trials:24 - Trial = 20793/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.003 | DEBUG    | __main__:trials:29 - Trial = 20793/30000 | Total reward = 36.49
2022-01-26 14:18:07.007 | DEBUG    | __main__:trials:24 - Trial = 20794/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.009 | DEBUG    | __main__:trials:29 - Trial = 20794/30000 | Total reward = 43.36
2022-01-26 14:18:07.012 | DEBUG    | __main__:trials:24 - Trial = 20795/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.014 | DEBUG    | __main__:trials:29 - Trial = 20795/30000 | Total reward = 41.68
2022-01-26 14:18:07.018 | DEBUG    | __main__:trials:24 - Trial = 20796/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.019 | DEBUG    | __main__:trials:29 - Trial = 20796/30000 | Total reward = 47.74
2022-01-26 14:18:07.022 | DEBUG    | __main__:trials:24 - Trial = 20797/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.024 | DEBUG    | __main__:trials:29 - Trial = 20797/30000 | Total reward = 42.39
2022-01-26 14:18:07.028 | DEBUG    | __main__:trials:24 - Trial = 20798/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.029 | DEBUG    | __main__:trials:29 - Trial = 20798/30000 | Total reward = 46.47
2022-01-26 14:18:07.033 | DEBUG    | __main__:trials:24 - Trial = 20799/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.034 | DEBUG    | __main__:trials:29 - Trial = 20799/30000 | Total reward = 36.56
2022-01-26 14:18:07.038 | DEBUG    | __main__:trials:24 - Trial = 20800/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.040 | DEBUG    | __main__:trials:29 - Trial = 20800/30000 | Total reward = 37.89
2022-01-26 14:18:07.043 | DEBUG    | __main__:trials:24 - Trial = 20801/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.045 | DEBUG    | __main__:trials:29 - Trial = 20801/30000 | Total reward = 38.48
2022-01-26 14:18:07.048 | DEBUG    | __main__:trials:24 - Trial = 20802/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.049 | DEBUG    | __main__:trials:29 - Trial = 20802/30000 | Total reward = 36.78
2022-01-26 14:18:07.053 | DEBUG    | __main__:trials:24 - Trial = 20803/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.054 | DEBUG    | __main__:trials:29 - Trial = 20803/30000 | Total reward = 34.21
2022-01-26 14:18:07.058 | DEBUG    | __main__:trials:24 - Trial = 20804/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.060 | DEBUG    | __main__:trials:29 - Trial = 20804/30000 | Total reward = 39.80
2022-01-26 14:18:07.063 | DEBUG    | __main__:trials:24 - Trial = 20805/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.065 | DEBUG    | __main__:trials:29 - Trial = 20805/30000 | Total reward = 45.32
2022-01-26 14:18:07.068 | DEBUG    | __main__:trials:24 - Trial = 20806/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.069 | DEBUG    | __main__:trials:29 - Trial = 20806/30000 | Total reward = 38.00
2022-01-26 14:18:07.072 | DEBUG    | __main__:trials:24 - Trial = 20807/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.074 | DEBUG    | __main__:trials:29 - Trial = 20807/30000 | Total reward = 37.40
2022-01-26 14:18:07.078 | DEBUG    | __main__:trials:24 - Trial = 20808/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.078 | DEBUG    | __main__:trials:29 - Trial = 20808/30000 | Total reward = 44.21
2022-01-26 14:18:07.083 | DEBUG    | __main__:trials:24 - Trial = 20809/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.084 | DEBUG    | __main__:trials:29 - Trial = 20809/30000 | Total reward = 34.72
2022-01-26 14:18:07.088 | DEBUG    | __main__:trials:24 - Trial = 20810/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.090 | DEBUG    | __main__:trials:29 - Trial = 20810/30000 | Total reward = 37.69
2022-01-26 14:18:07.093 | DEBUG    | __main__:trials:24 - Trial = 20811/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.094 | DEBUG    | __main__:trials:29 - Trial = 20811/30000 | Total reward = 48.36
2022-01-26 14:18:07.099 | DEBUG    | __main__:trials:24 - Trial = 20812/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.100 | DEBUG    | __main__:trials:29 - Trial = 20812/30000 | Total reward = 42.68
2022-01-26 14:18:07.104 | DEBUG    | __main__:trials:24 - Trial = 20813/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.106 | DEBUG    | __main__:trials:29 - Trial = 20813/30000 | Total reward = 35.13
2022-01-26 14:18:07.109 | DEBUG    | __main__:trials:26 - Trial = 20814/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.110 | DEBUG    | __main__:trials:29 - Trial = 20814/30000 | Total reward = 5.99
2022-01-26 14:18:07.113 | DEBUG    | __main__:trials:26 - Trial = 20815/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.114 | DEBUG    | __main__:trials:29 - Trial = 20815/30000 | Total reward = 9.99
2022-01-26 14:18:07.117 | DEBUG    | __main__:trials:24 - Trial = 20816/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.119 | DEBUG    | __main__:trials:29 - Trial = 20816/30000 | Total reward = 49.92
2022-01-26 14:18:07.122 | DEBUG    | __main__:trials:26 - Trial = 20817/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.122 | DEBUG    | __main__:trials:29 - Trial = 20817/30000 | Total reward = 9.99
2022-01-26 14:18:07.125 | DEBUG    | __main__:trials:26 - Trial = 20818/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.127 | DEBUG    | __main__:trials:29 - Trial = 20818/30000 | Total reward = 9.99
2022-01-26 14:18:07.130 | DEBUG    | __main__:trials:26 - Trial = 20819/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.131 | DEBUG    | __main__:trials:29 - Trial = 20819/30000 | Total reward = 9.99
2022-01-26 14:18:07.134 | DEBUG    | __main__:trials:26 - Trial = 20820/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.136 | DEBUG    | __main__:trials:29 - Trial = 20820/30000 | Total reward = 22.62
2022-01-26 14:18:07.140 | DEBUG    | __main__:trials:24 - Trial = 20821/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.141 | DEBUG    | __main__:trials:29 - Trial = 20821/30000 | Total reward = 51.45
2022-01-26 14:18:07.145 | DEBUG    | __main__:trials:26 - Trial = 20822/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.147 | DEBUG    | __main__:trials:29 - Trial = 20822/30000 | Total reward = 23.41
2022-01-26 14:18:07.149 | DEBUG    | __main__:trials:26 - Trial = 20823/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.150 | DEBUG    | __main__:trials:29 - Trial = 20823/30000 | Total reward = 9.99
2022-01-26 14:18:07.154 | DEBUG    | __main__:trials:24 - Trial = 20824/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.156 | DEBUG    | __main__:trials:29 - Trial = 20824/30000 | Total reward = 49.29
2022-01-26 14:18:07.160 | DEBUG    | __main__:trials:24 - Trial = 20825/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.161 | DEBUG    | __main__:trials:29 - Trial = 20825/30000 | Total reward = 49.09
2022-01-26 14:18:07.164 | DEBUG    | __main__:trials:26 - Trial = 20826/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.166 | DEBUG    | __main__:trials:29 - Trial = 20826/30000 | Total reward = 9.99
2022-01-26 14:18:07.169 | DEBUG    | __main__:trials:26 - Trial = 20827/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.169 | DEBUG    | __main__:trials:29 - Trial = 20827/30000 | Total reward = 10.41
2022-01-26 14:18:07.172 | DEBUG    | __main__:trials:26 - Trial = 20828/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.173 | DEBUG    | __main__:trials:29 - Trial = 20828/30000 | Total reward = 34.51
2022-01-26 14:18:07.176 | DEBUG    | __main__:trials:26 - Trial = 20829/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.178 | DEBUG    | __main__:trials:29 - Trial = 20829/30000 | Total reward = 27.22
2022-01-26 14:18:07.180 | DEBUG    | __main__:trials:26 - Trial = 20830/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.182 | DEBUG    | __main__:trials:29 - Trial = 20830/30000 | Total reward = 9.99
2022-01-26 14:18:07.184 | DEBUG    | __main__:trials:26 - Trial = 20831/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.186 | DEBUG    | __main__:trials:29 - Trial = 20831/30000 | Total reward = 9.99
2022-01-26 14:18:07.190 | DEBUG    | __main__:trials:24 - Trial = 20832/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.190 | DEBUG    | __main__:trials:29 - Trial = 20832/30000 | Total reward = 47.67
2022-01-26 14:18:07.195 | DEBUG    | __main__:trials:24 - Trial = 20833/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.197 | DEBUG    | __main__:trials:29 - Trial = 20833/30000 | Total reward = 37.00
2022-01-26 14:18:07.200 | DEBUG    | __main__:trials:24 - Trial = 20834/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.202 | DEBUG    | __main__:trials:29 - Trial = 20834/30000 | Total reward = 13.28
2022-01-26 14:18:07.206 | DEBUG    | __main__:trials:26 - Trial = 20835/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.208 | DEBUG    | __main__:trials:29 - Trial = 20835/30000 | Total reward = 44.26
2022-01-26 14:18:07.211 | DEBUG    | __main__:trials:24 - Trial = 20836/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.213 | DEBUG    | __main__:trials:29 - Trial = 20836/30000 | Total reward = 1.54
2022-01-26 14:18:07.214 | DEBUG    | __main__:trials:26 - Trial = 20837/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.216 | DEBUG    | __main__:trials:29 - Trial = 20837/30000 | Total reward = 9.99
2022-01-26 14:18:07.218 | DEBUG    | __main__:trials:26 - Trial = 20838/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.219 | DEBUG    | __main__:trials:29 - Trial = 20838/30000 | Total reward = 9.99
2022-01-26 14:18:07.222 | DEBUG    | __main__:trials:26 - Trial = 20839/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.222 | DEBUG    | __main__:trials:29 - Trial = 20839/30000 | Total reward = 9.99
2022-01-26 14:18:07.226 | DEBUG    | __main__:trials:26 - Trial = 20840/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.227 | DEBUG    | __main__:trials:29 - Trial = 20840/30000 | Total reward = 9.99
2022-01-26 14:18:07.229 | DEBUG    | __main__:trials:26 - Trial = 20841/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.231 | DEBUG    | __main__:trials:29 - Trial = 20841/30000 | Total reward = 9.99
2022-01-26 14:18:07.233 | DEBUG    | __main__:trials:26 - Trial = 20842/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.234 | DEBUG    | __main__:trials:29 - Trial = 20842/30000 | Total reward = 17.80
2022-01-26 14:18:07.236 | DEBUG    | __main__:trials:26 - Trial = 20843/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.236 | DEBUG    | __main__:trials:29 - Trial = 20843/30000 | Total reward = 9.99
2022-01-26 14:18:07.239 | DEBUG    | __main__:trials:26 - Trial = 20844/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.240 | DEBUG    | __main__:trials:29 - Trial = 20844/30000 | Total reward = 4.70
2022-01-26 14:18:07.244 | DEBUG    | __main__:trials:24 - Trial = 20845/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.246 | DEBUG    | __main__:trials:29 - Trial = 20845/30000 | Total reward = 46.98
2022-01-26 14:18:07.250 | DEBUG    | __main__:trials:24 - Trial = 20846/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.252 | DEBUG    | __main__:trials:29 - Trial = 20846/30000 | Total reward = 42.70
2022-01-26 14:18:07.255 | DEBUG    | __main__:trials:24 - Trial = 20847/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.257 | DEBUG    | __main__:trials:29 - Trial = 20847/30000 | Total reward = 43.24
2022-01-26 14:18:07.261 | DEBUG    | __main__:trials:24 - Trial = 20848/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.262 | DEBUG    | __main__:trials:29 - Trial = 20848/30000 | Total reward = 41.45
2022-01-26 14:18:07.265 | DEBUG    | __main__:trials:24 - Trial = 20849/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.267 | DEBUG    | __main__:trials:29 - Trial = 20849/30000 | Total reward = 58.44
2022-01-26 14:18:07.269 | DEBUG    | __main__:trials:26 - Trial = 20850/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.270 | DEBUG    | __main__:trials:29 - Trial = 20850/30000 | Total reward = 25.36
2022-01-26 14:18:07.273 | DEBUG    | __main__:trials:24 - Trial = 20851/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.273 | DEBUG    | __main__:trials:29 - Trial = 20851/30000 | Total reward = 26.99
2022-01-26 14:18:07.277 | DEBUG    | __main__:trials:24 - Trial = 20852/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.278 | DEBUG    | __main__:trials:29 - Trial = 20852/30000 | Total reward = 53.17
2022-01-26 14:18:07.281 | DEBUG    | __main__:trials:26 - Trial = 20853/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.283 | DEBUG    | __main__:trials:29 - Trial = 20853/30000 | Total reward = 25.36
2022-01-26 14:18:07.287 | DEBUG    | __main__:trials:24 - Trial = 20854/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.288 | DEBUG    | __main__:trials:29 - Trial = 20854/30000 | Total reward = 33.39
2022-01-26 14:18:07.292 | DEBUG    | __main__:trials:26 - Trial = 20855/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.293 | DEBUG    | __main__:trials:29 - Trial = 20855/30000 | Total reward = 38.99
2022-01-26 14:18:07.296 | DEBUG    | __main__:trials:24 - Trial = 20856/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.298 | DEBUG    | __main__:trials:29 - Trial = 20856/30000 | Total reward = 51.20
2022-01-26 14:18:07.301 | DEBUG    | __main__:trials:26 - Trial = 20857/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.303 | DEBUG    | __main__:trials:29 - Trial = 20857/30000 | Total reward = 33.07
2022-01-26 14:18:07.306 | DEBUG    | __main__:trials:26 - Trial = 20858/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.307 | DEBUG    | __main__:trials:29 - Trial = 20858/30000 | Total reward = 27.88
2022-01-26 14:18:07.311 | DEBUG    | __main__:trials:24 - Trial = 20859/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.313 | DEBUG    | __main__:trials:29 - Trial = 20859/30000 | Total reward = 51.42
2022-01-26 14:18:07.316 | DEBUG    | __main__:trials:24 - Trial = 20860/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.318 | DEBUG    | __main__:trials:29 - Trial = 20860/30000 | Total reward = 39.11
2022-01-26 14:18:07.322 | DEBUG    | __main__:trials:24 - Trial = 20861/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.323 | DEBUG    | __main__:trials:29 - Trial = 20861/30000 | Total reward = 36.75
2022-01-26 14:18:07.327 | DEBUG    | __main__:trials:24 - Trial = 20862/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.328 | DEBUG    | __main__:trials:29 - Trial = 20862/30000 | Total reward = 39.95
2022-01-26 14:18:07.332 | DEBUG    | __main__:trials:24 - Trial = 20863/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.333 | DEBUG    | __main__:trials:29 - Trial = 20863/30000 | Total reward = 41.65
2022-01-26 14:18:07.337 | DEBUG    | __main__:trials:24 - Trial = 20864/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.339 | DEBUG    | __main__:trials:29 - Trial = 20864/30000 | Total reward = 37.31
2022-01-26 14:18:07.342 | DEBUG    | __main__:trials:24 - Trial = 20865/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.344 | DEBUG    | __main__:trials:29 - Trial = 20865/30000 | Total reward = 51.57
2022-01-26 14:18:07.347 | DEBUG    | __main__:trials:24 - Trial = 20866/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.349 | DEBUG    | __main__:trials:29 - Trial = 20866/30000 | Total reward = 41.13
2022-01-26 14:18:07.352 | DEBUG    | __main__:trials:24 - Trial = 20867/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.353 | DEBUG    | __main__:trials:29 - Trial = 20867/30000 | Total reward = 35.98
2022-01-26 14:18:07.357 | DEBUG    | __main__:trials:24 - Trial = 20868/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.359 | DEBUG    | __main__:trials:29 - Trial = 20868/30000 | Total reward = 39.16
2022-01-26 14:18:07.363 | DEBUG    | __main__:trials:24 - Trial = 20869/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.364 | DEBUG    | __main__:trials:29 - Trial = 20869/30000 | Total reward = 54.68
2022-01-26 14:18:07.368 | DEBUG    | __main__:trials:24 - Trial = 20870/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.369 | DEBUG    | __main__:trials:29 - Trial = 20870/30000 | Total reward = 44.76
2022-01-26 14:18:07.373 | DEBUG    | __main__:trials:24 - Trial = 20871/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.374 | DEBUG    | __main__:trials:29 - Trial = 20871/30000 | Total reward = 41.95
2022-01-26 14:18:07.379 | DEBUG    | __main__:trials:24 - Trial = 20872/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.381 | DEBUG    | __main__:trials:29 - Trial = 20872/30000 | Total reward = 40.69
2022-01-26 14:18:07.385 | DEBUG    | __main__:trials:24 - Trial = 20873/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.387 | DEBUG    | __main__:trials:29 - Trial = 20873/30000 | Total reward = 41.99
2022-01-26 14:18:07.391 | DEBUG    | __main__:trials:24 - Trial = 20874/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.393 | DEBUG    | __main__:trials:29 - Trial = 20874/30000 | Total reward = 51.83
2022-01-26 14:18:07.396 | DEBUG    | __main__:trials:24 - Trial = 20875/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.397 | DEBUG    | __main__:trials:29 - Trial = 20875/30000 | Total reward = 53.52
2022-01-26 14:18:07.400 | DEBUG    | __main__:trials:24 - Trial = 20876/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.402 | DEBUG    | __main__:trials:29 - Trial = 20876/30000 | Total reward = 40.80
2022-01-26 14:18:07.405 | DEBUG    | __main__:trials:24 - Trial = 20877/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.406 | DEBUG    | __main__:trials:29 - Trial = 20877/30000 | Total reward = 36.49
2022-01-26 14:18:07.409 | DEBUG    | __main__:trials:24 - Trial = 20878/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.410 | DEBUG    | __main__:trials:29 - Trial = 20878/30000 | Total reward = 33.48
2022-01-26 14:18:07.413 | DEBUG    | __main__:trials:24 - Trial = 20879/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.415 | DEBUG    | __main__:trials:29 - Trial = 20879/30000 | Total reward = 37.86
2022-01-26 14:18:07.419 | DEBUG    | __main__:trials:24 - Trial = 20880/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.419 | DEBUG    | __main__:trials:29 - Trial = 20880/30000 | Total reward = 38.56
2022-01-26 14:18:07.424 | DEBUG    | __main__:trials:24 - Trial = 20881/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.425 | DEBUG    | __main__:trials:29 - Trial = 20881/30000 | Total reward = 38.29
2022-01-26 14:18:07.429 | DEBUG    | __main__:trials:24 - Trial = 20882/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.431 | DEBUG    | __main__:trials:29 - Trial = 20882/30000 | Total reward = 47.22
2022-01-26 14:18:07.435 | DEBUG    | __main__:trials:24 - Trial = 20883/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.436 | DEBUG    | __main__:trials:29 - Trial = 20883/30000 | Total reward = 46.34
2022-01-26 14:18:07.440 | DEBUG    | __main__:trials:24 - Trial = 20884/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.442 | DEBUG    | __main__:trials:29 - Trial = 20884/30000 | Total reward = 41.11
2022-01-26 14:18:07.446 | DEBUG    | __main__:trials:24 - Trial = 20885/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.446 | DEBUG    | __main__:trials:29 - Trial = 20885/30000 | Total reward = 56.27
2022-01-26 14:18:07.450 | DEBUG    | __main__:trials:24 - Trial = 20886/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.452 | DEBUG    | __main__:trials:29 - Trial = 20886/30000 | Total reward = 44.74
2022-01-26 14:18:07.455 | DEBUG    | __main__:trials:24 - Trial = 20887/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.456 | DEBUG    | __main__:trials:29 - Trial = 20887/30000 | Total reward = 44.66
2022-01-26 14:18:07.460 | DEBUG    | __main__:trials:24 - Trial = 20888/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.461 | DEBUG    | __main__:trials:29 - Trial = 20888/30000 | Total reward = 58.36
2022-01-26 14:18:07.465 | DEBUG    | __main__:trials:24 - Trial = 20889/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.467 | DEBUG    | __main__:trials:29 - Trial = 20889/30000 | Total reward = 36.35
2022-01-26 14:18:07.470 | DEBUG    | __main__:trials:24 - Trial = 20890/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.472 | DEBUG    | __main__:trials:29 - Trial = 20890/30000 | Total reward = 44.86
2022-01-26 14:18:07.476 | DEBUG    | __main__:trials:24 - Trial = 20891/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.477 | DEBUG    | __main__:trials:29 - Trial = 20891/30000 | Total reward = 36.88
2022-01-26 14:18:07.481 | DEBUG    | __main__:trials:24 - Trial = 20892/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.482 | DEBUG    | __main__:trials:29 - Trial = 20892/30000 | Total reward = 41.91
2022-01-26 14:18:07.485 | DEBUG    | __main__:trials:24 - Trial = 20893/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.486 | DEBUG    | __main__:trials:29 - Trial = 20893/30000 | Total reward = 56.40
2022-01-26 14:18:07.490 | DEBUG    | __main__:trials:24 - Trial = 20894/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.492 | DEBUG    | __main__:trials:29 - Trial = 20894/30000 | Total reward = 35.85
2022-01-26 14:18:07.496 | DEBUG    | __main__:trials:24 - Trial = 20895/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.496 | DEBUG    | __main__:trials:29 - Trial = 20895/30000 | Total reward = 32.00
2022-01-26 14:18:07.501 | DEBUG    | __main__:trials:24 - Trial = 20896/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.502 | DEBUG    | __main__:trials:29 - Trial = 20896/30000 | Total reward = 34.53
2022-01-26 14:18:07.506 | DEBUG    | __main__:trials:24 - Trial = 20897/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.507 | DEBUG    | __main__:trials:29 - Trial = 20897/30000 | Total reward = 38.30
2022-01-26 14:18:07.510 | DEBUG    | __main__:trials:24 - Trial = 20898/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.512 | DEBUG    | __main__:trials:29 - Trial = 20898/30000 | Total reward = 38.23
2022-01-26 14:18:07.516 | DEBUG    | __main__:trials:24 - Trial = 20899/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.517 | DEBUG    | __main__:trials:29 - Trial = 20899/30000 | Total reward = 41.31
2022-01-26 14:18:07.520 | DEBUG    | __main__:trials:24 - Trial = 20900/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.522 | DEBUG    | __main__:trials:29 - Trial = 20900/30000 | Total reward = 38.34
2022-01-26 14:18:07.526 | DEBUG    | __main__:trials:24 - Trial = 20901/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.527 | DEBUG    | __main__:trials:29 - Trial = 20901/30000 | Total reward = 37.53
2022-01-26 14:18:07.531 | DEBUG    | __main__:trials:24 - Trial = 20902/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.532 | DEBUG    | __main__:trials:29 - Trial = 20902/30000 | Total reward = 36.34
2022-01-26 14:18:07.536 | DEBUG    | __main__:trials:24 - Trial = 20903/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.538 | DEBUG    | __main__:trials:29 - Trial = 20903/30000 | Total reward = 32.69
2022-01-26 14:18:07.541 | DEBUG    | __main__:trials:24 - Trial = 20904/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.542 | DEBUG    | __main__:trials:29 - Trial = 20904/30000 | Total reward = 37.76
2022-01-26 14:18:07.546 | DEBUG    | __main__:trials:24 - Trial = 20905/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.547 | DEBUG    | __main__:trials:29 - Trial = 20905/30000 | Total reward = 43.42
2022-01-26 14:18:07.551 | DEBUG    | __main__:trials:24 - Trial = 20906/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.553 | DEBUG    | __main__:trials:29 - Trial = 20906/30000 | Total reward = 41.40
2022-01-26 14:18:07.556 | DEBUG    | __main__:trials:24 - Trial = 20907/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.558 | DEBUG    | __main__:trials:29 - Trial = 20907/30000 | Total reward = 43.58
2022-01-26 14:18:07.562 | DEBUG    | __main__:trials:24 - Trial = 20908/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.564 | DEBUG    | __main__:trials:29 - Trial = 20908/30000 | Total reward = 49.87
2022-01-26 14:18:07.567 | DEBUG    | __main__:trials:24 - Trial = 20909/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.568 | DEBUG    | __main__:trials:29 - Trial = 20909/30000 | Total reward = 61.49
2022-01-26 14:18:07.572 | DEBUG    | __main__:trials:24 - Trial = 20910/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.573 | DEBUG    | __main__:trials:29 - Trial = 20910/30000 | Total reward = 39.57
2022-01-26 14:18:07.577 | DEBUG    | __main__:trials:24 - Trial = 20911/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.578 | DEBUG    | __main__:trials:29 - Trial = 20911/30000 | Total reward = 37.93
2022-01-26 14:18:07.581 | DEBUG    | __main__:trials:24 - Trial = 20912/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.582 | DEBUG    | __main__:trials:29 - Trial = 20912/30000 | Total reward = 39.57
2022-01-26 14:18:07.585 | DEBUG    | __main__:trials:24 - Trial = 20913/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.587 | DEBUG    | __main__:trials:29 - Trial = 20913/30000 | Total reward = 33.33
2022-01-26 14:18:07.591 | DEBUG    | __main__:trials:24 - Trial = 20914/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.591 | DEBUG    | __main__:trials:29 - Trial = 20914/30000 | Total reward = 31.03
2022-01-26 14:18:07.596 | DEBUG    | __main__:trials:24 - Trial = 20915/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.597 | DEBUG    | __main__:trials:29 - Trial = 20915/30000 | Total reward = 44.78
2022-01-26 14:18:07.601 | DEBUG    | __main__:trials:24 - Trial = 20916/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.603 | DEBUG    | __main__:trials:29 - Trial = 20916/30000 | Total reward = 59.12
2022-01-26 14:18:07.606 | DEBUG    | __main__:trials:24 - Trial = 20917/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.608 | DEBUG    | __main__:trials:29 - Trial = 20917/30000 | Total reward = 39.64
2022-01-26 14:18:07.611 | DEBUG    | __main__:trials:24 - Trial = 20918/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.613 | DEBUG    | __main__:trials:29 - Trial = 20918/30000 | Total reward = 36.29
2022-01-26 14:18:07.617 | DEBUG    | __main__:trials:24 - Trial = 20919/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.618 | DEBUG    | __main__:trials:29 - Trial = 20919/30000 | Total reward = 35.18
2022-01-26 14:18:07.622 | DEBUG    | __main__:trials:24 - Trial = 20920/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.623 | DEBUG    | __main__:trials:29 - Trial = 20920/30000 | Total reward = 42.37
2022-01-26 14:18:07.627 | DEBUG    | __main__:trials:24 - Trial = 20921/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.628 | DEBUG    | __main__:trials:29 - Trial = 20921/30000 | Total reward = 36.97
2022-01-26 14:18:07.633 | DEBUG    | __main__:trials:24 - Trial = 20922/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.633 | DEBUG    | __main__:trials:29 - Trial = 20922/30000 | Total reward = 38.10
2022-01-26 14:18:07.637 | DEBUG    | __main__:trials:24 - Trial = 20923/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.638 | DEBUG    | __main__:trials:29 - Trial = 20923/30000 | Total reward = 38.79
2022-01-26 14:18:07.641 | DEBUG    | __main__:trials:24 - Trial = 20924/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.642 | DEBUG    | __main__:trials:29 - Trial = 20924/30000 | Total reward = 39.62
2022-01-26 14:18:07.645 | DEBUG    | __main__:trials:24 - Trial = 20925/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.647 | DEBUG    | __main__:trials:29 - Trial = 20925/30000 | Total reward = 37.91
2022-01-26 14:18:07.651 | DEBUG    | __main__:trials:24 - Trial = 20926/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.652 | DEBUG    | __main__:trials:29 - Trial = 20926/30000 | Total reward = 44.20
2022-01-26 14:18:07.656 | DEBUG    | __main__:trials:24 - Trial = 20927/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.657 | DEBUG    | __main__:trials:29 - Trial = 20927/30000 | Total reward = 53.61
2022-01-26 14:18:07.661 | DEBUG    | __main__:trials:24 - Trial = 20928/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.662 | DEBUG    | __main__:trials:29 - Trial = 20928/30000 | Total reward = 48.49
2022-01-26 14:18:07.665 | DEBUG    | __main__:trials:24 - Trial = 20929/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.666 | DEBUG    | __main__:trials:29 - Trial = 20929/30000 | Total reward = 47.68
2022-01-26 14:18:07.670 | DEBUG    | __main__:trials:24 - Trial = 20930/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.672 | DEBUG    | __main__:trials:29 - Trial = 20930/30000 | Total reward = 55.64
2022-01-26 14:18:07.676 | DEBUG    | __main__:trials:24 - Trial = 20931/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.678 | DEBUG    | __main__:trials:29 - Trial = 20931/30000 | Total reward = 42.75
2022-01-26 14:18:07.681 | DEBUG    | __main__:trials:24 - Trial = 20932/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.682 | DEBUG    | __main__:trials:29 - Trial = 20932/30000 | Total reward = 44.08
2022-01-26 14:18:07.686 | DEBUG    | __main__:trials:24 - Trial = 20933/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.687 | DEBUG    | __main__:trials:29 - Trial = 20933/30000 | Total reward = 45.29
2022-01-26 14:18:07.692 | DEBUG    | __main__:trials:24 - Trial = 20934/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.692 | DEBUG    | __main__:trials:29 - Trial = 20934/30000 | Total reward = 51.53
2022-01-26 14:18:07.697 | DEBUG    | __main__:trials:24 - Trial = 20935/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.697 | DEBUG    | __main__:trials:29 - Trial = 20935/30000 | Total reward = 50.65
2022-01-26 14:18:07.701 | DEBUG    | __main__:trials:24 - Trial = 20936/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.702 | DEBUG    | __main__:trials:29 - Trial = 20936/30000 | Total reward = 40.46
2022-01-26 14:18:07.706 | DEBUG    | __main__:trials:24 - Trial = 20937/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.707 | DEBUG    | __main__:trials:29 - Trial = 20937/30000 | Total reward = 53.23
2022-01-26 14:18:07.710 | DEBUG    | __main__:trials:24 - Trial = 20938/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.712 | DEBUG    | __main__:trials:29 - Trial = 20938/30000 | Total reward = 49.91
2022-01-26 14:18:07.716 | DEBUG    | __main__:trials:24 - Trial = 20939/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.717 | DEBUG    | __main__:trials:29 - Trial = 20939/30000 | Total reward = 40.27
2022-01-26 14:18:07.720 | DEBUG    | __main__:trials:24 - Trial = 20940/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.722 | DEBUG    | __main__:trials:29 - Trial = 20940/30000 | Total reward = 35.14
2022-01-26 14:18:07.726 | DEBUG    | __main__:trials:24 - Trial = 20941/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.727 | DEBUG    | __main__:trials:29 - Trial = 20941/30000 | Total reward = 46.00
2022-01-26 14:18:07.731 | DEBUG    | __main__:trials:24 - Trial = 20942/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.731 | DEBUG    | __main__:trials:29 - Trial = 20942/30000 | Total reward = 41.38
2022-01-26 14:18:07.736 | DEBUG    | __main__:trials:24 - Trial = 20943/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.737 | DEBUG    | __main__:trials:29 - Trial = 20943/30000 | Total reward = 37.78
2022-01-26 14:18:07.741 | DEBUG    | __main__:trials:24 - Trial = 20944/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.742 | DEBUG    | __main__:trials:29 - Trial = 20944/30000 | Total reward = 31.35
2022-01-26 14:18:07.746 | DEBUG    | __main__:trials:24 - Trial = 20945/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.747 | DEBUG    | __main__:trials:29 - Trial = 20945/30000 | Total reward = 39.57
2022-01-26 14:18:07.751 | DEBUG    | __main__:trials:24 - Trial = 20946/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.753 | DEBUG    | __main__:trials:29 - Trial = 20946/30000 | Total reward = 35.07
2022-01-26 14:18:07.756 | DEBUG    | __main__:trials:24 - Trial = 20947/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.757 | DEBUG    | __main__:trials:29 - Trial = 20947/30000 | Total reward = 40.75
2022-01-26 14:18:07.761 | DEBUG    | __main__:trials:24 - Trial = 20948/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.761 | DEBUG    | __main__:trials:29 - Trial = 20948/30000 | Total reward = 36.97
2022-01-26 14:18:07.765 | DEBUG    | __main__:trials:24 - Trial = 20949/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.766 | DEBUG    | __main__:trials:29 - Trial = 20949/30000 | Total reward = 49.00
2022-01-26 14:18:07.769 | DEBUG    | __main__:trials:24 - Trial = 20950/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.770 | DEBUG    | __main__:trials:29 - Trial = 20950/30000 | Total reward = 43.64
2022-01-26 14:18:07.774 | DEBUG    | __main__:trials:24 - Trial = 20951/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.776 | DEBUG    | __main__:trials:29 - Trial = 20951/30000 | Total reward = 38.09
2022-01-26 14:18:07.780 | DEBUG    | __main__:trials:24 - Trial = 20952/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.781 | DEBUG    | __main__:trials:29 - Trial = 20952/30000 | Total reward = 39.10
2022-01-26 14:18:07.784 | DEBUG    | __main__:trials:24 - Trial = 20953/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.786 | DEBUG    | __main__:trials:29 - Trial = 20953/30000 | Total reward = 39.72
2022-01-26 14:18:07.790 | DEBUG    | __main__:trials:24 - Trial = 20954/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.791 | DEBUG    | __main__:trials:29 - Trial = 20954/30000 | Total reward = 45.99
2022-01-26 14:18:07.795 | DEBUG    | __main__:trials:24 - Trial = 20955/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.796 | DEBUG    | __main__:trials:29 - Trial = 20955/30000 | Total reward = 40.28
2022-01-26 14:18:07.800 | DEBUG    | __main__:trials:24 - Trial = 20956/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.801 | DEBUG    | __main__:trials:29 - Trial = 20956/30000 | Total reward = 36.04
2022-01-26 14:18:07.805 | DEBUG    | __main__:trials:24 - Trial = 20957/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.807 | DEBUG    | __main__:trials:29 - Trial = 20957/30000 | Total reward = 33.77
2022-01-26 14:18:07.811 | DEBUG    | __main__:trials:24 - Trial = 20958/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.812 | DEBUG    | __main__:trials:29 - Trial = 20958/30000 | Total reward = 54.88
2022-01-26 14:18:07.816 | DEBUG    | __main__:trials:24 - Trial = 20959/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.818 | DEBUG    | __main__:trials:29 - Trial = 20959/30000 | Total reward = 29.53
2022-01-26 14:18:07.822 | DEBUG    | __main__:trials:24 - Trial = 20960/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.822 | DEBUG    | __main__:trials:29 - Trial = 20960/30000 | Total reward = 34.89
2022-01-26 14:18:07.827 | DEBUG    | __main__:trials:24 - Trial = 20961/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.829 | DEBUG    | __main__:trials:29 - Trial = 20961/30000 | Total reward = 44.61
2022-01-26 14:18:07.832 | DEBUG    | __main__:trials:24 - Trial = 20962/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.833 | DEBUG    | __main__:trials:29 - Trial = 20962/30000 | Total reward = 42.34
2022-01-26 14:18:07.838 | DEBUG    | __main__:trials:24 - Trial = 20963/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.839 | DEBUG    | __main__:trials:29 - Trial = 20963/30000 | Total reward = 53.57
2022-01-26 14:18:07.844 | DEBUG    | __main__:trials:24 - Trial = 20964/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.845 | DEBUG    | __main__:trials:29 - Trial = 20964/30000 | Total reward = 39.61
2022-01-26 14:18:07.849 | DEBUG    | __main__:trials:24 - Trial = 20965/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.850 | DEBUG    | __main__:trials:29 - Trial = 20965/30000 | Total reward = 32.15
2022-01-26 14:18:07.854 | DEBUG    | __main__:trials:24 - Trial = 20966/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.856 | DEBUG    | __main__:trials:29 - Trial = 20966/30000 | Total reward = 40.11
2022-01-26 14:18:07.859 | DEBUG    | __main__:trials:24 - Trial = 20967/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.861 | DEBUG    | __main__:trials:29 - Trial = 20967/30000 | Total reward = 20.21
2022-01-26 14:18:07.864 | DEBUG    | __main__:trials:24 - Trial = 20968/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.866 | DEBUG    | __main__:trials:29 - Trial = 20968/30000 | Total reward = 43.37
2022-01-26 14:18:07.869 | DEBUG    | __main__:trials:24 - Trial = 20969/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.871 | DEBUG    | __main__:trials:29 - Trial = 20969/30000 | Total reward = 48.55
2022-01-26 14:18:07.875 | DEBUG    | __main__:trials:24 - Trial = 20970/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.876 | DEBUG    | __main__:trials:29 - Trial = 20970/30000 | Total reward = 34.72
2022-01-26 14:18:07.880 | DEBUG    | __main__:trials:24 - Trial = 20971/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.881 | DEBUG    | __main__:trials:29 - Trial = 20971/30000 | Total reward = 38.05
2022-01-26 14:18:07.886 | DEBUG    | __main__:trials:24 - Trial = 20972/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.886 | DEBUG    | __main__:trials:29 - Trial = 20972/30000 | Total reward = 30.20
2022-01-26 14:18:07.890 | DEBUG    | __main__:trials:26 - Trial = 20973/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.891 | DEBUG    | __main__:trials:29 - Trial = 20973/30000 | Total reward = 18.36
2022-01-26 14:18:07.895 | DEBUG    | __main__:trials:24 - Trial = 20974/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.896 | DEBUG    | __main__:trials:29 - Trial = 20974/30000 | Total reward = 36.26
2022-01-26 14:18:07.900 | DEBUG    | __main__:trials:24 - Trial = 20975/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.901 | DEBUG    | __main__:trials:29 - Trial = 20975/30000 | Total reward = 48.42
2022-01-26 14:18:07.906 | DEBUG    | __main__:trials:24 - Trial = 20976/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.907 | DEBUG    | __main__:trials:29 - Trial = 20976/30000 | Total reward = 35.17
2022-01-26 14:18:07.912 | DEBUG    | __main__:trials:24 - Trial = 20977/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.913 | DEBUG    | __main__:trials:29 - Trial = 20977/30000 | Total reward = 23.87
2022-01-26 14:18:07.916 | DEBUG    | __main__:trials:24 - Trial = 20978/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.918 | DEBUG    | __main__:trials:29 - Trial = 20978/30000 | Total reward = 39.57
2022-01-26 14:18:07.922 | DEBUG    | __main__:trials:24 - Trial = 20979/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.923 | DEBUG    | __main__:trials:29 - Trial = 20979/30000 | Total reward = 36.91
2022-01-26 14:18:07.927 | DEBUG    | __main__:trials:24 - Trial = 20980/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.928 | DEBUG    | __main__:trials:29 - Trial = 20980/30000 | Total reward = 39.64
2022-01-26 14:18:07.932 | DEBUG    | __main__:trials:24 - Trial = 20981/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.932 | DEBUG    | __main__:trials:29 - Trial = 20981/30000 | Total reward = 37.47
2022-01-26 14:18:07.936 | DEBUG    | __main__:trials:24 - Trial = 20982/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.938 | DEBUG    | __main__:trials:29 - Trial = 20982/30000 | Total reward = 28.89
2022-01-26 14:18:07.941 | DEBUG    | __main__:trials:24 - Trial = 20983/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.943 | DEBUG    | __main__:trials:29 - Trial = 20983/30000 | Total reward = 39.57
2022-01-26 14:18:07.947 | DEBUG    | __main__:trials:24 - Trial = 20984/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.947 | DEBUG    | __main__:trials:29 - Trial = 20984/30000 | Total reward = 39.58
2022-01-26 14:18:07.951 | DEBUG    | __main__:trials:24 - Trial = 20985/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.952 | DEBUG    | __main__:trials:29 - Trial = 20985/30000 | Total reward = 43.91
2022-01-26 14:18:07.956 | DEBUG    | __main__:trials:24 - Trial = 20986/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.958 | DEBUG    | __main__:trials:29 - Trial = 20986/30000 | Total reward = 36.94
2022-01-26 14:18:07.961 | DEBUG    | __main__:trials:24 - Trial = 20987/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.963 | DEBUG    | __main__:trials:29 - Trial = 20987/30000 | Total reward = 35.11
2022-01-26 14:18:07.967 | DEBUG    | __main__:trials:24 - Trial = 20988/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.968 | DEBUG    | __main__:trials:29 - Trial = 20988/30000 | Total reward = 31.99
2022-01-26 14:18:07.972 | DEBUG    | __main__:trials:24 - Trial = 20989/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.973 | DEBUG    | __main__:trials:29 - Trial = 20989/30000 | Total reward = 38.87
2022-01-26 14:18:07.977 | DEBUG    | __main__:trials:26 - Trial = 20990/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:07.978 | DEBUG    | __main__:trials:29 - Trial = 20990/30000 | Total reward = 43.37
2022-01-26 14:18:07.983 | DEBUG    | __main__:trials:24 - Trial = 20991/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.984 | DEBUG    | __main__:trials:29 - Trial = 20991/30000 | Total reward = 46.82
2022-01-26 14:18:07.988 | DEBUG    | __main__:trials:24 - Trial = 20992/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.990 | DEBUG    | __main__:trials:29 - Trial = 20992/30000 | Total reward = 39.80
2022-01-26 14:18:07.994 | DEBUG    | __main__:trials:24 - Trial = 20993/30000 | Max number of steps (20) reached
2022-01-26 14:18:07.994 | DEBUG    | __main__:trials:29 - Trial = 20993/30000 | Total reward = 39.01
2022-01-26 14:18:07.999 | DEBUG    | __main__:trials:24 - Trial = 20994/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.000 | DEBUG    | __main__:trials:29 - Trial = 20994/30000 | Total reward = 40.77
2022-01-26 14:18:08.004 | DEBUG    | __main__:trials:24 - Trial = 20995/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.005 | DEBUG    | __main__:trials:29 - Trial = 20995/30000 | Total reward = 47.44
2022-01-26 14:18:08.008 | DEBUG    | __main__:trials:24 - Trial = 20996/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.010 | DEBUG    | __main__:trials:29 - Trial = 20996/30000 | Total reward = 35.54
2022-01-26 14:18:08.013 | DEBUG    | __main__:trials:24 - Trial = 20997/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.014 | DEBUG    | __main__:trials:29 - Trial = 20997/30000 | Total reward = 48.04
2022-01-26 14:18:08.017 | DEBUG    | __main__:trials:26 - Trial = 20998/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.017 | DEBUG    | __main__:trials:29 - Trial = 20998/30000 | Total reward = 25.78
2022-01-26 14:18:08.022 | DEBUG    | __main__:trials:24 - Trial = 20999/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.022 | DEBUG    | __main__:trials:29 - Trial = 20999/30000 | Total reward = 41.22
2022-01-26 14:18:08.027 | DEBUG    | __main__:trials:24 - Trial = 21000/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.027 | DEBUG    | __main__:trials:29 - Trial = 21000/30000 | Total reward = 39.10
2022-01-26 14:18:08.032 | DEBUG    | __main__:trials:24 - Trial = 21001/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.034 | DEBUG    | __main__:trials:29 - Trial = 21001/30000 | Total reward = 50.28
2022-01-26 14:18:08.038 | DEBUG    | __main__:trials:24 - Trial = 21002/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.039 | DEBUG    | __main__:trials:29 - Trial = 21002/30000 | Total reward = 38.92
2022-01-26 14:18:08.043 | DEBUG    | __main__:trials:24 - Trial = 21003/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.044 | DEBUG    | __main__:trials:29 - Trial = 21003/30000 | Total reward = 31.82
2022-01-26 14:18:08.048 | DEBUG    | __main__:trials:24 - Trial = 21004/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.049 | DEBUG    | __main__:trials:29 - Trial = 21004/30000 | Total reward = 40.05
2022-01-26 14:18:08.053 | DEBUG    | __main__:trials:24 - Trial = 21005/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.055 | DEBUG    | __main__:trials:29 - Trial = 21005/30000 | Total reward = 38.87
2022-01-26 14:18:08.059 | DEBUG    | __main__:trials:24 - Trial = 21006/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.059 | DEBUG    | __main__:trials:29 - Trial = 21006/30000 | Total reward = 40.98
2022-01-26 14:18:08.063 | DEBUG    | __main__:trials:24 - Trial = 21007/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.064 | DEBUG    | __main__:trials:29 - Trial = 21007/30000 | Total reward = 44.81
2022-01-26 14:18:08.068 | DEBUG    | __main__:trials:24 - Trial = 21008/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.070 | DEBUG    | __main__:trials:29 - Trial = 21008/30000 | Total reward = 39.52
2022-01-26 14:18:08.074 | DEBUG    | __main__:trials:24 - Trial = 21009/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.075 | DEBUG    | __main__:trials:29 - Trial = 21009/30000 | Total reward = 48.82
2022-01-26 14:18:08.079 | DEBUG    | __main__:trials:24 - Trial = 21010/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.080 | DEBUG    | __main__:trials:29 - Trial = 21010/30000 | Total reward = 35.26
2022-01-26 14:18:08.084 | DEBUG    | __main__:trials:24 - Trial = 21011/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.085 | DEBUG    | __main__:trials:29 - Trial = 21011/30000 | Total reward = 46.36
2022-01-26 14:18:08.089 | DEBUG    | __main__:trials:24 - Trial = 21012/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.090 | DEBUG    | __main__:trials:29 - Trial = 21012/30000 | Total reward = 47.61
2022-01-26 14:18:08.093 | DEBUG    | __main__:trials:24 - Trial = 21013/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.094 | DEBUG    | __main__:trials:29 - Trial = 21013/30000 | Total reward = 39.10
2022-01-26 14:18:08.097 | DEBUG    | __main__:trials:24 - Trial = 21014/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.099 | DEBUG    | __main__:trials:29 - Trial = 21014/30000 | Total reward = 39.36
2022-01-26 14:18:08.102 | DEBUG    | __main__:trials:24 - Trial = 21015/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.103 | DEBUG    | __main__:trials:29 - Trial = 21015/30000 | Total reward = 41.70
2022-01-26 14:18:08.107 | DEBUG    | __main__:trials:24 - Trial = 21016/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.108 | DEBUG    | __main__:trials:29 - Trial = 21016/30000 | Total reward = 34.28
2022-01-26 14:18:08.112 | DEBUG    | __main__:trials:24 - Trial = 21017/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.114 | DEBUG    | __main__:trials:29 - Trial = 21017/30000 | Total reward = 36.07
2022-01-26 14:18:08.117 | DEBUG    | __main__:trials:24 - Trial = 21018/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.118 | DEBUG    | __main__:trials:29 - Trial = 21018/30000 | Total reward = 55.36
2022-01-26 14:18:08.123 | DEBUG    | __main__:trials:24 - Trial = 21019/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.124 | DEBUG    | __main__:trials:29 - Trial = 21019/30000 | Total reward = 31.84
2022-01-26 14:18:08.128 | DEBUG    | __main__:trials:24 - Trial = 21020/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.129 | DEBUG    | __main__:trials:29 - Trial = 21020/30000 | Total reward = 39.96
2022-01-26 14:18:08.134 | DEBUG    | __main__:trials:24 - Trial = 21021/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.135 | DEBUG    | __main__:trials:29 - Trial = 21021/30000 | Total reward = 37.94
2022-01-26 14:18:08.139 | DEBUG    | __main__:trials:24 - Trial = 21022/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.140 | DEBUG    | __main__:trials:29 - Trial = 21022/30000 | Total reward = 36.85
2022-01-26 14:18:08.145 | DEBUG    | __main__:trials:24 - Trial = 21023/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.146 | DEBUG    | __main__:trials:29 - Trial = 21023/30000 | Total reward = 42.37
2022-01-26 14:18:08.150 | DEBUG    | __main__:trials:24 - Trial = 21024/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.151 | DEBUG    | __main__:trials:29 - Trial = 21024/30000 | Total reward = 37.71
2022-01-26 14:18:08.155 | DEBUG    | __main__:trials:24 - Trial = 21025/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.156 | DEBUG    | __main__:trials:29 - Trial = 21025/30000 | Total reward = 47.39
2022-01-26 14:18:08.161 | DEBUG    | __main__:trials:24 - Trial = 21026/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.161 | DEBUG    | __main__:trials:29 - Trial = 21026/30000 | Total reward = 37.09
2022-01-26 14:18:08.166 | DEBUG    | __main__:trials:24 - Trial = 21027/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.167 | DEBUG    | __main__:trials:29 - Trial = 21027/30000 | Total reward = 34.58
2022-01-26 14:18:08.171 | DEBUG    | __main__:trials:24 - Trial = 21028/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.172 | DEBUG    | __main__:trials:29 - Trial = 21028/30000 | Total reward = 41.97
2022-01-26 14:18:08.176 | DEBUG    | __main__:trials:26 - Trial = 21029/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.177 | DEBUG    | __main__:trials:29 - Trial = 21029/30000 | Total reward = 33.22
2022-01-26 14:18:08.181 | DEBUG    | __main__:trials:24 - Trial = 21030/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.183 | DEBUG    | __main__:trials:29 - Trial = 21030/30000 | Total reward = 43.88
2022-01-26 14:18:08.187 | DEBUG    | __main__:trials:24 - Trial = 21031/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.188 | DEBUG    | __main__:trials:29 - Trial = 21031/30000 | Total reward = 34.27
2022-01-26 14:18:08.191 | DEBUG    | __main__:trials:26 - Trial = 21032/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.192 | DEBUG    | __main__:trials:29 - Trial = 21032/30000 | Total reward = 23.18
2022-01-26 14:18:08.196 | DEBUG    | __main__:trials:24 - Trial = 21033/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.198 | DEBUG    | __main__:trials:29 - Trial = 21033/30000 | Total reward = 39.57
2022-01-26 14:18:08.202 | DEBUG    | __main__:trials:24 - Trial = 21034/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.203 | DEBUG    | __main__:trials:29 - Trial = 21034/30000 | Total reward = 40.71
2022-01-26 14:18:08.206 | DEBUG    | __main__:trials:24 - Trial = 21035/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.208 | DEBUG    | __main__:trials:29 - Trial = 21035/30000 | Total reward = 45.52
2022-01-26 14:18:08.211 | DEBUG    | __main__:trials:24 - Trial = 21036/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.213 | DEBUG    | __main__:trials:29 - Trial = 21036/30000 | Total reward = 43.11
2022-01-26 14:18:08.216 | DEBUG    | __main__:trials:24 - Trial = 21037/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.218 | DEBUG    | __main__:trials:29 - Trial = 21037/30000 | Total reward = 60.89
2022-01-26 14:18:08.222 | DEBUG    | __main__:trials:24 - Trial = 21038/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.223 | DEBUG    | __main__:trials:29 - Trial = 21038/30000 | Total reward = 31.96
2022-01-26 14:18:08.226 | DEBUG    | __main__:trials:24 - Trial = 21039/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.227 | DEBUG    | __main__:trials:29 - Trial = 21039/30000 | Total reward = 34.70
2022-01-26 14:18:08.231 | DEBUG    | __main__:trials:24 - Trial = 21040/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.233 | DEBUG    | __main__:trials:29 - Trial = 21040/30000 | Total reward = 46.18
2022-01-26 14:18:08.236 | DEBUG    | __main__:trials:24 - Trial = 21041/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.238 | DEBUG    | __main__:trials:29 - Trial = 21041/30000 | Total reward = 39.92
2022-01-26 14:18:08.242 | DEBUG    | __main__:trials:24 - Trial = 21042/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.242 | DEBUG    | __main__:trials:29 - Trial = 21042/30000 | Total reward = 44.20
2022-01-26 14:18:08.247 | DEBUG    | __main__:trials:24 - Trial = 21043/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.248 | DEBUG    | __main__:trials:29 - Trial = 21043/30000 | Total reward = 45.66
2022-01-26 14:18:08.252 | DEBUG    | __main__:trials:24 - Trial = 21044/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.252 | DEBUG    | __main__:trials:29 - Trial = 21044/30000 | Total reward = 42.72
2022-01-26 14:18:08.256 | DEBUG    | __main__:trials:24 - Trial = 21045/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.258 | DEBUG    | __main__:trials:29 - Trial = 21045/30000 | Total reward = 45.26
2022-01-26 14:18:08.262 | DEBUG    | __main__:trials:24 - Trial = 21046/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.262 | DEBUG    | __main__:trials:29 - Trial = 21046/30000 | Total reward = 51.44
2022-01-26 14:18:08.267 | DEBUG    | __main__:trials:24 - Trial = 21047/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.267 | DEBUG    | __main__:trials:29 - Trial = 21047/30000 | Total reward = 44.91
2022-01-26 14:18:08.272 | DEBUG    | __main__:trials:24 - Trial = 21048/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.273 | DEBUG    | __main__:trials:29 - Trial = 21048/30000 | Total reward = 37.96
2022-01-26 14:18:08.277 | DEBUG    | __main__:trials:24 - Trial = 21049/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.279 | DEBUG    | __main__:trials:29 - Trial = 21049/30000 | Total reward = 40.31
2022-01-26 14:18:08.283 | DEBUG    | __main__:trials:24 - Trial = 21050/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.283 | DEBUG    | __main__:trials:29 - Trial = 21050/30000 | Total reward = 34.00
2022-01-26 14:18:08.288 | DEBUG    | __main__:trials:24 - Trial = 21051/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.289 | DEBUG    | __main__:trials:29 - Trial = 21051/30000 | Total reward = 40.94
2022-01-26 14:18:08.293 | DEBUG    | __main__:trials:24 - Trial = 21052/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.294 | DEBUG    | __main__:trials:29 - Trial = 21052/30000 | Total reward = 23.66
2022-01-26 14:18:08.297 | DEBUG    | __main__:trials:24 - Trial = 21053/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.298 | DEBUG    | __main__:trials:29 - Trial = 21053/30000 | Total reward = 31.69
2022-01-26 14:18:08.301 | DEBUG    | __main__:trials:24 - Trial = 21054/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.303 | DEBUG    | __main__:trials:29 - Trial = 21054/30000 | Total reward = 47.08
2022-01-26 14:18:08.307 | DEBUG    | __main__:trials:24 - Trial = 21055/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.308 | DEBUG    | __main__:trials:29 - Trial = 21055/30000 | Total reward = 42.97
2022-01-26 14:18:08.312 | DEBUG    | __main__:trials:24 - Trial = 21056/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.313 | DEBUG    | __main__:trials:29 - Trial = 21056/30000 | Total reward = 46.93
2022-01-26 14:18:08.317 | DEBUG    | __main__:trials:24 - Trial = 21057/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.318 | DEBUG    | __main__:trials:29 - Trial = 21057/30000 | Total reward = 38.69
2022-01-26 14:18:08.321 | DEBUG    | __main__:trials:24 - Trial = 21058/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.322 | DEBUG    | __main__:trials:29 - Trial = 21058/30000 | Total reward = 43.98
2022-01-26 14:18:08.326 | DEBUG    | __main__:trials:24 - Trial = 21059/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.327 | DEBUG    | __main__:trials:29 - Trial = 21059/30000 | Total reward = 52.98
2022-01-26 14:18:08.330 | DEBUG    | __main__:trials:26 - Trial = 21060/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.331 | DEBUG    | __main__:trials:29 - Trial = 21060/30000 | Total reward = 27.57
2022-01-26 14:18:08.335 | DEBUG    | __main__:trials:24 - Trial = 21061/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.335 | DEBUG    | __main__:trials:29 - Trial = 21061/30000 | Total reward = 39.28
2022-01-26 14:18:08.339 | DEBUG    | __main__:trials:24 - Trial = 21062/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.341 | DEBUG    | __main__:trials:29 - Trial = 21062/30000 | Total reward = 38.54
2022-01-26 14:18:08.344 | DEBUG    | __main__:trials:24 - Trial = 21063/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.345 | DEBUG    | __main__:trials:29 - Trial = 21063/30000 | Total reward = 43.74
2022-01-26 14:18:08.348 | DEBUG    | __main__:trials:24 - Trial = 21064/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.350 | DEBUG    | __main__:trials:29 - Trial = 21064/30000 | Total reward = 23.51
2022-01-26 14:18:08.354 | DEBUG    | __main__:trials:24 - Trial = 21065/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.355 | DEBUG    | __main__:trials:29 - Trial = 21065/30000 | Total reward = 49.25
2022-01-26 14:18:08.359 | DEBUG    | __main__:trials:24 - Trial = 21066/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.361 | DEBUG    | __main__:trials:29 - Trial = 21066/30000 | Total reward = 60.08
2022-01-26 14:18:08.364 | DEBUG    | __main__:trials:24 - Trial = 21067/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.366 | DEBUG    | __main__:trials:29 - Trial = 21067/30000 | Total reward = 36.30
2022-01-26 14:18:08.369 | DEBUG    | __main__:trials:24 - Trial = 21068/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.370 | DEBUG    | __main__:trials:29 - Trial = 21068/30000 | Total reward = 34.73
2022-01-26 14:18:08.373 | DEBUG    | __main__:trials:26 - Trial = 21069/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.375 | DEBUG    | __main__:trials:29 - Trial = 21069/30000 | Total reward = 26.94
2022-01-26 14:18:08.378 | DEBUG    | __main__:trials:24 - Trial = 21070/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.380 | DEBUG    | __main__:trials:29 - Trial = 21070/30000 | Total reward = 35.50
2022-01-26 14:18:08.383 | DEBUG    | __main__:trials:24 - Trial = 21071/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.384 | DEBUG    | __main__:trials:29 - Trial = 21071/30000 | Total reward = 45.05
2022-01-26 14:18:08.388 | DEBUG    | __main__:trials:24 - Trial = 21072/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.390 | DEBUG    | __main__:trials:29 - Trial = 21072/30000 | Total reward = 33.31
2022-01-26 14:18:08.393 | DEBUG    | __main__:trials:24 - Trial = 21073/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.395 | DEBUG    | __main__:trials:29 - Trial = 21073/30000 | Total reward = 34.85
2022-01-26 14:18:08.399 | DEBUG    | __main__:trials:24 - Trial = 21074/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.399 | DEBUG    | __main__:trials:29 - Trial = 21074/30000 | Total reward = 38.33
2022-01-26 14:18:08.404 | DEBUG    | __main__:trials:24 - Trial = 21075/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.405 | DEBUG    | __main__:trials:29 - Trial = 21075/30000 | Total reward = 39.88
2022-01-26 14:18:08.408 | DEBUG    | __main__:trials:24 - Trial = 21076/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.410 | DEBUG    | __main__:trials:29 - Trial = 21076/30000 | Total reward = 38.39
2022-01-26 14:18:08.414 | DEBUG    | __main__:trials:24 - Trial = 21077/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.415 | DEBUG    | __main__:trials:29 - Trial = 21077/30000 | Total reward = 46.19
2022-01-26 14:18:08.419 | DEBUG    | __main__:trials:24 - Trial = 21078/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.420 | DEBUG    | __main__:trials:29 - Trial = 21078/30000 | Total reward = 38.39
2022-01-26 14:18:08.424 | DEBUG    | __main__:trials:24 - Trial = 21079/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.426 | DEBUG    | __main__:trials:29 - Trial = 21079/30000 | Total reward = 39.61
2022-01-26 14:18:08.428 | DEBUG    | __main__:trials:26 - Trial = 21080/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.430 | DEBUG    | __main__:trials:29 - Trial = 21080/30000 | Total reward = 23.53
2022-01-26 14:18:08.433 | DEBUG    | __main__:trials:24 - Trial = 21081/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.433 | DEBUG    | __main__:trials:29 - Trial = 21081/30000 | Total reward = 44.86
2022-01-26 14:18:08.438 | DEBUG    | __main__:trials:24 - Trial = 21082/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.438 | DEBUG    | __main__:trials:29 - Trial = 21082/30000 | Total reward = 40.10
2022-01-26 14:18:08.443 | DEBUG    | __main__:trials:24 - Trial = 21083/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.444 | DEBUG    | __main__:trials:29 - Trial = 21083/30000 | Total reward = 42.48
2022-01-26 14:18:08.448 | DEBUG    | __main__:trials:24 - Trial = 21084/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.450 | DEBUG    | __main__:trials:29 - Trial = 21084/30000 | Total reward = 42.54
2022-01-26 14:18:08.454 | DEBUG    | __main__:trials:24 - Trial = 21085/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.456 | DEBUG    | __main__:trials:29 - Trial = 21085/30000 | Total reward = 46.11
2022-01-26 14:18:08.460 | DEBUG    | __main__:trials:24 - Trial = 21086/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.461 | DEBUG    | __main__:trials:29 - Trial = 21086/30000 | Total reward = 47.73
2022-01-26 14:18:08.465 | DEBUG    | __main__:trials:24 - Trial = 21087/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.467 | DEBUG    | __main__:trials:29 - Trial = 21087/30000 | Total reward = 32.84
2022-01-26 14:18:08.470 | DEBUG    | __main__:trials:24 - Trial = 21088/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.472 | DEBUG    | __main__:trials:29 - Trial = 21088/30000 | Total reward = 39.57
2022-01-26 14:18:08.476 | DEBUG    | __main__:trials:24 - Trial = 21089/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.477 | DEBUG    | __main__:trials:29 - Trial = 21089/30000 | Total reward = 43.06
2022-01-26 14:18:08.481 | DEBUG    | __main__:trials:24 - Trial = 21090/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.483 | DEBUG    | __main__:trials:29 - Trial = 21090/30000 | Total reward = 39.91
2022-01-26 14:18:08.487 | DEBUG    | __main__:trials:24 - Trial = 21091/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.488 | DEBUG    | __main__:trials:29 - Trial = 21091/30000 | Total reward = 43.03
2022-01-26 14:18:08.491 | DEBUG    | __main__:trials:24 - Trial = 21092/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.493 | DEBUG    | __main__:trials:29 - Trial = 21092/30000 | Total reward = 41.28
2022-01-26 14:18:08.496 | DEBUG    | __main__:trials:24 - Trial = 21093/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.498 | DEBUG    | __main__:trials:29 - Trial = 21093/30000 | Total reward = 43.27
2022-01-26 14:18:08.502 | DEBUG    | __main__:trials:26 - Trial = 21094/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.504 | DEBUG    | __main__:trials:29 - Trial = 21094/30000 | Total reward = 37.27
2022-01-26 14:18:08.508 | DEBUG    | __main__:trials:24 - Trial = 21095/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.508 | DEBUG    | __main__:trials:29 - Trial = 21095/30000 | Total reward = 27.68
2022-01-26 14:18:08.512 | DEBUG    | __main__:trials:24 - Trial = 21096/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.513 | DEBUG    | __main__:trials:29 - Trial = 21096/30000 | Total reward = 36.09
2022-01-26 14:18:08.517 | DEBUG    | __main__:trials:24 - Trial = 21097/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.518 | DEBUG    | __main__:trials:29 - Trial = 21097/30000 | Total reward = 38.47
2022-01-26 14:18:08.521 | DEBUG    | __main__:trials:24 - Trial = 21098/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.523 | DEBUG    | __main__:trials:29 - Trial = 21098/30000 | Total reward = 25.00
2022-01-26 14:18:08.526 | DEBUG    | __main__:trials:24 - Trial = 21099/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.528 | DEBUG    | __main__:trials:29 - Trial = 21099/30000 | Total reward = 34.65
2022-01-26 14:18:08.531 | DEBUG    | __main__:trials:24 - Trial = 21100/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.533 | DEBUG    | __main__:trials:29 - Trial = 21100/30000 | Total reward = 40.08
2022-01-26 14:18:08.536 | DEBUG    | __main__:trials:24 - Trial = 21101/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.538 | DEBUG    | __main__:trials:29 - Trial = 21101/30000 | Total reward = 52.53
2022-01-26 14:18:08.542 | DEBUG    | __main__:trials:24 - Trial = 21102/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.542 | DEBUG    | __main__:trials:29 - Trial = 21102/30000 | Total reward = 35.46
2022-01-26 14:18:08.547 | DEBUG    | __main__:trials:24 - Trial = 21103/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.548 | DEBUG    | __main__:trials:29 - Trial = 21103/30000 | Total reward = 31.96
2022-01-26 14:18:08.552 | DEBUG    | __main__:trials:24 - Trial = 21104/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.553 | DEBUG    | __main__:trials:29 - Trial = 21104/30000 | Total reward = 31.23
2022-01-26 14:18:08.558 | DEBUG    | __main__:trials:24 - Trial = 21105/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.559 | DEBUG    | __main__:trials:29 - Trial = 21105/30000 | Total reward = 41.15
2022-01-26 14:18:08.563 | DEBUG    | __main__:trials:24 - Trial = 21106/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.565 | DEBUG    | __main__:trials:29 - Trial = 21106/30000 | Total reward = 41.40
2022-01-26 14:18:08.568 | DEBUG    | __main__:trials:24 - Trial = 21107/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.570 | DEBUG    | __main__:trials:29 - Trial = 21107/30000 | Total reward = 46.50
2022-01-26 14:18:08.574 | DEBUG    | __main__:trials:24 - Trial = 21108/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.575 | DEBUG    | __main__:trials:29 - Trial = 21108/30000 | Total reward = 30.16
2022-01-26 14:18:08.578 | DEBUG    | __main__:trials:24 - Trial = 21109/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.580 | DEBUG    | __main__:trials:29 - Trial = 21109/30000 | Total reward = 38.99
2022-01-26 14:18:08.584 | DEBUG    | __main__:trials:24 - Trial = 21110/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.585 | DEBUG    | __main__:trials:29 - Trial = 21110/30000 | Total reward = 38.92
2022-01-26 14:18:08.589 | DEBUG    | __main__:trials:24 - Trial = 21111/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.590 | DEBUG    | __main__:trials:29 - Trial = 21111/30000 | Total reward = 49.71
2022-01-26 14:18:08.594 | DEBUG    | __main__:trials:24 - Trial = 21112/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.596 | DEBUG    | __main__:trials:29 - Trial = 21112/30000 | Total reward = 39.54
2022-01-26 14:18:08.599 | DEBUG    | __main__:trials:24 - Trial = 21113/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.601 | DEBUG    | __main__:trials:29 - Trial = 21113/30000 | Total reward = 26.70
2022-01-26 14:18:08.605 | DEBUG    | __main__:trials:24 - Trial = 21114/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.606 | DEBUG    | __main__:trials:29 - Trial = 21114/30000 | Total reward = 39.57
2022-01-26 14:18:08.610 | DEBUG    | __main__:trials:24 - Trial = 21115/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.611 | DEBUG    | __main__:trials:29 - Trial = 21115/30000 | Total reward = 51.92
2022-01-26 14:18:08.615 | DEBUG    | __main__:trials:24 - Trial = 21116/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.616 | DEBUG    | __main__:trials:29 - Trial = 21116/30000 | Total reward = 39.20
2022-01-26 14:18:08.620 | DEBUG    | __main__:trials:24 - Trial = 21117/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.622 | DEBUG    | __main__:trials:29 - Trial = 21117/30000 | Total reward = 36.65
2022-01-26 14:18:08.625 | DEBUG    | __main__:trials:24 - Trial = 21118/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.626 | DEBUG    | __main__:trials:29 - Trial = 21118/30000 | Total reward = 39.30
2022-01-26 14:18:08.629 | DEBUG    | __main__:trials:24 - Trial = 21119/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.631 | DEBUG    | __main__:trials:29 - Trial = 21119/30000 | Total reward = 35.87
2022-01-26 14:18:08.634 | DEBUG    | __main__:trials:24 - Trial = 21120/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.635 | DEBUG    | __main__:trials:29 - Trial = 21120/30000 | Total reward = 39.73
2022-01-26 14:18:08.639 | DEBUG    | __main__:trials:24 - Trial = 21121/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.641 | DEBUG    | __main__:trials:29 - Trial = 21121/30000 | Total reward = 37.17
2022-01-26 14:18:08.644 | DEBUG    | __main__:trials:24 - Trial = 21122/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.646 | DEBUG    | __main__:trials:29 - Trial = 21122/30000 | Total reward = 41.74
2022-01-26 14:18:08.650 | DEBUG    | __main__:trials:24 - Trial = 21123/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.651 | DEBUG    | __main__:trials:29 - Trial = 21123/30000 | Total reward = 39.06
2022-01-26 14:18:08.655 | DEBUG    | __main__:trials:24 - Trial = 21124/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.657 | DEBUG    | __main__:trials:29 - Trial = 21124/30000 | Total reward = 39.41
2022-01-26 14:18:08.660 | DEBUG    | __main__:trials:24 - Trial = 21125/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.662 | DEBUG    | __main__:trials:29 - Trial = 21125/30000 | Total reward = 39.57
2022-01-26 14:18:08.665 | DEBUG    | __main__:trials:24 - Trial = 21126/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.667 | DEBUG    | __main__:trials:29 - Trial = 21126/30000 | Total reward = 34.54
2022-01-26 14:18:08.671 | DEBUG    | __main__:trials:24 - Trial = 21127/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.672 | DEBUG    | __main__:trials:29 - Trial = 21127/30000 | Total reward = 56.10
2022-01-26 14:18:08.675 | DEBUG    | __main__:trials:24 - Trial = 21128/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.677 | DEBUG    | __main__:trials:29 - Trial = 21128/30000 | Total reward = 41.45
2022-01-26 14:18:08.680 | DEBUG    | __main__:trials:24 - Trial = 21129/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.682 | DEBUG    | __main__:trials:29 - Trial = 21129/30000 | Total reward = 39.29
2022-01-26 14:18:08.686 | DEBUG    | __main__:trials:24 - Trial = 21130/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.688 | DEBUG    | __main__:trials:29 - Trial = 21130/30000 | Total reward = 48.82
2022-01-26 14:18:08.691 | DEBUG    | __main__:trials:26 - Trial = 21131/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.692 | DEBUG    | __main__:trials:29 - Trial = 21131/30000 | Total reward = 23.49
2022-01-26 14:18:08.696 | DEBUG    | __main__:trials:24 - Trial = 21132/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.697 | DEBUG    | __main__:trials:29 - Trial = 21132/30000 | Total reward = 52.91
2022-01-26 14:18:08.701 | DEBUG    | __main__:trials:24 - Trial = 21133/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.703 | DEBUG    | __main__:trials:29 - Trial = 21133/30000 | Total reward = 40.27
2022-01-26 14:18:08.706 | DEBUG    | __main__:trials:24 - Trial = 21134/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.708 | DEBUG    | __main__:trials:29 - Trial = 21134/30000 | Total reward = 44.66
2022-01-26 14:18:08.712 | DEBUG    | __main__:trials:26 - Trial = 21135/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.713 | DEBUG    | __main__:trials:29 - Trial = 21135/30000 | Total reward = 28.23
2022-01-26 14:18:08.716 | DEBUG    | __main__:trials:26 - Trial = 21136/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.717 | DEBUG    | __main__:trials:29 - Trial = 21136/30000 | Total reward = 31.89
2022-01-26 14:18:08.720 | DEBUG    | __main__:trials:26 - Trial = 21137/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.721 | DEBUG    | __main__:trials:29 - Trial = 21137/30000 | Total reward = 28.60
2022-01-26 14:18:08.724 | DEBUG    | __main__:trials:24 - Trial = 21138/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.726 | DEBUG    | __main__:trials:29 - Trial = 21138/30000 | Total reward = 50.22
2022-01-26 14:18:08.729 | DEBUG    | __main__:trials:24 - Trial = 21139/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.731 | DEBUG    | __main__:trials:29 - Trial = 21139/30000 | Total reward = 44.54
2022-01-26 14:18:08.735 | DEBUG    | __main__:trials:24 - Trial = 21140/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.736 | DEBUG    | __main__:trials:29 - Trial = 21140/30000 | Total reward = 38.97
2022-01-26 14:18:08.740 | DEBUG    | __main__:trials:24 - Trial = 21141/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.741 | DEBUG    | __main__:trials:29 - Trial = 21141/30000 | Total reward = 40.33
2022-01-26 14:18:08.745 | DEBUG    | __main__:trials:24 - Trial = 21142/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.746 | DEBUG    | __main__:trials:29 - Trial = 21142/30000 | Total reward = 41.42
2022-01-26 14:18:08.749 | DEBUG    | __main__:trials:24 - Trial = 21143/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.750 | DEBUG    | __main__:trials:29 - Trial = 21143/30000 | Total reward = 36.12
2022-01-26 14:18:08.753 | DEBUG    | __main__:trials:24 - Trial = 21144/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.754 | DEBUG    | __main__:trials:29 - Trial = 21144/30000 | Total reward = 42.56
2022-01-26 14:18:08.759 | DEBUG    | __main__:trials:24 - Trial = 21145/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.760 | DEBUG    | __main__:trials:29 - Trial = 21145/30000 | Total reward = 48.93
2022-01-26 14:18:08.764 | DEBUG    | __main__:trials:24 - Trial = 21146/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.765 | DEBUG    | __main__:trials:29 - Trial = 21146/30000 | Total reward = 49.00
2022-01-26 14:18:08.769 | DEBUG    | __main__:trials:24 - Trial = 21147/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.771 | DEBUG    | __main__:trials:29 - Trial = 21147/30000 | Total reward = 46.12
2022-01-26 14:18:08.774 | DEBUG    | __main__:trials:24 - Trial = 21148/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.776 | DEBUG    | __main__:trials:29 - Trial = 21148/30000 | Total reward = 44.43
2022-01-26 14:18:08.779 | DEBUG    | __main__:trials:24 - Trial = 21149/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.781 | DEBUG    | __main__:trials:29 - Trial = 21149/30000 | Total reward = 47.07
2022-01-26 14:18:08.784 | DEBUG    | __main__:trials:24 - Trial = 21150/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.786 | DEBUG    | __main__:trials:29 - Trial = 21150/30000 | Total reward = 55.62
2022-01-26 14:18:08.790 | DEBUG    | __main__:trials:24 - Trial = 21151/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.791 | DEBUG    | __main__:trials:29 - Trial = 21151/30000 | Total reward = 63.56
2022-01-26 14:18:08.795 | DEBUG    | __main__:trials:24 - Trial = 21152/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.796 | DEBUG    | __main__:trials:29 - Trial = 21152/30000 | Total reward = 39.57
2022-01-26 14:18:08.799 | DEBUG    | __main__:trials:24 - Trial = 21153/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.801 | DEBUG    | __main__:trials:29 - Trial = 21153/30000 | Total reward = 52.54
2022-01-26 14:18:08.805 | DEBUG    | __main__:trials:24 - Trial = 21154/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.806 | DEBUG    | __main__:trials:29 - Trial = 21154/30000 | Total reward = 41.55
2022-01-26 14:18:08.810 | DEBUG    | __main__:trials:24 - Trial = 21155/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.811 | DEBUG    | __main__:trials:29 - Trial = 21155/30000 | Total reward = 39.95
2022-01-26 14:18:08.815 | DEBUG    | __main__:trials:24 - Trial = 21156/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.816 | DEBUG    | __main__:trials:29 - Trial = 21156/30000 | Total reward = 43.51
2022-01-26 14:18:08.820 | DEBUG    | __main__:trials:24 - Trial = 21157/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.821 | DEBUG    | __main__:trials:29 - Trial = 21157/30000 | Total reward = 53.01
2022-01-26 14:18:08.825 | DEBUG    | __main__:trials:24 - Trial = 21158/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.825 | DEBUG    | __main__:trials:29 - Trial = 21158/30000 | Total reward = 55.49
2022-01-26 14:18:08.830 | DEBUG    | __main__:trials:24 - Trial = 21159/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.830 | DEBUG    | __main__:trials:29 - Trial = 21159/30000 | Total reward = 52.24
2022-01-26 14:18:08.834 | DEBUG    | __main__:trials:24 - Trial = 21160/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.834 | DEBUG    | __main__:trials:29 - Trial = 21160/30000 | Total reward = 55.34
2022-01-26 14:18:08.838 | DEBUG    | __main__:trials:24 - Trial = 21161/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.839 | DEBUG    | __main__:trials:29 - Trial = 21161/30000 | Total reward = 63.57
2022-01-26 14:18:08.843 | DEBUG    | __main__:trials:24 - Trial = 21162/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.844 | DEBUG    | __main__:trials:29 - Trial = 21162/30000 | Total reward = 52.74
2022-01-26 14:18:08.848 | DEBUG    | __main__:trials:24 - Trial = 21163/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.850 | DEBUG    | __main__:trials:29 - Trial = 21163/30000 | Total reward = 53.23
2022-01-26 14:18:08.853 | DEBUG    | __main__:trials:24 - Trial = 21164/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.855 | DEBUG    | __main__:trials:29 - Trial = 21164/30000 | Total reward = 44.29
2022-01-26 14:18:08.858 | DEBUG    | __main__:trials:24 - Trial = 21165/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.860 | DEBUG    | __main__:trials:29 - Trial = 21165/30000 | Total reward = 50.10
2022-01-26 14:18:08.864 | DEBUG    | __main__:trials:24 - Trial = 21166/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.865 | DEBUG    | __main__:trials:29 - Trial = 21166/30000 | Total reward = 52.50
2022-01-26 14:18:08.868 | DEBUG    | __main__:trials:24 - Trial = 21167/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.870 | DEBUG    | __main__:trials:29 - Trial = 21167/30000 | Total reward = 55.28
2022-01-26 14:18:08.874 | DEBUG    | __main__:trials:24 - Trial = 21168/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.875 | DEBUG    | __main__:trials:29 - Trial = 21168/30000 | Total reward = 62.79
2022-01-26 14:18:08.878 | DEBUG    | __main__:trials:26 - Trial = 21169/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.879 | DEBUG    | __main__:trials:29 - Trial = 21169/30000 | Total reward = 31.51
2022-01-26 14:18:08.883 | DEBUG    | __main__:trials:24 - Trial = 21170/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.884 | DEBUG    | __main__:trials:29 - Trial = 21170/30000 | Total reward = 37.63
2022-01-26 14:18:08.888 | DEBUG    | __main__:trials:24 - Trial = 21171/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.890 | DEBUG    | __main__:trials:29 - Trial = 21171/30000 | Total reward = 39.03
2022-01-26 14:18:08.891 | DEBUG    | __main__:trials:26 - Trial = 21172/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.892 | DEBUG    | __main__:trials:29 - Trial = 21172/30000 | Total reward = 12.29
2022-01-26 14:18:08.896 | DEBUG    | __main__:trials:24 - Trial = 21173/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.897 | DEBUG    | __main__:trials:29 - Trial = 21173/30000 | Total reward = 31.94
2022-01-26 14:18:08.901 | DEBUG    | __main__:trials:24 - Trial = 21174/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.902 | DEBUG    | __main__:trials:29 - Trial = 21174/30000 | Total reward = 38.48
2022-01-26 14:18:08.905 | DEBUG    | __main__:trials:26 - Trial = 21175/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.906 | DEBUG    | __main__:trials:29 - Trial = 21175/30000 | Total reward = 22.42
2022-01-26 14:18:08.910 | DEBUG    | __main__:trials:26 - Trial = 21176/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.911 | DEBUG    | __main__:trials:29 - Trial = 21176/30000 | Total reward = 31.93
2022-01-26 14:18:08.914 | DEBUG    | __main__:trials:24 - Trial = 21177/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.916 | DEBUG    | __main__:trials:29 - Trial = 21177/30000 | Total reward = 39.93
2022-01-26 14:18:08.919 | DEBUG    | __main__:trials:24 - Trial = 21178/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.921 | DEBUG    | __main__:trials:29 - Trial = 21178/30000 | Total reward = 36.68
2022-01-26 14:18:08.924 | DEBUG    | __main__:trials:24 - Trial = 21179/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.926 | DEBUG    | __main__:trials:29 - Trial = 21179/30000 | Total reward = 38.33
2022-01-26 14:18:08.930 | DEBUG    | __main__:trials:24 - Trial = 21180/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.931 | DEBUG    | __main__:trials:29 - Trial = 21180/30000 | Total reward = 35.17
2022-01-26 14:18:08.935 | DEBUG    | __main__:trials:24 - Trial = 21181/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.935 | DEBUG    | __main__:trials:29 - Trial = 21181/30000 | Total reward = 47.06
2022-01-26 14:18:08.939 | DEBUG    | __main__:trials:26 - Trial = 21182/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:08.940 | DEBUG    | __main__:trials:29 - Trial = 21182/30000 | Total reward = 16.29
2022-01-26 14:18:08.943 | DEBUG    | __main__:trials:24 - Trial = 21183/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.945 | DEBUG    | __main__:trials:29 - Trial = 21183/30000 | Total reward = 56.06
2022-01-26 14:18:08.948 | DEBUG    | __main__:trials:24 - Trial = 21184/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.950 | DEBUG    | __main__:trials:29 - Trial = 21184/30000 | Total reward = 29.32
2022-01-26 14:18:08.953 | DEBUG    | __main__:trials:24 - Trial = 21185/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.955 | DEBUG    | __main__:trials:29 - Trial = 21185/30000 | Total reward = 38.07
2022-01-26 14:18:08.958 | DEBUG    | __main__:trials:24 - Trial = 21186/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.959 | DEBUG    | __main__:trials:29 - Trial = 21186/30000 | Total reward = 35.70
2022-01-26 14:18:08.963 | DEBUG    | __main__:trials:24 - Trial = 21187/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.965 | DEBUG    | __main__:trials:29 - Trial = 21187/30000 | Total reward = 47.27
2022-01-26 14:18:08.969 | DEBUG    | __main__:trials:24 - Trial = 21188/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.969 | DEBUG    | __main__:trials:29 - Trial = 21188/30000 | Total reward = 45.07
2022-01-26 14:18:08.973 | DEBUG    | __main__:trials:24 - Trial = 21189/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.975 | DEBUG    | __main__:trials:29 - Trial = 21189/30000 | Total reward = 36.87
2022-01-26 14:18:08.979 | DEBUG    | __main__:trials:24 - Trial = 21190/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.979 | DEBUG    | __main__:trials:29 - Trial = 21190/30000 | Total reward = 44.27
2022-01-26 14:18:08.984 | DEBUG    | __main__:trials:24 - Trial = 21191/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.984 | DEBUG    | __main__:trials:29 - Trial = 21191/30000 | Total reward = 52.51
2022-01-26 14:18:08.989 | DEBUG    | __main__:trials:24 - Trial = 21192/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.989 | DEBUG    | __main__:trials:29 - Trial = 21192/30000 | Total reward = 43.51
2022-01-26 14:18:08.993 | DEBUG    | __main__:trials:24 - Trial = 21193/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.993 | DEBUG    | __main__:trials:29 - Trial = 21193/30000 | Total reward = 34.62
2022-01-26 14:18:08.997 | DEBUG    | __main__:trials:24 - Trial = 21194/30000 | Max number of steps (20) reached
2022-01-26 14:18:08.998 | DEBUG    | __main__:trials:29 - Trial = 21194/30000 | Total reward = 33.29
2022-01-26 14:18:09.001 | DEBUG    | __main__:trials:24 - Trial = 21195/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.003 | DEBUG    | __main__:trials:29 - Trial = 21195/30000 | Total reward = 53.16
2022-01-26 14:18:09.006 | DEBUG    | __main__:trials:24 - Trial = 21196/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.007 | DEBUG    | __main__:trials:29 - Trial = 21196/30000 | Total reward = 46.73
2022-01-26 14:18:09.010 | DEBUG    | __main__:trials:24 - Trial = 21197/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.011 | DEBUG    | __main__:trials:29 - Trial = 21197/30000 | Total reward = 44.15
2022-01-26 14:18:09.014 | DEBUG    | __main__:trials:24 - Trial = 21198/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.015 | DEBUG    | __main__:trials:29 - Trial = 21198/30000 | Total reward = 51.79
2022-01-26 14:18:09.019 | DEBUG    | __main__:trials:24 - Trial = 21199/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.021 | DEBUG    | __main__:trials:29 - Trial = 21199/30000 | Total reward = 53.28
2022-01-26 14:18:09.024 | DEBUG    | __main__:trials:24 - Trial = 21200/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.026 | DEBUG    | __main__:trials:29 - Trial = 21200/30000 | Total reward = 46.98
2022-01-26 14:18:09.029 | DEBUG    | __main__:trials:24 - Trial = 21201/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.030 | DEBUG    | __main__:trials:29 - Trial = 21201/30000 | Total reward = 53.51
2022-01-26 14:18:09.034 | DEBUG    | __main__:trials:24 - Trial = 21202/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.036 | DEBUG    | __main__:trials:29 - Trial = 21202/30000 | Total reward = 35.79
2022-01-26 14:18:09.040 | DEBUG    | __main__:trials:24 - Trial = 21203/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.042 | DEBUG    | __main__:trials:29 - Trial = 21203/30000 | Total reward = 37.07
2022-01-26 14:18:09.046 | DEBUG    | __main__:trials:24 - Trial = 21204/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.046 | DEBUG    | __main__:trials:29 - Trial = 21204/30000 | Total reward = 36.02
2022-01-26 14:18:09.050 | DEBUG    | __main__:trials:24 - Trial = 21205/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.052 | DEBUG    | __main__:trials:29 - Trial = 21205/30000 | Total reward = 51.93
2022-01-26 14:18:09.055 | DEBUG    | __main__:trials:24 - Trial = 21206/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.057 | DEBUG    | __main__:trials:29 - Trial = 21206/30000 | Total reward = 45.65
2022-01-26 14:18:09.060 | DEBUG    | __main__:trials:24 - Trial = 21207/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.061 | DEBUG    | __main__:trials:29 - Trial = 21207/30000 | Total reward = 41.57
2022-01-26 14:18:09.065 | DEBUG    | __main__:trials:24 - Trial = 21208/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.066 | DEBUG    | __main__:trials:29 - Trial = 21208/30000 | Total reward = 49.16
2022-01-26 14:18:09.069 | DEBUG    | __main__:trials:26 - Trial = 21209/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.069 | DEBUG    | __main__:trials:29 - Trial = 21209/30000 | Total reward = 29.31
2022-01-26 14:18:09.073 | DEBUG    | __main__:trials:24 - Trial = 21210/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.074 | DEBUG    | __main__:trials:29 - Trial = 21210/30000 | Total reward = 54.07
2022-01-26 14:18:09.078 | DEBUG    | __main__:trials:24 - Trial = 21211/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.079 | DEBUG    | __main__:trials:29 - Trial = 21211/30000 | Total reward = 39.88
2022-01-26 14:18:09.083 | DEBUG    | __main__:trials:24 - Trial = 21212/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.084 | DEBUG    | __main__:trials:29 - Trial = 21212/30000 | Total reward = 57.70
2022-01-26 14:18:09.088 | DEBUG    | __main__:trials:26 - Trial = 21213/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.089 | DEBUG    | __main__:trials:29 - Trial = 21213/30000 | Total reward = 27.43
2022-01-26 14:18:09.093 | DEBUG    | __main__:trials:24 - Trial = 21214/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.094 | DEBUG    | __main__:trials:29 - Trial = 21214/30000 | Total reward = 41.18
2022-01-26 14:18:09.098 | DEBUG    | __main__:trials:24 - Trial = 21215/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.100 | DEBUG    | __main__:trials:29 - Trial = 21215/30000 | Total reward = 37.06
2022-01-26 14:18:09.103 | DEBUG    | __main__:trials:24 - Trial = 21216/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.105 | DEBUG    | __main__:trials:29 - Trial = 21216/30000 | Total reward = 38.08
2022-01-26 14:18:09.108 | DEBUG    | __main__:trials:24 - Trial = 21217/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.110 | DEBUG    | __main__:trials:29 - Trial = 21217/30000 | Total reward = 32.43
2022-01-26 14:18:09.113 | DEBUG    | __main__:trials:24 - Trial = 21218/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.113 | DEBUG    | __main__:trials:29 - Trial = 21218/30000 | Total reward = 39.61
2022-01-26 14:18:09.118 | DEBUG    | __main__:trials:24 - Trial = 21219/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.119 | DEBUG    | __main__:trials:29 - Trial = 21219/30000 | Total reward = 37.75
2022-01-26 14:18:09.123 | DEBUG    | __main__:trials:24 - Trial = 21220/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.124 | DEBUG    | __main__:trials:29 - Trial = 21220/30000 | Total reward = 30.09
2022-01-26 14:18:09.127 | DEBUG    | __main__:trials:24 - Trial = 21221/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.129 | DEBUG    | __main__:trials:29 - Trial = 21221/30000 | Total reward = 36.64
2022-01-26 14:18:09.132 | DEBUG    | __main__:trials:24 - Trial = 21222/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.134 | DEBUG    | __main__:trials:29 - Trial = 21222/30000 | Total reward = 41.70
2022-01-26 14:18:09.137 | DEBUG    | __main__:trials:24 - Trial = 21223/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.139 | DEBUG    | __main__:trials:29 - Trial = 21223/30000 | Total reward = 40.66
2022-01-26 14:18:09.143 | DEBUG    | __main__:trials:24 - Trial = 21224/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.143 | DEBUG    | __main__:trials:29 - Trial = 21224/30000 | Total reward = 42.31
2022-01-26 14:18:09.147 | DEBUG    | __main__:trials:26 - Trial = 21225/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.148 | DEBUG    | __main__:trials:29 - Trial = 21225/30000 | Total reward = 37.94
2022-01-26 14:18:09.152 | DEBUG    | __main__:trials:24 - Trial = 21226/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.153 | DEBUG    | __main__:trials:29 - Trial = 21226/30000 | Total reward = 37.31
2022-01-26 14:18:09.157 | DEBUG    | __main__:trials:24 - Trial = 21227/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.159 | DEBUG    | __main__:trials:29 - Trial = 21227/30000 | Total reward = 49.78
2022-01-26 14:18:09.163 | DEBUG    | __main__:trials:24 - Trial = 21228/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.164 | DEBUG    | __main__:trials:29 - Trial = 21228/30000 | Total reward = 47.59
2022-01-26 14:18:09.167 | DEBUG    | __main__:trials:24 - Trial = 21229/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.169 | DEBUG    | __main__:trials:29 - Trial = 21229/30000 | Total reward = 60.94
2022-01-26 14:18:09.172 | DEBUG    | __main__:trials:24 - Trial = 21230/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.174 | DEBUG    | __main__:trials:29 - Trial = 21230/30000 | Total reward = 42.20
2022-01-26 14:18:09.177 | DEBUG    | __main__:trials:24 - Trial = 21231/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.179 | DEBUG    | __main__:trials:29 - Trial = 21231/30000 | Total reward = 38.92
2022-01-26 14:18:09.183 | DEBUG    | __main__:trials:24 - Trial = 21232/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.184 | DEBUG    | __main__:trials:29 - Trial = 21232/30000 | Total reward = 44.76
2022-01-26 14:18:09.188 | DEBUG    | __main__:trials:24 - Trial = 21233/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.189 | DEBUG    | __main__:trials:29 - Trial = 21233/30000 | Total reward = 33.73
2022-01-26 14:18:09.193 | DEBUG    | __main__:trials:24 - Trial = 21234/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.193 | DEBUG    | __main__:trials:29 - Trial = 21234/30000 | Total reward = 43.37
2022-01-26 14:18:09.198 | DEBUG    | __main__:trials:24 - Trial = 21235/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.199 | DEBUG    | __main__:trials:29 - Trial = 21235/30000 | Total reward = 45.17
2022-01-26 14:18:09.203 | DEBUG    | __main__:trials:24 - Trial = 21236/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.204 | DEBUG    | __main__:trials:29 - Trial = 21236/30000 | Total reward = 35.43
2022-01-26 14:18:09.207 | DEBUG    | __main__:trials:24 - Trial = 21237/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.209 | DEBUG    | __main__:trials:29 - Trial = 21237/30000 | Total reward = 47.94
2022-01-26 14:18:09.213 | DEBUG    | __main__:trials:24 - Trial = 21238/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.214 | DEBUG    | __main__:trials:29 - Trial = 21238/30000 | Total reward = 36.54
2022-01-26 14:18:09.217 | DEBUG    | __main__:trials:24 - Trial = 21239/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.218 | DEBUG    | __main__:trials:29 - Trial = 21239/30000 | Total reward = 36.48
2022-01-26 14:18:09.222 | DEBUG    | __main__:trials:24 - Trial = 21240/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.224 | DEBUG    | __main__:trials:29 - Trial = 21240/30000 | Total reward = 46.52
2022-01-26 14:18:09.227 | DEBUG    | __main__:trials:24 - Trial = 21241/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.229 | DEBUG    | __main__:trials:29 - Trial = 21241/30000 | Total reward = 57.63
2022-01-26 14:18:09.232 | DEBUG    | __main__:trials:26 - Trial = 21242/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.233 | DEBUG    | __main__:trials:29 - Trial = 21242/30000 | Total reward = 33.71
2022-01-26 14:18:09.236 | DEBUG    | __main__:trials:24 - Trial = 21243/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.238 | DEBUG    | __main__:trials:29 - Trial = 21243/30000 | Total reward = 41.09
2022-01-26 14:18:09.241 | DEBUG    | __main__:trials:24 - Trial = 21244/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.242 | DEBUG    | __main__:trials:29 - Trial = 21244/30000 | Total reward = 36.71
2022-01-26 14:18:09.245 | DEBUG    | __main__:trials:24 - Trial = 21245/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.246 | DEBUG    | __main__:trials:29 - Trial = 21245/30000 | Total reward = 61.71
2022-01-26 14:18:09.249 | DEBUG    | __main__:trials:24 - Trial = 21246/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.249 | DEBUG    | __main__:trials:29 - Trial = 21246/30000 | Total reward = 56.49
2022-01-26 14:18:09.253 | DEBUG    | __main__:trials:24 - Trial = 21247/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.254 | DEBUG    | __main__:trials:29 - Trial = 21247/30000 | Total reward = 46.66
2022-01-26 14:18:09.257 | DEBUG    | __main__:trials:24 - Trial = 21248/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.259 | DEBUG    | __main__:trials:29 - Trial = 21248/30000 | Total reward = 48.71
2022-01-26 14:18:09.261 | DEBUG    | __main__:trials:24 - Trial = 21249/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.263 | DEBUG    | __main__:trials:29 - Trial = 21249/30000 | Total reward = 43.17
2022-01-26 14:18:09.267 | DEBUG    | __main__:trials:24 - Trial = 21250/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.268 | DEBUG    | __main__:trials:29 - Trial = 21250/30000 | Total reward = 57.13
2022-01-26 14:18:09.272 | DEBUG    | __main__:trials:24 - Trial = 21251/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.273 | DEBUG    | __main__:trials:29 - Trial = 21251/30000 | Total reward = 61.06
2022-01-26 14:18:09.277 | DEBUG    | __main__:trials:24 - Trial = 21252/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.278 | DEBUG    | __main__:trials:29 - Trial = 21252/30000 | Total reward = 51.50
2022-01-26 14:18:09.281 | DEBUG    | __main__:trials:24 - Trial = 21253/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.284 | DEBUG    | __main__:trials:29 - Trial = 21253/30000 | Total reward = 27.63
2022-01-26 14:18:09.287 | DEBUG    | __main__:trials:24 - Trial = 21254/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.289 | DEBUG    | __main__:trials:29 - Trial = 21254/30000 | Total reward = 51.46
2022-01-26 14:18:09.292 | DEBUG    | __main__:trials:24 - Trial = 21255/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.293 | DEBUG    | __main__:trials:29 - Trial = 21255/30000 | Total reward = 53.64
2022-01-26 14:18:09.297 | DEBUG    | __main__:trials:24 - Trial = 21256/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.299 | DEBUG    | __main__:trials:29 - Trial = 21256/30000 | Total reward = 56.15
2022-01-26 14:18:09.303 | DEBUG    | __main__:trials:24 - Trial = 21257/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.304 | DEBUG    | __main__:trials:29 - Trial = 21257/30000 | Total reward = 55.21
2022-01-26 14:18:09.308 | DEBUG    | __main__:trials:24 - Trial = 21258/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.309 | DEBUG    | __main__:trials:29 - Trial = 21258/30000 | Total reward = 53.23
2022-01-26 14:18:09.312 | DEBUG    | __main__:trials:24 - Trial = 21259/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.314 | DEBUG    | __main__:trials:29 - Trial = 21259/30000 | Total reward = 52.25
2022-01-26 14:18:09.317 | DEBUG    | __main__:trials:24 - Trial = 21260/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.319 | DEBUG    | __main__:trials:29 - Trial = 21260/30000 | Total reward = 38.10
2022-01-26 14:18:09.323 | DEBUG    | __main__:trials:24 - Trial = 21261/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.323 | DEBUG    | __main__:trials:29 - Trial = 21261/30000 | Total reward = 48.04
2022-01-26 14:18:09.328 | DEBUG    | __main__:trials:24 - Trial = 21262/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.328 | DEBUG    | __main__:trials:29 - Trial = 21262/30000 | Total reward = 42.56
2022-01-26 14:18:09.332 | DEBUG    | __main__:trials:24 - Trial = 21263/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.333 | DEBUG    | __main__:trials:29 - Trial = 21263/30000 | Total reward = 56.61
2022-01-26 14:18:09.336 | DEBUG    | __main__:trials:24 - Trial = 21264/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.338 | DEBUG    | __main__:trials:29 - Trial = 21264/30000 | Total reward = 47.29
2022-01-26 14:18:09.341 | DEBUG    | __main__:trials:24 - Trial = 21265/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.343 | DEBUG    | __main__:trials:29 - Trial = 21265/30000 | Total reward = 43.97
2022-01-26 14:18:09.346 | DEBUG    | __main__:trials:24 - Trial = 21266/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.347 | DEBUG    | __main__:trials:29 - Trial = 21266/30000 | Total reward = 46.17
2022-01-26 14:18:09.351 | DEBUG    | __main__:trials:24 - Trial = 21267/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.352 | DEBUG    | __main__:trials:29 - Trial = 21267/30000 | Total reward = 43.78
2022-01-26 14:18:09.356 | DEBUG    | __main__:trials:24 - Trial = 21268/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.358 | DEBUG    | __main__:trials:29 - Trial = 21268/30000 | Total reward = 47.94
2022-01-26 14:18:09.361 | DEBUG    | __main__:trials:24 - Trial = 21269/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.363 | DEBUG    | __main__:trials:29 - Trial = 21269/30000 | Total reward = 42.94
2022-01-26 14:18:09.366 | DEBUG    | __main__:trials:24 - Trial = 21270/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.368 | DEBUG    | __main__:trials:29 - Trial = 21270/30000 | Total reward = 29.92
2022-01-26 14:18:09.372 | DEBUG    | __main__:trials:24 - Trial = 21271/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.372 | DEBUG    | __main__:trials:29 - Trial = 21271/30000 | Total reward = 44.59
2022-01-26 14:18:09.377 | DEBUG    | __main__:trials:24 - Trial = 21272/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.378 | DEBUG    | __main__:trials:29 - Trial = 21272/30000 | Total reward = 35.46
2022-01-26 14:18:09.382 | DEBUG    | __main__:trials:24 - Trial = 21273/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.383 | DEBUG    | __main__:trials:29 - Trial = 21273/30000 | Total reward = 39.63
2022-01-26 14:18:09.387 | DEBUG    | __main__:trials:24 - Trial = 21274/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.388 | DEBUG    | __main__:trials:29 - Trial = 21274/30000 | Total reward = 39.53
2022-01-26 14:18:09.392 | DEBUG    | __main__:trials:24 - Trial = 21275/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.393 | DEBUG    | __main__:trials:29 - Trial = 21275/30000 | Total reward = 48.85
2022-01-26 14:18:09.397 | DEBUG    | __main__:trials:24 - Trial = 21276/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.398 | DEBUG    | __main__:trials:29 - Trial = 21276/30000 | Total reward = 23.57
2022-01-26 14:18:09.401 | DEBUG    | __main__:trials:24 - Trial = 21277/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.403 | DEBUG    | __main__:trials:29 - Trial = 21277/30000 | Total reward = 38.50
2022-01-26 14:18:09.406 | DEBUG    | __main__:trials:24 - Trial = 21278/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.408 | DEBUG    | __main__:trials:29 - Trial = 21278/30000 | Total reward = 39.95
2022-01-26 14:18:09.411 | DEBUG    | __main__:trials:24 - Trial = 21279/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.412 | DEBUG    | __main__:trials:29 - Trial = 21279/30000 | Total reward = 44.16
2022-01-26 14:18:09.416 | DEBUG    | __main__:trials:24 - Trial = 21280/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.417 | DEBUG    | __main__:trials:29 - Trial = 21280/30000 | Total reward = 35.35
2022-01-26 14:18:09.421 | DEBUG    | __main__:trials:24 - Trial = 21281/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.423 | DEBUG    | __main__:trials:29 - Trial = 21281/30000 | Total reward = 37.10
2022-01-26 14:18:09.426 | DEBUG    | __main__:trials:24 - Trial = 21282/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.428 | DEBUG    | __main__:trials:29 - Trial = 21282/30000 | Total reward = 45.11
2022-01-26 14:18:09.431 | DEBUG    | __main__:trials:24 - Trial = 21283/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.432 | DEBUG    | __main__:trials:29 - Trial = 21283/30000 | Total reward = 40.67
2022-01-26 14:18:09.436 | DEBUG    | __main__:trials:24 - Trial = 21284/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.437 | DEBUG    | __main__:trials:29 - Trial = 21284/30000 | Total reward = 33.89
2022-01-26 14:18:09.440 | DEBUG    | __main__:trials:24 - Trial = 21285/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.442 | DEBUG    | __main__:trials:29 - Trial = 21285/30000 | Total reward = 35.51
2022-01-26 14:18:09.446 | DEBUG    | __main__:trials:24 - Trial = 21286/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.447 | DEBUG    | __main__:trials:29 - Trial = 21286/30000 | Total reward = 34.71
2022-01-26 14:18:09.450 | DEBUG    | __main__:trials:26 - Trial = 21287/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.452 | DEBUG    | __main__:trials:29 - Trial = 21287/30000 | Total reward = 17.35
2022-01-26 14:18:09.455 | DEBUG    | __main__:trials:24 - Trial = 21288/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.457 | DEBUG    | __main__:trials:29 - Trial = 21288/30000 | Total reward = 38.87
2022-01-26 14:18:09.460 | DEBUG    | __main__:trials:24 - Trial = 21289/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.462 | DEBUG    | __main__:trials:29 - Trial = 21289/30000 | Total reward = 39.46
2022-01-26 14:18:09.466 | DEBUG    | __main__:trials:24 - Trial = 21290/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.467 | DEBUG    | __main__:trials:29 - Trial = 21290/30000 | Total reward = 29.11
2022-01-26 14:18:09.471 | DEBUG    | __main__:trials:24 - Trial = 21291/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.472 | DEBUG    | __main__:trials:29 - Trial = 21291/30000 | Total reward = 38.69
2022-01-26 14:18:09.476 | DEBUG    | __main__:trials:24 - Trial = 21292/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.477 | DEBUG    | __main__:trials:29 - Trial = 21292/30000 | Total reward = 26.30
2022-01-26 14:18:09.480 | DEBUG    | __main__:trials:24 - Trial = 21293/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.482 | DEBUG    | __main__:trials:29 - Trial = 21293/30000 | Total reward = 31.75
2022-01-26 14:18:09.485 | DEBUG    | __main__:trials:24 - Trial = 21294/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.486 | DEBUG    | __main__:trials:29 - Trial = 21294/30000 | Total reward = 33.12
2022-01-26 14:18:09.490 | DEBUG    | __main__:trials:24 - Trial = 21295/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.491 | DEBUG    | __main__:trials:29 - Trial = 21295/30000 | Total reward = 40.66
2022-01-26 14:18:09.495 | DEBUG    | __main__:trials:24 - Trial = 21296/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.496 | DEBUG    | __main__:trials:29 - Trial = 21296/30000 | Total reward = 35.76
2022-01-26 14:18:09.500 | DEBUG    | __main__:trials:24 - Trial = 21297/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.502 | DEBUG    | __main__:trials:29 - Trial = 21297/30000 | Total reward = 43.38
2022-01-26 14:18:09.505 | DEBUG    | __main__:trials:24 - Trial = 21298/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.507 | DEBUG    | __main__:trials:29 - Trial = 21298/30000 | Total reward = 34.23
2022-01-26 14:18:09.511 | DEBUG    | __main__:trials:24 - Trial = 21299/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.512 | DEBUG    | __main__:trials:29 - Trial = 21299/30000 | Total reward = 36.63
2022-01-26 14:18:09.516 | DEBUG    | __main__:trials:24 - Trial = 21300/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.516 | DEBUG    | __main__:trials:29 - Trial = 21300/30000 | Total reward = 33.67
2022-01-26 14:18:09.521 | DEBUG    | __main__:trials:24 - Trial = 21301/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.522 | DEBUG    | __main__:trials:29 - Trial = 21301/30000 | Total reward = 39.57
2022-01-26 14:18:09.525 | DEBUG    | __main__:trials:24 - Trial = 21302/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.527 | DEBUG    | __main__:trials:29 - Trial = 21302/30000 | Total reward = 40.77
2022-01-26 14:18:09.531 | DEBUG    | __main__:trials:24 - Trial = 21303/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.533 | DEBUG    | __main__:trials:29 - Trial = 21303/30000 | Total reward = 38.71
2022-01-26 14:18:09.536 | DEBUG    | __main__:trials:24 - Trial = 21304/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.537 | DEBUG    | __main__:trials:29 - Trial = 21304/30000 | Total reward = 33.57
2022-01-26 14:18:09.541 | DEBUG    | __main__:trials:24 - Trial = 21305/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.543 | DEBUG    | __main__:trials:29 - Trial = 21305/30000 | Total reward = 39.57
2022-01-26 14:18:09.547 | DEBUG    | __main__:trials:24 - Trial = 21306/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.547 | DEBUG    | __main__:trials:29 - Trial = 21306/30000 | Total reward = 36.93
2022-01-26 14:18:09.552 | DEBUG    | __main__:trials:24 - Trial = 21307/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.553 | DEBUG    | __main__:trials:29 - Trial = 21307/30000 | Total reward = 49.82
2022-01-26 14:18:09.556 | DEBUG    | __main__:trials:24 - Trial = 21308/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.558 | DEBUG    | __main__:trials:29 - Trial = 21308/30000 | Total reward = 38.21
2022-01-26 14:18:09.561 | DEBUG    | __main__:trials:24 - Trial = 21309/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.563 | DEBUG    | __main__:trials:29 - Trial = 21309/30000 | Total reward = 35.60
2022-01-26 14:18:09.566 | DEBUG    | __main__:trials:24 - Trial = 21310/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.567 | DEBUG    | __main__:trials:29 - Trial = 21310/30000 | Total reward = 35.94
2022-01-26 14:18:09.571 | DEBUG    | __main__:trials:24 - Trial = 21311/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.572 | DEBUG    | __main__:trials:29 - Trial = 21311/30000 | Total reward = 39.80
2022-01-26 14:18:09.576 | DEBUG    | __main__:trials:26 - Trial = 21312/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.577 | DEBUG    | __main__:trials:29 - Trial = 21312/30000 | Total reward = 27.11
2022-01-26 14:18:09.580 | DEBUG    | __main__:trials:24 - Trial = 21313/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.582 | DEBUG    | __main__:trials:29 - Trial = 21313/30000 | Total reward = 49.88
2022-01-26 14:18:09.585 | DEBUG    | __main__:trials:24 - Trial = 21314/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.585 | DEBUG    | __main__:trials:29 - Trial = 21314/30000 | Total reward = 37.14
2022-01-26 14:18:09.590 | DEBUG    | __main__:trials:26 - Trial = 21315/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.591 | DEBUG    | __main__:trials:29 - Trial = 21315/30000 | Total reward = 32.01
2022-01-26 14:18:09.595 | DEBUG    | __main__:trials:24 - Trial = 21316/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.596 | DEBUG    | __main__:trials:29 - Trial = 21316/30000 | Total reward = 30.91
2022-01-26 14:18:09.600 | DEBUG    | __main__:trials:24 - Trial = 21317/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.602 | DEBUG    | __main__:trials:29 - Trial = 21317/30000 | Total reward = 42.60
2022-01-26 14:18:09.605 | DEBUG    | __main__:trials:24 - Trial = 21318/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.606 | DEBUG    | __main__:trials:29 - Trial = 21318/30000 | Total reward = 35.53
2022-01-26 14:18:09.610 | DEBUG    | __main__:trials:24 - Trial = 21319/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.611 | DEBUG    | __main__:trials:29 - Trial = 21319/30000 | Total reward = 33.26
2022-01-26 14:18:09.615 | DEBUG    | __main__:trials:24 - Trial = 21320/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.617 | DEBUG    | __main__:trials:29 - Trial = 21320/30000 | Total reward = 41.54
2022-01-26 14:18:09.620 | DEBUG    | __main__:trials:24 - Trial = 21321/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.621 | DEBUG    | __main__:trials:29 - Trial = 21321/30000 | Total reward = 44.13
2022-01-26 14:18:09.624 | DEBUG    | __main__:trials:24 - Trial = 21322/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.626 | DEBUG    | __main__:trials:29 - Trial = 21322/30000 | Total reward = 47.59
2022-01-26 14:18:09.629 | DEBUG    | __main__:trials:26 - Trial = 21323/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.629 | DEBUG    | __main__:trials:29 - Trial = 21323/30000 | Total reward = 34.00
2022-01-26 14:18:09.634 | DEBUG    | __main__:trials:24 - Trial = 21324/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.636 | DEBUG    | __main__:trials:29 - Trial = 21324/30000 | Total reward = 46.01
2022-01-26 14:18:09.639 | DEBUG    | __main__:trials:24 - Trial = 21325/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.641 | DEBUG    | __main__:trials:29 - Trial = 21325/30000 | Total reward = 37.05
2022-01-26 14:18:09.645 | DEBUG    | __main__:trials:24 - Trial = 21326/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.645 | DEBUG    | __main__:trials:29 - Trial = 21326/30000 | Total reward = 40.89
2022-01-26 14:18:09.650 | DEBUG    | __main__:trials:24 - Trial = 21327/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.651 | DEBUG    | __main__:trials:29 - Trial = 21327/30000 | Total reward = 39.48
2022-01-26 14:18:09.655 | DEBUG    | __main__:trials:24 - Trial = 21328/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.656 | DEBUG    | __main__:trials:29 - Trial = 21328/30000 | Total reward = 33.19
2022-01-26 14:18:09.660 | DEBUG    | __main__:trials:26 - Trial = 21329/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.662 | DEBUG    | __main__:trials:29 - Trial = 21329/30000 | Total reward = 28.58
2022-01-26 14:18:09.664 | DEBUG    | __main__:trials:24 - Trial = 21330/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.666 | DEBUG    | __main__:trials:29 - Trial = 21330/30000 | Total reward = 41.29
2022-01-26 14:18:09.670 | DEBUG    | __main__:trials:24 - Trial = 21331/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.671 | DEBUG    | __main__:trials:29 - Trial = 21331/30000 | Total reward = 33.50
2022-01-26 14:18:09.674 | DEBUG    | __main__:trials:24 - Trial = 21332/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.676 | DEBUG    | __main__:trials:29 - Trial = 21332/30000 | Total reward = 33.03
2022-01-26 14:18:09.679 | DEBUG    | __main__:trials:24 - Trial = 21333/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.681 | DEBUG    | __main__:trials:29 - Trial = 21333/30000 | Total reward = 36.76
2022-01-26 14:18:09.684 | DEBUG    | __main__:trials:24 - Trial = 21334/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.685 | DEBUG    | __main__:trials:29 - Trial = 21334/30000 | Total reward = 38.76
2022-01-26 14:18:09.688 | DEBUG    | __main__:trials:24 - Trial = 21335/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.691 | DEBUG    | __main__:trials:29 - Trial = 21335/30000 | Total reward = 40.05
2022-01-26 14:18:09.693 | DEBUG    | __main__:trials:26 - Trial = 21336/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.694 | DEBUG    | __main__:trials:29 - Trial = 21336/30000 | Total reward = 22.86
2022-01-26 14:18:09.698 | DEBUG    | __main__:trials:24 - Trial = 21337/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.700 | DEBUG    | __main__:trials:29 - Trial = 21337/30000 | Total reward = 49.14
2022-01-26 14:18:09.703 | DEBUG    | __main__:trials:24 - Trial = 21338/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.705 | DEBUG    | __main__:trials:29 - Trial = 21338/30000 | Total reward = 39.57
2022-01-26 14:18:09.708 | DEBUG    | __main__:trials:24 - Trial = 21339/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.710 | DEBUG    | __main__:trials:29 - Trial = 21339/30000 | Total reward = 44.50
2022-01-26 14:18:09.715 | DEBUG    | __main__:trials:24 - Trial = 21340/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.717 | DEBUG    | __main__:trials:29 - Trial = 21340/30000 | Total reward = 41.25
2022-01-26 14:18:09.720 | DEBUG    | __main__:trials:24 - Trial = 21341/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.722 | DEBUG    | __main__:trials:29 - Trial = 21341/30000 | Total reward = 38.61
2022-01-26 14:18:09.725 | DEBUG    | __main__:trials:24 - Trial = 21342/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.727 | DEBUG    | __main__:trials:29 - Trial = 21342/30000 | Total reward = 36.18
2022-01-26 14:18:09.731 | DEBUG    | __main__:trials:24 - Trial = 21343/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.732 | DEBUG    | __main__:trials:29 - Trial = 21343/30000 | Total reward = 39.85
2022-01-26 14:18:09.736 | DEBUG    | __main__:trials:24 - Trial = 21344/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.737 | DEBUG    | __main__:trials:29 - Trial = 21344/30000 | Total reward = 39.61
2022-01-26 14:18:09.740 | DEBUG    | __main__:trials:24 - Trial = 21345/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.742 | DEBUG    | __main__:trials:29 - Trial = 21345/30000 | Total reward = 57.56
2022-01-26 14:18:09.746 | DEBUG    | __main__:trials:24 - Trial = 21346/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.747 | DEBUG    | __main__:trials:29 - Trial = 21346/30000 | Total reward = 34.55
2022-01-26 14:18:09.751 | DEBUG    | __main__:trials:24 - Trial = 21347/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.752 | DEBUG    | __main__:trials:29 - Trial = 21347/30000 | Total reward = 43.27
2022-01-26 14:18:09.756 | DEBUG    | __main__:trials:24 - Trial = 21348/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.757 | DEBUG    | __main__:trials:29 - Trial = 21348/30000 | Total reward = 42.15
2022-01-26 14:18:09.761 | DEBUG    | __main__:trials:24 - Trial = 21349/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.763 | DEBUG    | __main__:trials:29 - Trial = 21349/30000 | Total reward = 40.72
2022-01-26 14:18:09.766 | DEBUG    | __main__:trials:24 - Trial = 21350/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.768 | DEBUG    | __main__:trials:29 - Trial = 21350/30000 | Total reward = 39.57
2022-01-26 14:18:09.771 | DEBUG    | __main__:trials:26 - Trial = 21351/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.773 | DEBUG    | __main__:trials:29 - Trial = 21351/30000 | Total reward = 24.63
2022-01-26 14:18:09.776 | DEBUG    | __main__:trials:24 - Trial = 21352/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.777 | DEBUG    | __main__:trials:29 - Trial = 21352/30000 | Total reward = 42.67
2022-01-26 14:18:09.780 | DEBUG    | __main__:trials:24 - Trial = 21353/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.782 | DEBUG    | __main__:trials:29 - Trial = 21353/30000 | Total reward = 32.10
2022-01-26 14:18:09.785 | DEBUG    | __main__:trials:24 - Trial = 21354/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.786 | DEBUG    | __main__:trials:29 - Trial = 21354/30000 | Total reward = 33.99
2022-01-26 14:18:09.790 | DEBUG    | __main__:trials:26 - Trial = 21355/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.791 | DEBUG    | __main__:trials:29 - Trial = 21355/30000 | Total reward = 28.63
2022-01-26 14:18:09.795 | DEBUG    | __main__:trials:24 - Trial = 21356/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.796 | DEBUG    | __main__:trials:29 - Trial = 21356/30000 | Total reward = 33.21
2022-01-26 14:18:09.800 | DEBUG    | __main__:trials:24 - Trial = 21357/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.802 | DEBUG    | __main__:trials:29 - Trial = 21357/30000 | Total reward = 41.35
2022-01-26 14:18:09.806 | DEBUG    | __main__:trials:26 - Trial = 21358/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.807 | DEBUG    | __main__:trials:29 - Trial = 21358/30000 | Total reward = 27.35
2022-01-26 14:18:09.811 | DEBUG    | __main__:trials:24 - Trial = 21359/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.811 | DEBUG    | __main__:trials:29 - Trial = 21359/30000 | Total reward = 56.20
2022-01-26 14:18:09.816 | DEBUG    | __main__:trials:24 - Trial = 21360/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.818 | DEBUG    | __main__:trials:29 - Trial = 21360/30000 | Total reward = 36.71
2022-01-26 14:18:09.821 | DEBUG    | __main__:trials:24 - Trial = 21361/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.822 | DEBUG    | __main__:trials:29 - Trial = 21361/30000 | Total reward = 34.80
2022-01-26 14:18:09.827 | DEBUG    | __main__:trials:24 - Trial = 21362/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.828 | DEBUG    | __main__:trials:29 - Trial = 21362/30000 | Total reward = 38.97
2022-01-26 14:18:09.831 | DEBUG    | __main__:trials:26 - Trial = 21363/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.832 | DEBUG    | __main__:trials:29 - Trial = 21363/30000 | Total reward = 22.85
2022-01-26 14:18:09.835 | DEBUG    | __main__:trials:24 - Trial = 21364/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.837 | DEBUG    | __main__:trials:29 - Trial = 21364/30000 | Total reward = 54.95
2022-01-26 14:18:09.840 | DEBUG    | __main__:trials:24 - Trial = 21365/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.842 | DEBUG    | __main__:trials:29 - Trial = 21365/30000 | Total reward = 35.67
2022-01-26 14:18:09.845 | DEBUG    | __main__:trials:24 - Trial = 21366/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.847 | DEBUG    | __main__:trials:29 - Trial = 21366/30000 | Total reward = 35.50
2022-01-26 14:18:09.850 | DEBUG    | __main__:trials:24 - Trial = 21367/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.852 | DEBUG    | __main__:trials:29 - Trial = 21367/30000 | Total reward = 39.39
2022-01-26 14:18:09.855 | DEBUG    | __main__:trials:24 - Trial = 21368/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.856 | DEBUG    | __main__:trials:29 - Trial = 21368/30000 | Total reward = 48.91
2022-01-26 14:18:09.860 | DEBUG    | __main__:trials:24 - Trial = 21369/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.861 | DEBUG    | __main__:trials:29 - Trial = 21369/30000 | Total reward = 34.47
2022-01-26 14:18:09.865 | DEBUG    | __main__:trials:24 - Trial = 21370/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.867 | DEBUG    | __main__:trials:29 - Trial = 21370/30000 | Total reward = 39.57
2022-01-26 14:18:09.870 | DEBUG    | __main__:trials:24 - Trial = 21371/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.871 | DEBUG    | __main__:trials:29 - Trial = 21371/30000 | Total reward = 38.74
2022-01-26 14:18:09.875 | DEBUG    | __main__:trials:24 - Trial = 21372/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.877 | DEBUG    | __main__:trials:29 - Trial = 21372/30000 | Total reward = 44.65
2022-01-26 14:18:09.880 | DEBUG    | __main__:trials:24 - Trial = 21373/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.881 | DEBUG    | __main__:trials:29 - Trial = 21373/30000 | Total reward = 39.57
2022-01-26 14:18:09.885 | DEBUG    | __main__:trials:24 - Trial = 21374/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.887 | DEBUG    | __main__:trials:29 - Trial = 21374/30000 | Total reward = 33.10
2022-01-26 14:18:09.891 | DEBUG    | __main__:trials:26 - Trial = 21375/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:09.892 | DEBUG    | __main__:trials:29 - Trial = 21375/30000 | Total reward = 33.55
2022-01-26 14:18:09.896 | DEBUG    | __main__:trials:24 - Trial = 21376/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.897 | DEBUG    | __main__:trials:29 - Trial = 21376/30000 | Total reward = 42.67
2022-01-26 14:18:09.901 | DEBUG    | __main__:trials:24 - Trial = 21377/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.903 | DEBUG    | __main__:trials:29 - Trial = 21377/30000 | Total reward = 38.02
2022-01-26 14:18:09.906 | DEBUG    | __main__:trials:24 - Trial = 21378/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.907 | DEBUG    | __main__:trials:29 - Trial = 21378/30000 | Total reward = 37.95
2022-01-26 14:18:09.911 | DEBUG    | __main__:trials:24 - Trial = 21379/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.913 | DEBUG    | __main__:trials:29 - Trial = 21379/30000 | Total reward = 39.10
2022-01-26 14:18:09.916 | DEBUG    | __main__:trials:24 - Trial = 21380/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.917 | DEBUG    | __main__:trials:29 - Trial = 21380/30000 | Total reward = 42.60
2022-01-26 14:18:09.922 | DEBUG    | __main__:trials:24 - Trial = 21381/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.922 | DEBUG    | __main__:trials:29 - Trial = 21381/30000 | Total reward = 38.29
2022-01-26 14:18:09.926 | DEBUG    | __main__:trials:24 - Trial = 21382/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.928 | DEBUG    | __main__:trials:29 - Trial = 21382/30000 | Total reward = 42.34
2022-01-26 14:18:09.931 | DEBUG    | __main__:trials:24 - Trial = 21383/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.933 | DEBUG    | __main__:trials:29 - Trial = 21383/30000 | Total reward = 35.85
2022-01-26 14:18:09.936 | DEBUG    | __main__:trials:24 - Trial = 21384/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.937 | DEBUG    | __main__:trials:29 - Trial = 21384/30000 | Total reward = 34.45
2022-01-26 14:18:09.941 | DEBUG    | __main__:trials:24 - Trial = 21385/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.943 | DEBUG    | __main__:trials:29 - Trial = 21385/30000 | Total reward = 52.10
2022-01-26 14:18:09.946 | DEBUG    | __main__:trials:24 - Trial = 21386/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.948 | DEBUG    | __main__:trials:29 - Trial = 21386/30000 | Total reward = 37.13
2022-01-26 14:18:09.951 | DEBUG    | __main__:trials:24 - Trial = 21387/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.952 | DEBUG    | __main__:trials:29 - Trial = 21387/30000 | Total reward = 43.65
2022-01-26 14:18:09.955 | DEBUG    | __main__:trials:24 - Trial = 21388/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.957 | DEBUG    | __main__:trials:29 - Trial = 21388/30000 | Total reward = 35.82
2022-01-26 14:18:09.960 | DEBUG    | __main__:trials:24 - Trial = 21389/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.962 | DEBUG    | __main__:trials:29 - Trial = 21389/30000 | Total reward = 39.57
2022-01-26 14:18:09.965 | DEBUG    | __main__:trials:24 - Trial = 21390/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.967 | DEBUG    | __main__:trials:29 - Trial = 21390/30000 | Total reward = 36.85
2022-01-26 14:18:09.970 | DEBUG    | __main__:trials:24 - Trial = 21391/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.972 | DEBUG    | __main__:trials:29 - Trial = 21391/30000 | Total reward = 39.23
2022-01-26 14:18:09.976 | DEBUG    | __main__:trials:24 - Trial = 21392/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.976 | DEBUG    | __main__:trials:29 - Trial = 21392/30000 | Total reward = 35.57
2022-01-26 14:18:09.981 | DEBUG    | __main__:trials:24 - Trial = 21393/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.983 | DEBUG    | __main__:trials:29 - Trial = 21393/30000 | Total reward = 36.64
2022-01-26 14:18:09.986 | DEBUG    | __main__:trials:24 - Trial = 21394/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.987 | DEBUG    | __main__:trials:29 - Trial = 21394/30000 | Total reward = 52.98
2022-01-26 14:18:09.991 | DEBUG    | __main__:trials:24 - Trial = 21395/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.992 | DEBUG    | __main__:trials:29 - Trial = 21395/30000 | Total reward = 34.01
2022-01-26 14:18:09.996 | DEBUG    | __main__:trials:24 - Trial = 21396/30000 | Max number of steps (20) reached
2022-01-26 14:18:09.997 | DEBUG    | __main__:trials:29 - Trial = 21396/30000 | Total reward = 39.03
2022-01-26 14:18:10.000 | DEBUG    | __main__:trials:24 - Trial = 21397/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.002 | DEBUG    | __main__:trials:29 - Trial = 21397/30000 | Total reward = 37.01
2022-01-26 14:18:10.005 | DEBUG    | __main__:trials:24 - Trial = 21398/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.006 | DEBUG    | __main__:trials:29 - Trial = 21398/30000 | Total reward = 39.57
2022-01-26 14:18:10.011 | DEBUG    | __main__:trials:24 - Trial = 21399/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.012 | DEBUG    | __main__:trials:29 - Trial = 21399/30000 | Total reward = 46.20
2022-01-26 14:18:10.016 | DEBUG    | __main__:trials:24 - Trial = 21400/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.017 | DEBUG    | __main__:trials:29 - Trial = 21400/30000 | Total reward = 39.57
2022-01-26 14:18:10.021 | DEBUG    | __main__:trials:24 - Trial = 21401/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.022 | DEBUG    | __main__:trials:29 - Trial = 21401/30000 | Total reward = 38.20
2022-01-26 14:18:10.026 | DEBUG    | __main__:trials:24 - Trial = 21402/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.027 | DEBUG    | __main__:trials:29 - Trial = 21402/30000 | Total reward = 48.09
2022-01-26 14:18:10.030 | DEBUG    | __main__:trials:24 - Trial = 21403/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.032 | DEBUG    | __main__:trials:29 - Trial = 21403/30000 | Total reward = 33.91
2022-01-26 14:18:10.036 | DEBUG    | __main__:trials:24 - Trial = 21404/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.036 | DEBUG    | __main__:trials:29 - Trial = 21404/30000 | Total reward = 40.29
2022-01-26 14:18:10.040 | DEBUG    | __main__:trials:24 - Trial = 21405/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.042 | DEBUG    | __main__:trials:29 - Trial = 21405/30000 | Total reward = 47.82
2022-01-26 14:18:10.046 | DEBUG    | __main__:trials:24 - Trial = 21406/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.047 | DEBUG    | __main__:trials:29 - Trial = 21406/30000 | Total reward = 32.63
2022-01-26 14:18:10.050 | DEBUG    | __main__:trials:24 - Trial = 21407/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.052 | DEBUG    | __main__:trials:29 - Trial = 21407/30000 | Total reward = 37.08
2022-01-26 14:18:10.055 | DEBUG    | __main__:trials:24 - Trial = 21408/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.057 | DEBUG    | __main__:trials:29 - Trial = 21408/30000 | Total reward = 43.81
2022-01-26 14:18:10.060 | DEBUG    | __main__:trials:24 - Trial = 21409/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.061 | DEBUG    | __main__:trials:29 - Trial = 21409/30000 | Total reward = 57.27
2022-01-26 14:18:10.066 | DEBUG    | __main__:trials:24 - Trial = 21410/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.066 | DEBUG    | __main__:trials:29 - Trial = 21410/30000 | Total reward = 41.78
2022-01-26 14:18:10.071 | DEBUG    | __main__:trials:24 - Trial = 21411/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.072 | DEBUG    | __main__:trials:29 - Trial = 21411/30000 | Total reward = 37.25
2022-01-26 14:18:10.075 | DEBUG    | __main__:trials:26 - Trial = 21412/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:10.076 | DEBUG    | __main__:trials:29 - Trial = 21412/30000 | Total reward = 26.15
2022-01-26 14:18:10.080 | DEBUG    | __main__:trials:24 - Trial = 21413/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.081 | DEBUG    | __main__:trials:29 - Trial = 21413/30000 | Total reward = 52.65
2022-01-26 14:18:10.084 | DEBUG    | __main__:trials:24 - Trial = 21414/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.085 | DEBUG    | __main__:trials:29 - Trial = 21414/30000 | Total reward = 48.21
2022-01-26 14:18:10.089 | DEBUG    | __main__:trials:24 - Trial = 21415/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.090 | DEBUG    | __main__:trials:29 - Trial = 21415/30000 | Total reward = 51.87
2022-01-26 14:18:10.094 | DEBUG    | __main__:trials:24 - Trial = 21416/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.096 | DEBUG    | __main__:trials:29 - Trial = 21416/30000 | Total reward = 53.23
2022-01-26 14:18:10.098 | DEBUG    | __main__:trials:24 - Trial = 21417/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.100 | DEBUG    | __main__:trials:29 - Trial = 21417/30000 | Total reward = 55.45
2022-01-26 14:18:10.103 | DEBUG    | __main__:trials:24 - Trial = 21418/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.104 | DEBUG    | __main__:trials:29 - Trial = 21418/30000 | Total reward = 49.38
2022-01-26 14:18:10.108 | DEBUG    | __main__:trials:24 - Trial = 21419/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.109 | DEBUG    | __main__:trials:29 - Trial = 21419/30000 | Total reward = 40.72
2022-01-26 14:18:10.112 | DEBUG    | __main__:trials:24 - Trial = 21420/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.114 | DEBUG    | __main__:trials:29 - Trial = 21420/30000 | Total reward = 53.40
2022-01-26 14:18:10.118 | DEBUG    | __main__:trials:24 - Trial = 21421/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.118 | DEBUG    | __main__:trials:29 - Trial = 21421/30000 | Total reward = 57.64
2022-01-26 14:18:10.122 | DEBUG    | __main__:trials:24 - Trial = 21422/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.124 | DEBUG    | __main__:trials:29 - Trial = 21422/30000 | Total reward = 53.12
2022-01-26 14:18:10.127 | DEBUG    | __main__:trials:24 - Trial = 21423/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.129 | DEBUG    | __main__:trials:29 - Trial = 21423/30000 | Total reward = 28.77
2022-01-26 14:18:10.132 | DEBUG    | __main__:trials:24 - Trial = 21424/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.133 | DEBUG    | __main__:trials:29 - Trial = 21424/30000 | Total reward = 47.27
2022-01-26 14:18:10.138 | DEBUG    | __main__:trials:24 - Trial = 21425/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.139 | DEBUG    | __main__:trials:29 - Trial = 21425/30000 | Total reward = 52.70
2022-01-26 14:18:10.143 | DEBUG    | __main__:trials:24 - Trial = 21426/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.145 | DEBUG    | __main__:trials:29 - Trial = 21426/30000 | Total reward = 53.99
2022-01-26 14:18:10.148 | DEBUG    | __main__:trials:24 - Trial = 21427/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.149 | DEBUG    | __main__:trials:29 - Trial = 21427/30000 | Total reward = 44.47
2022-01-26 14:18:10.154 | DEBUG    | __main__:trials:24 - Trial = 21428/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.155 | DEBUG    | __main__:trials:29 - Trial = 21428/30000 | Total reward = 45.66
2022-01-26 14:18:10.159 | DEBUG    | __main__:trials:24 - Trial = 21429/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.160 | DEBUG    | __main__:trials:29 - Trial = 21429/30000 | Total reward = 48.75
2022-01-26 14:18:10.164 | DEBUG    | __main__:trials:24 - Trial = 21430/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.165 | DEBUG    | __main__:trials:29 - Trial = 21430/30000 | Total reward = 63.74
2022-01-26 14:18:10.170 | DEBUG    | __main__:trials:24 - Trial = 21431/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.171 | DEBUG    | __main__:trials:29 - Trial = 21431/30000 | Total reward = 39.98
2022-01-26 14:18:10.175 | DEBUG    | __main__:trials:24 - Trial = 21432/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.176 | DEBUG    | __main__:trials:29 - Trial = 21432/30000 | Total reward = 52.76
2022-01-26 14:18:10.181 | DEBUG    | __main__:trials:24 - Trial = 21433/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.181 | DEBUG    | __main__:trials:29 - Trial = 21433/30000 | Total reward = 52.59
2022-01-26 14:18:10.185 | DEBUG    | __main__:trials:24 - Trial = 21434/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.187 | DEBUG    | __main__:trials:29 - Trial = 21434/30000 | Total reward = 26.31
2022-01-26 14:18:10.190 | DEBUG    | __main__:trials:24 - Trial = 21435/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.192 | DEBUG    | __main__:trials:29 - Trial = 21435/30000 | Total reward = 61.00
2022-01-26 14:18:10.195 | DEBUG    | __main__:trials:24 - Trial = 21436/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.197 | DEBUG    | __main__:trials:29 - Trial = 21436/30000 | Total reward = 58.48
2022-01-26 14:18:10.200 | DEBUG    | __main__:trials:24 - Trial = 21437/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.202 | DEBUG    | __main__:trials:29 - Trial = 21437/30000 | Total reward = 32.96
2022-01-26 14:18:10.205 | DEBUG    | __main__:trials:24 - Trial = 21438/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.206 | DEBUG    | __main__:trials:29 - Trial = 21438/30000 | Total reward = 48.70
2022-01-26 14:18:10.209 | DEBUG    | __main__:trials:24 - Trial = 21439/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.211 | DEBUG    | __main__:trials:29 - Trial = 21439/30000 | Total reward = 59.33
2022-01-26 14:18:10.214 | DEBUG    | __main__:trials:24 - Trial = 21440/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.216 | DEBUG    | __main__:trials:29 - Trial = 21440/30000 | Total reward = 56.95
2022-01-26 14:18:10.219 | DEBUG    | __main__:trials:24 - Trial = 21441/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.221 | DEBUG    | __main__:trials:29 - Trial = 21441/30000 | Total reward = 44.65
2022-01-26 14:18:10.224 | DEBUG    | __main__:trials:24 - Trial = 21442/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.226 | DEBUG    | __main__:trials:29 - Trial = 21442/30000 | Total reward = 53.23
2022-01-26 14:18:10.230 | DEBUG    | __main__:trials:24 - Trial = 21443/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.231 | DEBUG    | __main__:trials:29 - Trial = 21443/30000 | Total reward = 33.48
2022-01-26 14:18:10.235 | DEBUG    | __main__:trials:24 - Trial = 21444/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.236 | DEBUG    | __main__:trials:29 - Trial = 21444/30000 | Total reward = 42.50
2022-01-26 14:18:10.240 | DEBUG    | __main__:trials:24 - Trial = 21445/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.242 | DEBUG    | __main__:trials:29 - Trial = 21445/30000 | Total reward = 36.79
2022-01-26 14:18:10.245 | DEBUG    | __main__:trials:24 - Trial = 21446/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.247 | DEBUG    | __main__:trials:29 - Trial = 21446/30000 | Total reward = 55.27
2022-01-26 14:18:10.251 | DEBUG    | __main__:trials:24 - Trial = 21447/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.251 | DEBUG    | __main__:trials:29 - Trial = 21447/30000 | Total reward = 53.23
2022-01-26 14:18:10.256 | DEBUG    | __main__:trials:24 - Trial = 21448/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.257 | DEBUG    | __main__:trials:29 - Trial = 21448/30000 | Total reward = 43.04
2022-01-26 14:18:10.261 | DEBUG    | __main__:trials:24 - Trial = 21449/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.261 | DEBUG    | __main__:trials:29 - Trial = 21449/30000 | Total reward = 56.24
2022-01-26 14:18:10.266 | DEBUG    | __main__:trials:24 - Trial = 21450/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.267 | DEBUG    | __main__:trials:29 - Trial = 21450/30000 | Total reward = 52.85
2022-01-26 14:18:10.271 | DEBUG    | __main__:trials:24 - Trial = 21451/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.273 | DEBUG    | __main__:trials:29 - Trial = 21451/30000 | Total reward = 52.22
2022-01-26 14:18:10.276 | DEBUG    | __main__:trials:24 - Trial = 21452/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.277 | DEBUG    | __main__:trials:29 - Trial = 21452/30000 | Total reward = 49.63
2022-01-26 14:18:10.280 | DEBUG    | __main__:trials:24 - Trial = 21453/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.282 | DEBUG    | __main__:trials:29 - Trial = 21453/30000 | Total reward = 52.64
2022-01-26 14:18:10.285 | DEBUG    | __main__:trials:24 - Trial = 21454/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.286 | DEBUG    | __main__:trials:29 - Trial = 21454/30000 | Total reward = 36.05
2022-01-26 14:18:10.290 | DEBUG    | __main__:trials:24 - Trial = 21455/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.292 | DEBUG    | __main__:trials:29 - Trial = 21455/30000 | Total reward = 50.68
2022-01-26 14:18:10.294 | DEBUG    | __main__:trials:24 - Trial = 21456/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.296 | DEBUG    | __main__:trials:29 - Trial = 21456/30000 | Total reward = 54.24
2022-01-26 14:18:10.300 | DEBUG    | __main__:trials:24 - Trial = 21457/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.301 | DEBUG    | __main__:trials:29 - Trial = 21457/30000 | Total reward = 53.23
2022-01-26 14:18:10.305 | DEBUG    | __main__:trials:24 - Trial = 21458/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.305 | DEBUG    | __main__:trials:29 - Trial = 21458/30000 | Total reward = 60.45
2022-01-26 14:18:10.309 | DEBUG    | __main__:trials:24 - Trial = 21459/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.310 | DEBUG    | __main__:trials:29 - Trial = 21459/30000 | Total reward = 53.98
2022-01-26 14:18:10.314 | DEBUG    | __main__:trials:24 - Trial = 21460/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.316 | DEBUG    | __main__:trials:29 - Trial = 21460/30000 | Total reward = 39.49
2022-01-26 14:18:10.319 | DEBUG    | __main__:trials:24 - Trial = 21461/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.321 | DEBUG    | __main__:trials:29 - Trial = 21461/30000 | Total reward = 34.82
2022-01-26 14:18:10.324 | DEBUG    | __main__:trials:24 - Trial = 21462/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.325 | DEBUG    | __main__:trials:29 - Trial = 21462/30000 | Total reward = 38.69
2022-01-26 14:18:10.329 | DEBUG    | __main__:trials:24 - Trial = 21463/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.330 | DEBUG    | __main__:trials:29 - Trial = 21463/30000 | Total reward = 56.62
2022-01-26 14:18:10.334 | DEBUG    | __main__:trials:24 - Trial = 21464/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.335 | DEBUG    | __main__:trials:29 - Trial = 21464/30000 | Total reward = 40.43
2022-01-26 14:18:10.339 | DEBUG    | __main__:trials:24 - Trial = 21465/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.340 | DEBUG    | __main__:trials:29 - Trial = 21465/30000 | Total reward = 30.02
2022-01-26 14:18:10.345 | DEBUG    | __main__:trials:24 - Trial = 21466/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.346 | DEBUG    | __main__:trials:29 - Trial = 21466/30000 | Total reward = 38.69
2022-01-26 14:18:10.350 | DEBUG    | __main__:trials:24 - Trial = 21467/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.350 | DEBUG    | __main__:trials:29 - Trial = 21467/30000 | Total reward = 29.78
2022-01-26 14:18:10.355 | DEBUG    | __main__:trials:24 - Trial = 21468/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.356 | DEBUG    | __main__:trials:29 - Trial = 21468/30000 | Total reward = 42.03
2022-01-26 14:18:10.360 | DEBUG    | __main__:trials:24 - Trial = 21469/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.362 | DEBUG    | __main__:trials:29 - Trial = 21469/30000 | Total reward = 38.05
2022-01-26 14:18:10.365 | DEBUG    | __main__:trials:24 - Trial = 21470/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.367 | DEBUG    | __main__:trials:29 - Trial = 21470/30000 | Total reward = 32.41
2022-01-26 14:18:10.371 | DEBUG    | __main__:trials:24 - Trial = 21471/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.371 | DEBUG    | __main__:trials:29 - Trial = 21471/30000 | Total reward = 50.56
2022-01-26 14:18:10.376 | DEBUG    | __main__:trials:24 - Trial = 21472/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.377 | DEBUG    | __main__:trials:29 - Trial = 21472/30000 | Total reward = 51.22
2022-01-26 14:18:10.380 | DEBUG    | __main__:trials:24 - Trial = 21473/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.382 | DEBUG    | __main__:trials:29 - Trial = 21473/30000 | Total reward = 63.58
2022-01-26 14:18:10.386 | DEBUG    | __main__:trials:24 - Trial = 21474/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.386 | DEBUG    | __main__:trials:29 - Trial = 21474/30000 | Total reward = 53.32
2022-01-26 14:18:10.391 | DEBUG    | __main__:trials:24 - Trial = 21475/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.392 | DEBUG    | __main__:trials:29 - Trial = 21475/30000 | Total reward = 40.27
2022-01-26 14:18:10.397 | DEBUG    | __main__:trials:24 - Trial = 21476/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.398 | DEBUG    | __main__:trials:29 - Trial = 21476/30000 | Total reward = 40.05
2022-01-26 14:18:10.401 | DEBUG    | __main__:trials:24 - Trial = 21477/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.403 | DEBUG    | __main__:trials:29 - Trial = 21477/30000 | Total reward = 57.39
2022-01-26 14:18:10.407 | DEBUG    | __main__:trials:24 - Trial = 21478/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.409 | DEBUG    | __main__:trials:29 - Trial = 21478/30000 | Total reward = 36.28
2022-01-26 14:18:10.412 | DEBUG    | __main__:trials:24 - Trial = 21479/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.413 | DEBUG    | __main__:trials:29 - Trial = 21479/30000 | Total reward = 43.41
2022-01-26 14:18:10.418 | DEBUG    | __main__:trials:24 - Trial = 21480/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.418 | DEBUG    | __main__:trials:29 - Trial = 21480/30000 | Total reward = 30.89
2022-01-26 14:18:10.423 | DEBUG    | __main__:trials:24 - Trial = 21481/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.425 | DEBUG    | __main__:trials:29 - Trial = 21481/30000 | Total reward = 37.27
2022-01-26 14:18:10.428 | DEBUG    | __main__:trials:24 - Trial = 21482/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.429 | DEBUG    | __main__:trials:29 - Trial = 21482/30000 | Total reward = 45.52
2022-01-26 14:18:10.434 | DEBUG    | __main__:trials:24 - Trial = 21483/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.434 | DEBUG    | __main__:trials:29 - Trial = 21483/30000 | Total reward = 39.80
2022-01-26 14:18:10.439 | DEBUG    | __main__:trials:24 - Trial = 21484/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.441 | DEBUG    | __main__:trials:29 - Trial = 21484/30000 | Total reward = 32.08
2022-01-26 14:18:10.444 | DEBUG    | __main__:trials:24 - Trial = 21485/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.446 | DEBUG    | __main__:trials:29 - Trial = 21485/30000 | Total reward = 39.27
2022-01-26 14:18:10.449 | DEBUG    | __main__:trials:24 - Trial = 21486/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.450 | DEBUG    | __main__:trials:29 - Trial = 21486/30000 | Total reward = 42.56
2022-01-26 14:18:10.803 | DEBUG    | __main__:trials:24 - Trial = 21487/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.806 | DEBUG    | __main__:trials:29 - Trial = 21487/30000 | Total reward = 36.41
2022-01-26 14:18:10.810 | DEBUG    | __main__:trials:24 - Trial = 21488/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.812 | DEBUG    | __main__:trials:29 - Trial = 21488/30000 | Total reward = 36.42
2022-01-26 14:18:10.816 | DEBUG    | __main__:trials:24 - Trial = 21489/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.816 | DEBUG    | __main__:trials:29 - Trial = 21489/30000 | Total reward = 44.48
2022-01-26 14:18:10.820 | DEBUG    | __main__:trials:24 - Trial = 21490/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.821 | DEBUG    | __main__:trials:29 - Trial = 21490/30000 | Total reward = 50.75
2022-01-26 14:18:10.826 | DEBUG    | __main__:trials:24 - Trial = 21491/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.827 | DEBUG    | __main__:trials:29 - Trial = 21491/30000 | Total reward = 31.51
2022-01-26 14:18:10.831 | DEBUG    | __main__:trials:24 - Trial = 21492/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.832 | DEBUG    | __main__:trials:29 - Trial = 21492/30000 | Total reward = 36.93
2022-01-26 14:18:10.836 | DEBUG    | __main__:trials:24 - Trial = 21493/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.838 | DEBUG    | __main__:trials:29 - Trial = 21493/30000 | Total reward = 39.80
2022-01-26 14:18:10.842 | DEBUG    | __main__:trials:24 - Trial = 21494/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.843 | DEBUG    | __main__:trials:29 - Trial = 21494/30000 | Total reward = 47.43
2022-01-26 14:18:10.847 | DEBUG    | __main__:trials:24 - Trial = 21495/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.848 | DEBUG    | __main__:trials:29 - Trial = 21495/30000 | Total reward = 52.56
2022-01-26 14:18:10.852 | DEBUG    | __main__:trials:24 - Trial = 21496/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.853 | DEBUG    | __main__:trials:29 - Trial = 21496/30000 | Total reward = 46.44
2022-01-26 14:18:10.856 | DEBUG    | __main__:trials:24 - Trial = 21497/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.857 | DEBUG    | __main__:trials:29 - Trial = 21497/30000 | Total reward = 39.64
2022-01-26 14:18:10.861 | DEBUG    | __main__:trials:24 - Trial = 21498/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.861 | DEBUG    | __main__:trials:29 - Trial = 21498/30000 | Total reward = 34.22
2022-01-26 14:18:10.865 | DEBUG    | __main__:trials:24 - Trial = 21499/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.866 | DEBUG    | __main__:trials:29 - Trial = 21499/30000 | Total reward = 38.92
2022-01-26 14:18:10.870 | DEBUG    | __main__:trials:26 - Trial = 21500/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:10.870 | DEBUG    | __main__:trials:29 - Trial = 21500/30000 | Total reward = 26.27
2022-01-26 14:18:10.875 | DEBUG    | __main__:trials:24 - Trial = 21501/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.877 | DEBUG    | __main__:trials:29 - Trial = 21501/30000 | Total reward = 47.77
2022-01-26 14:18:10.880 | DEBUG    | __main__:trials:24 - Trial = 21502/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.882 | DEBUG    | __main__:trials:29 - Trial = 21502/30000 | Total reward = 34.14
2022-01-26 14:18:10.886 | DEBUG    | __main__:trials:24 - Trial = 21503/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.887 | DEBUG    | __main__:trials:29 - Trial = 21503/30000 | Total reward = 52.95
2022-01-26 14:18:10.890 | DEBUG    | __main__:trials:24 - Trial = 21504/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.892 | DEBUG    | __main__:trials:29 - Trial = 21504/30000 | Total reward = 39.57
2022-01-26 14:18:10.895 | DEBUG    | __main__:trials:24 - Trial = 21505/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.897 | DEBUG    | __main__:trials:29 - Trial = 21505/30000 | Total reward = 52.21
2022-01-26 14:18:10.901 | DEBUG    | __main__:trials:26 - Trial = 21506/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:10.902 | DEBUG    | __main__:trials:29 - Trial = 21506/30000 | Total reward = 31.66
2022-01-26 14:18:10.907 | DEBUG    | __main__:trials:24 - Trial = 21507/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.908 | DEBUG    | __main__:trials:29 - Trial = 21507/30000 | Total reward = 53.16
2022-01-26 14:18:10.912 | DEBUG    | __main__:trials:24 - Trial = 21508/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.913 | DEBUG    | __main__:trials:29 - Trial = 21508/30000 | Total reward = 54.39
2022-01-26 14:18:10.916 | DEBUG    | __main__:trials:24 - Trial = 21509/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.918 | DEBUG    | __main__:trials:29 - Trial = 21509/30000 | Total reward = 40.29
2022-01-26 14:18:10.921 | DEBUG    | __main__:trials:24 - Trial = 21510/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.922 | DEBUG    | __main__:trials:29 - Trial = 21510/30000 | Total reward = 38.47
2022-01-26 14:18:10.925 | DEBUG    | __main__:trials:24 - Trial = 21511/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.926 | DEBUG    | __main__:trials:29 - Trial = 21511/30000 | Total reward = 36.84
2022-01-26 14:18:10.929 | DEBUG    | __main__:trials:24 - Trial = 21512/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.930 | DEBUG    | __main__:trials:29 - Trial = 21512/30000 | Total reward = 41.99
2022-01-26 14:18:10.934 | DEBUG    | __main__:trials:24 - Trial = 21513/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.935 | DEBUG    | __main__:trials:29 - Trial = 21513/30000 | Total reward = 38.16
2022-01-26 14:18:10.939 | DEBUG    | __main__:trials:24 - Trial = 21514/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.940 | DEBUG    | __main__:trials:29 - Trial = 21514/30000 | Total reward = 50.08
2022-01-26 14:18:10.944 | DEBUG    | __main__:trials:24 - Trial = 21515/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.945 | DEBUG    | __main__:trials:29 - Trial = 21515/30000 | Total reward = 56.57
2022-01-26 14:18:10.949 | DEBUG    | __main__:trials:24 - Trial = 21516/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.950 | DEBUG    | __main__:trials:29 - Trial = 21516/30000 | Total reward = 41.24
2022-01-26 14:18:10.954 | DEBUG    | __main__:trials:24 - Trial = 21517/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.955 | DEBUG    | __main__:trials:29 - Trial = 21517/30000 | Total reward = 50.50
2022-01-26 14:18:10.959 | DEBUG    | __main__:trials:24 - Trial = 21518/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.960 | DEBUG    | __main__:trials:29 - Trial = 21518/30000 | Total reward = 33.44
2022-01-26 14:18:10.965 | DEBUG    | __main__:trials:24 - Trial = 21519/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.965 | DEBUG    | __main__:trials:29 - Trial = 21519/30000 | Total reward = 40.09
2022-01-26 14:18:10.968 | DEBUG    | __main__:trials:24 - Trial = 21520/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.969 | DEBUG    | __main__:trials:29 - Trial = 21520/30000 | Total reward = 32.23
2022-01-26 14:18:10.973 | DEBUG    | __main__:trials:24 - Trial = 21521/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.974 | DEBUG    | __main__:trials:29 - Trial = 21521/30000 | Total reward = 25.86
2022-01-26 14:18:10.977 | DEBUG    | __main__:trials:24 - Trial = 21522/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.979 | DEBUG    | __main__:trials:29 - Trial = 21522/30000 | Total reward = 38.35
2022-01-26 14:18:10.981 | DEBUG    | __main__:trials:24 - Trial = 21523/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.983 | DEBUG    | __main__:trials:29 - Trial = 21523/30000 | Total reward = 50.26
2022-01-26 14:18:10.986 | DEBUG    | __main__:trials:24 - Trial = 21524/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.987 | DEBUG    | __main__:trials:29 - Trial = 21524/30000 | Total reward = 39.89
2022-01-26 14:18:10.991 | DEBUG    | __main__:trials:26 - Trial = 21525/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:10.993 | DEBUG    | __main__:trials:29 - Trial = 21525/30000 | Total reward = 28.97
2022-01-26 14:18:10.996 | DEBUG    | __main__:trials:24 - Trial = 21526/30000 | Max number of steps (20) reached
2022-01-26 14:18:10.998 | DEBUG    | __main__:trials:29 - Trial = 21526/30000 | Total reward = 47.46
2022-01-26 14:18:11.001 | DEBUG    | __main__:trials:24 - Trial = 21527/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.003 | DEBUG    | __main__:trials:29 - Trial = 21527/30000 | Total reward = 23.79
2022-01-26 14:18:11.007 | DEBUG    | __main__:trials:24 - Trial = 21528/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.008 | DEBUG    | __main__:trials:29 - Trial = 21528/30000 | Total reward = 40.20
2022-01-26 14:18:11.012 | DEBUG    | __main__:trials:24 - Trial = 21529/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.014 | DEBUG    | __main__:trials:29 - Trial = 21529/30000 | Total reward = 38.23
2022-01-26 14:18:11.017 | DEBUG    | __main__:trials:24 - Trial = 21530/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.018 | DEBUG    | __main__:trials:29 - Trial = 21530/30000 | Total reward = 46.76
2022-01-26 14:18:11.022 | DEBUG    | __main__:trials:24 - Trial = 21531/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.023 | DEBUG    | __main__:trials:29 - Trial = 21531/30000 | Total reward = 27.15
2022-01-26 14:18:11.027 | DEBUG    | __main__:trials:24 - Trial = 21532/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.028 | DEBUG    | __main__:trials:29 - Trial = 21532/30000 | Total reward = 47.19
2022-01-26 14:18:11.032 | DEBUG    | __main__:trials:24 - Trial = 21533/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.033 | DEBUG    | __main__:trials:29 - Trial = 21533/30000 | Total reward = 48.77
2022-01-26 14:18:11.037 | DEBUG    | __main__:trials:24 - Trial = 21534/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.039 | DEBUG    | __main__:trials:29 - Trial = 21534/30000 | Total reward = 36.51
2022-01-26 14:18:11.042 | DEBUG    | __main__:trials:24 - Trial = 21535/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.043 | DEBUG    | __main__:trials:29 - Trial = 21535/30000 | Total reward = 55.33
2022-01-26 14:18:11.047 | DEBUG    | __main__:trials:24 - Trial = 21536/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.048 | DEBUG    | __main__:trials:29 - Trial = 21536/30000 | Total reward = 34.51
2022-01-26 14:18:11.052 | DEBUG    | __main__:trials:24 - Trial = 21537/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.053 | DEBUG    | __main__:trials:29 - Trial = 21537/30000 | Total reward = 41.50
2022-01-26 14:18:11.057 | DEBUG    | __main__:trials:26 - Trial = 21538/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.059 | DEBUG    | __main__:trials:29 - Trial = 21538/30000 | Total reward = 24.57
2022-01-26 14:18:11.063 | DEBUG    | __main__:trials:24 - Trial = 21539/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.065 | DEBUG    | __main__:trials:29 - Trial = 21539/30000 | Total reward = 52.84
2022-01-26 14:18:11.069 | DEBUG    | __main__:trials:24 - Trial = 21540/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.071 | DEBUG    | __main__:trials:29 - Trial = 21540/30000 | Total reward = 42.69
2022-01-26 14:18:11.075 | DEBUG    | __main__:trials:24 - Trial = 21541/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.076 | DEBUG    | __main__:trials:29 - Trial = 21541/30000 | Total reward = 34.73
2022-01-26 14:18:11.080 | DEBUG    | __main__:trials:24 - Trial = 21542/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.081 | DEBUG    | __main__:trials:29 - Trial = 21542/30000 | Total reward = 28.58
2022-01-26 14:18:11.085 | DEBUG    | __main__:trials:26 - Trial = 21543/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.086 | DEBUG    | __main__:trials:29 - Trial = 21543/30000 | Total reward = 15.84
2022-01-26 14:18:11.091 | DEBUG    | __main__:trials:24 - Trial = 21544/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.092 | DEBUG    | __main__:trials:29 - Trial = 21544/30000 | Total reward = 51.04
2022-01-26 14:18:11.096 | DEBUG    | __main__:trials:24 - Trial = 21545/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.097 | DEBUG    | __main__:trials:29 - Trial = 21545/30000 | Total reward = 38.01
2022-01-26 14:18:11.101 | DEBUG    | __main__:trials:24 - Trial = 21546/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.103 | DEBUG    | __main__:trials:29 - Trial = 21546/30000 | Total reward = 33.94
2022-01-26 14:18:11.106 | DEBUG    | __main__:trials:24 - Trial = 21547/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.107 | DEBUG    | __main__:trials:29 - Trial = 21547/30000 | Total reward = 39.11
2022-01-26 14:18:11.111 | DEBUG    | __main__:trials:24 - Trial = 21548/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.112 | DEBUG    | __main__:trials:29 - Trial = 21548/30000 | Total reward = 47.34
2022-01-26 14:18:11.116 | DEBUG    | __main__:trials:24 - Trial = 21549/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.117 | DEBUG    | __main__:trials:29 - Trial = 21549/30000 | Total reward = 36.59
2022-01-26 14:18:11.121 | DEBUG    | __main__:trials:24 - Trial = 21550/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.123 | DEBUG    | __main__:trials:29 - Trial = 21550/30000 | Total reward = 39.64
2022-01-26 14:18:11.127 | DEBUG    | __main__:trials:24 - Trial = 21551/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.128 | DEBUG    | __main__:trials:29 - Trial = 21551/30000 | Total reward = 42.97
2022-01-26 14:18:11.131 | DEBUG    | __main__:trials:24 - Trial = 21552/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.133 | DEBUG    | __main__:trials:29 - Trial = 21552/30000 | Total reward = 35.65
2022-01-26 14:18:11.137 | DEBUG    | __main__:trials:24 - Trial = 21553/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.139 | DEBUG    | __main__:trials:29 - Trial = 21553/30000 | Total reward = 34.42
2022-01-26 14:18:11.142 | DEBUG    | __main__:trials:24 - Trial = 21554/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.144 | DEBUG    | __main__:trials:29 - Trial = 21554/30000 | Total reward = 34.82
2022-01-26 14:18:11.147 | DEBUG    | __main__:trials:24 - Trial = 21555/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.148 | DEBUG    | __main__:trials:29 - Trial = 21555/30000 | Total reward = 34.84
2022-01-26 14:18:11.151 | DEBUG    | __main__:trials:24 - Trial = 21556/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.153 | DEBUG    | __main__:trials:29 - Trial = 21556/30000 | Total reward = 38.69
2022-01-26 14:18:11.156 | DEBUG    | __main__:trials:24 - Trial = 21557/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.158 | DEBUG    | __main__:trials:29 - Trial = 21557/30000 | Total reward = 34.27
2022-01-26 14:18:11.162 | DEBUG    | __main__:trials:24 - Trial = 21558/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.162 | DEBUG    | __main__:trials:29 - Trial = 21558/30000 | Total reward = 48.46
2022-01-26 14:18:11.167 | DEBUG    | __main__:trials:26 - Trial = 21559/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.169 | DEBUG    | __main__:trials:29 - Trial = 21559/30000 | Total reward = 33.73
2022-01-26 14:18:11.172 | DEBUG    | __main__:trials:24 - Trial = 21560/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.174 | DEBUG    | __main__:trials:29 - Trial = 21560/30000 | Total reward = 34.40
2022-01-26 14:18:11.177 | DEBUG    | __main__:trials:24 - Trial = 21561/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.178 | DEBUG    | __main__:trials:29 - Trial = 21561/30000 | Total reward = 40.33
2022-01-26 14:18:11.183 | DEBUG    | __main__:trials:24 - Trial = 21562/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.184 | DEBUG    | __main__:trials:29 - Trial = 21562/30000 | Total reward = 39.57
2022-01-26 14:18:11.188 | DEBUG    | __main__:trials:26 - Trial = 21563/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.189 | DEBUG    | __main__:trials:29 - Trial = 21563/30000 | Total reward = 24.01
2022-01-26 14:18:11.192 | DEBUG    | __main__:trials:26 - Trial = 21564/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.194 | DEBUG    | __main__:trials:29 - Trial = 21564/30000 | Total reward = 21.55
2022-01-26 14:18:11.198 | DEBUG    | __main__:trials:24 - Trial = 21565/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.199 | DEBUG    | __main__:trials:29 - Trial = 21565/30000 | Total reward = 41.58
2022-01-26 14:18:11.202 | DEBUG    | __main__:trials:24 - Trial = 21566/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.203 | DEBUG    | __main__:trials:29 - Trial = 21566/30000 | Total reward = 48.90
2022-01-26 14:18:11.206 | DEBUG    | __main__:trials:24 - Trial = 21567/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.208 | DEBUG    | __main__:trials:29 - Trial = 21567/30000 | Total reward = 39.88
2022-01-26 14:18:11.211 | DEBUG    | __main__:trials:24 - Trial = 21568/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.212 | DEBUG    | __main__:trials:29 - Trial = 21568/30000 | Total reward = 35.88
2022-01-26 14:18:11.216 | DEBUG    | __main__:trials:24 - Trial = 21569/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.217 | DEBUG    | __main__:trials:29 - Trial = 21569/30000 | Total reward = 39.15
2022-01-26 14:18:11.220 | DEBUG    | __main__:trials:24 - Trial = 21570/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.221 | DEBUG    | __main__:trials:29 - Trial = 21570/30000 | Total reward = 33.56
2022-01-26 14:18:11.224 | DEBUG    | __main__:trials:24 - Trial = 21571/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.225 | DEBUG    | __main__:trials:29 - Trial = 21571/30000 | Total reward = 42.18
2022-01-26 14:18:11.228 | DEBUG    | __main__:trials:24 - Trial = 21572/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.230 | DEBUG    | __main__:trials:29 - Trial = 21572/30000 | Total reward = 32.74
2022-01-26 14:18:11.233 | DEBUG    | __main__:trials:24 - Trial = 21573/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.235 | DEBUG    | __main__:trials:29 - Trial = 21573/30000 | Total reward = 53.62
2022-01-26 14:18:11.238 | DEBUG    | __main__:trials:24 - Trial = 21574/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.238 | DEBUG    | __main__:trials:29 - Trial = 21574/30000 | Total reward = 46.78
2022-01-26 14:18:11.242 | DEBUG    | __main__:trials:24 - Trial = 21575/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.244 | DEBUG    | __main__:trials:29 - Trial = 21575/30000 | Total reward = 46.78
2022-01-26 14:18:11.247 | DEBUG    | __main__:trials:24 - Trial = 21576/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.248 | DEBUG    | __main__:trials:29 - Trial = 21576/30000 | Total reward = 53.35
2022-01-26 14:18:11.252 | DEBUG    | __main__:trials:24 - Trial = 21577/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.253 | DEBUG    | __main__:trials:29 - Trial = 21577/30000 | Total reward = 32.70
2022-01-26 14:18:11.256 | DEBUG    | __main__:trials:24 - Trial = 21578/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.258 | DEBUG    | __main__:trials:29 - Trial = 21578/30000 | Total reward = 34.03
2022-01-26 14:18:11.261 | DEBUG    | __main__:trials:24 - Trial = 21579/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.261 | DEBUG    | __main__:trials:29 - Trial = 21579/30000 | Total reward = 29.60
2022-01-26 14:18:11.265 | DEBUG    | __main__:trials:24 - Trial = 21580/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.266 | DEBUG    | __main__:trials:29 - Trial = 21580/30000 | Total reward = 38.87
2022-01-26 14:18:11.269 | DEBUG    | __main__:trials:24 - Trial = 21581/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.270 | DEBUG    | __main__:trials:29 - Trial = 21581/30000 | Total reward = 37.36
2022-01-26 14:18:11.273 | DEBUG    | __main__:trials:24 - Trial = 21582/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.274 | DEBUG    | __main__:trials:29 - Trial = 21582/30000 | Total reward = 44.62
2022-01-26 14:18:11.277 | DEBUG    | __main__:trials:24 - Trial = 21583/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.278 | DEBUG    | __main__:trials:29 - Trial = 21583/30000 | Total reward = 41.52
2022-01-26 14:18:11.281 | DEBUG    | __main__:trials:24 - Trial = 21584/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.282 | DEBUG    | __main__:trials:29 - Trial = 21584/30000 | Total reward = 37.62
2022-01-26 14:18:11.286 | DEBUG    | __main__:trials:24 - Trial = 21585/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.287 | DEBUG    | __main__:trials:29 - Trial = 21585/30000 | Total reward = 29.20
2022-01-26 14:18:11.290 | DEBUG    | __main__:trials:24 - Trial = 21586/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.291 | DEBUG    | __main__:trials:29 - Trial = 21586/30000 | Total reward = 36.89
2022-01-26 14:18:11.295 | DEBUG    | __main__:trials:24 - Trial = 21587/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.297 | DEBUG    | __main__:trials:29 - Trial = 21587/30000 | Total reward = 50.59
2022-01-26 14:18:11.300 | DEBUG    | __main__:trials:24 - Trial = 21588/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.300 | DEBUG    | __main__:trials:29 - Trial = 21588/30000 | Total reward = 49.52
2022-01-26 14:18:11.304 | DEBUG    | __main__:trials:24 - Trial = 21589/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.306 | DEBUG    | __main__:trials:29 - Trial = 21589/30000 | Total reward = 59.55
2022-01-26 14:18:11.309 | DEBUG    | __main__:trials:24 - Trial = 21590/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.309 | DEBUG    | __main__:trials:29 - Trial = 21590/30000 | Total reward = 33.58
2022-01-26 14:18:11.313 | DEBUG    | __main__:trials:24 - Trial = 21591/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.313 | DEBUG    | __main__:trials:29 - Trial = 21591/30000 | Total reward = 49.26
2022-01-26 14:18:11.317 | DEBUG    | __main__:trials:24 - Trial = 21592/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.318 | DEBUG    | __main__:trials:29 - Trial = 21592/30000 | Total reward = 47.32
2022-01-26 14:18:11.321 | DEBUG    | __main__:trials:24 - Trial = 21593/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.322 | DEBUG    | __main__:trials:29 - Trial = 21593/30000 | Total reward = 51.23
2022-01-26 14:18:11.326 | DEBUG    | __main__:trials:24 - Trial = 21594/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.327 | DEBUG    | __main__:trials:29 - Trial = 21594/30000 | Total reward = 55.61
2022-01-26 14:18:11.330 | DEBUG    | __main__:trials:24 - Trial = 21595/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.331 | DEBUG    | __main__:trials:29 - Trial = 21595/30000 | Total reward = 53.01
2022-01-26 14:18:11.335 | DEBUG    | __main__:trials:24 - Trial = 21596/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.336 | DEBUG    | __main__:trials:29 - Trial = 21596/30000 | Total reward = 48.57
2022-01-26 14:18:11.339 | DEBUG    | __main__:trials:24 - Trial = 21597/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.340 | DEBUG    | __main__:trials:29 - Trial = 21597/30000 | Total reward = 55.35
2022-01-26 14:18:11.343 | DEBUG    | __main__:trials:24 - Trial = 21598/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.344 | DEBUG    | __main__:trials:29 - Trial = 21598/30000 | Total reward = 49.57
2022-01-26 14:18:11.348 | DEBUG    | __main__:trials:24 - Trial = 21599/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.348 | DEBUG    | __main__:trials:29 - Trial = 21599/30000 | Total reward = 47.88
2022-01-26 14:18:11.352 | DEBUG    | __main__:trials:24 - Trial = 21600/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.352 | DEBUG    | __main__:trials:29 - Trial = 21600/30000 | Total reward = 56.31
2022-01-26 14:18:11.356 | DEBUG    | __main__:trials:24 - Trial = 21601/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.357 | DEBUG    | __main__:trials:29 - Trial = 21601/30000 | Total reward = 45.39
2022-01-26 14:18:11.360 | DEBUG    | __main__:trials:24 - Trial = 21602/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.362 | DEBUG    | __main__:trials:29 - Trial = 21602/30000 | Total reward = 53.70
2022-01-26 14:18:11.365 | DEBUG    | __main__:trials:24 - Trial = 21603/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.366 | DEBUG    | __main__:trials:29 - Trial = 21603/30000 | Total reward = 41.29
2022-01-26 14:18:11.369 | DEBUG    | __main__:trials:24 - Trial = 21604/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.371 | DEBUG    | __main__:trials:29 - Trial = 21604/30000 | Total reward = 53.17
2022-01-26 14:18:11.374 | DEBUG    | __main__:trials:24 - Trial = 21605/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.375 | DEBUG    | __main__:trials:29 - Trial = 21605/30000 | Total reward = 40.40
2022-01-26 14:18:11.379 | DEBUG    | __main__:trials:24 - Trial = 21606/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.380 | DEBUG    | __main__:trials:29 - Trial = 21606/30000 | Total reward = 50.15
2022-01-26 14:18:11.384 | DEBUG    | __main__:trials:24 - Trial = 21607/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.384 | DEBUG    | __main__:trials:29 - Trial = 21607/30000 | Total reward = 43.07
2022-01-26 14:18:11.388 | DEBUG    | __main__:trials:24 - Trial = 21608/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.390 | DEBUG    | __main__:trials:29 - Trial = 21608/30000 | Total reward = 63.10
2022-01-26 14:18:11.393 | DEBUG    | __main__:trials:24 - Trial = 21609/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.395 | DEBUG    | __main__:trials:29 - Trial = 21609/30000 | Total reward = 43.28
2022-01-26 14:18:11.398 | DEBUG    | __main__:trials:24 - Trial = 21610/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.399 | DEBUG    | __main__:trials:29 - Trial = 21610/30000 | Total reward = 48.42
2022-01-26 14:18:11.402 | DEBUG    | __main__:trials:24 - Trial = 21611/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.404 | DEBUG    | __main__:trials:29 - Trial = 21611/30000 | Total reward = 54.07
2022-01-26 14:18:11.407 | DEBUG    | __main__:trials:24 - Trial = 21612/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.408 | DEBUG    | __main__:trials:29 - Trial = 21612/30000 | Total reward = 32.17
2022-01-26 14:18:11.411 | DEBUG    | __main__:trials:24 - Trial = 21613/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.412 | DEBUG    | __main__:trials:29 - Trial = 21613/30000 | Total reward = 42.30
2022-01-26 14:18:11.416 | DEBUG    | __main__:trials:24 - Trial = 21614/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.417 | DEBUG    | __main__:trials:29 - Trial = 21614/30000 | Total reward = 41.70
2022-01-26 14:18:11.420 | DEBUG    | __main__:trials:24 - Trial = 21615/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.421 | DEBUG    | __main__:trials:29 - Trial = 21615/30000 | Total reward = 60.28
2022-01-26 14:18:11.424 | DEBUG    | __main__:trials:24 - Trial = 21616/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.425 | DEBUG    | __main__:trials:29 - Trial = 21616/30000 | Total reward = 54.26
2022-01-26 14:18:11.430 | DEBUG    | __main__:trials:24 - Trial = 21617/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.431 | DEBUG    | __main__:trials:29 - Trial = 21617/30000 | Total reward = 58.23
2022-01-26 14:18:11.435 | DEBUG    | __main__:trials:24 - Trial = 21618/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.435 | DEBUG    | __main__:trials:29 - Trial = 21618/30000 | Total reward = 46.62
2022-01-26 14:18:11.439 | DEBUG    | __main__:trials:24 - Trial = 21619/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.439 | DEBUG    | __main__:trials:29 - Trial = 21619/30000 | Total reward = 53.26
2022-01-26 14:18:11.443 | DEBUG    | __main__:trials:24 - Trial = 21620/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.445 | DEBUG    | __main__:trials:29 - Trial = 21620/30000 | Total reward = 53.12
2022-01-26 14:18:11.448 | DEBUG    | __main__:trials:24 - Trial = 21621/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.449 | DEBUG    | __main__:trials:29 - Trial = 21621/30000 | Total reward = 40.31
2022-01-26 14:18:11.453 | DEBUG    | __main__:trials:24 - Trial = 21622/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.454 | DEBUG    | __main__:trials:29 - Trial = 21622/30000 | Total reward = 30.66
2022-01-26 14:18:11.458 | DEBUG    | __main__:trials:24 - Trial = 21623/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.458 | DEBUG    | __main__:trials:29 - Trial = 21623/30000 | Total reward = 50.58
2022-01-26 14:18:11.462 | DEBUG    | __main__:trials:24 - Trial = 21624/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.463 | DEBUG    | __main__:trials:29 - Trial = 21624/30000 | Total reward = 41.11
2022-01-26 14:18:11.466 | DEBUG    | __main__:trials:24 - Trial = 21625/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.467 | DEBUG    | __main__:trials:29 - Trial = 21625/30000 | Total reward = 56.95
2022-01-26 14:18:11.470 | DEBUG    | __main__:trials:24 - Trial = 21626/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.472 | DEBUG    | __main__:trials:29 - Trial = 21626/30000 | Total reward = 57.76
2022-01-26 14:18:11.475 | DEBUG    | __main__:trials:24 - Trial = 21627/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.476 | DEBUG    | __main__:trials:29 - Trial = 21627/30000 | Total reward = 55.98
2022-01-26 14:18:11.479 | DEBUG    | __main__:trials:24 - Trial = 21628/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.481 | DEBUG    | __main__:trials:29 - Trial = 21628/30000 | Total reward = 50.77
2022-01-26 14:18:11.484 | DEBUG    | __main__:trials:24 - Trial = 21629/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.486 | DEBUG    | __main__:trials:29 - Trial = 21629/30000 | Total reward = 49.69
2022-01-26 14:18:11.489 | DEBUG    | __main__:trials:24 - Trial = 21630/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.489 | DEBUG    | __main__:trials:29 - Trial = 21630/30000 | Total reward = 30.66
2022-01-26 14:18:11.493 | DEBUG    | __main__:trials:24 - Trial = 21631/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.494 | DEBUG    | __main__:trials:29 - Trial = 21631/30000 | Total reward = 39.57
2022-01-26 14:18:11.497 | DEBUG    | __main__:trials:24 - Trial = 21632/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.498 | DEBUG    | __main__:trials:29 - Trial = 21632/30000 | Total reward = 51.60
2022-01-26 14:18:11.501 | DEBUG    | __main__:trials:24 - Trial = 21633/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.502 | DEBUG    | __main__:trials:29 - Trial = 21633/30000 | Total reward = 39.64
2022-01-26 14:18:11.505 | DEBUG    | __main__:trials:24 - Trial = 21634/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.506 | DEBUG    | __main__:trials:29 - Trial = 21634/30000 | Total reward = 51.65
2022-01-26 14:18:11.510 | DEBUG    | __main__:trials:24 - Trial = 21635/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.511 | DEBUG    | __main__:trials:29 - Trial = 21635/30000 | Total reward = 52.88
2022-01-26 14:18:11.514 | DEBUG    | __main__:trials:24 - Trial = 21636/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.516 | DEBUG    | __main__:trials:29 - Trial = 21636/30000 | Total reward = 56.62
2022-01-26 14:18:11.519 | DEBUG    | __main__:trials:24 - Trial = 21637/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.520 | DEBUG    | __main__:trials:29 - Trial = 21637/30000 | Total reward = 48.75
2022-01-26 14:18:11.523 | DEBUG    | __main__:trials:24 - Trial = 21638/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.523 | DEBUG    | __main__:trials:29 - Trial = 21638/30000 | Total reward = 54.81
2022-01-26 14:18:11.527 | DEBUG    | __main__:trials:24 - Trial = 21639/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.528 | DEBUG    | __main__:trials:29 - Trial = 21639/30000 | Total reward = 51.46
2022-01-26 14:18:11.532 | DEBUG    | __main__:trials:24 - Trial = 21640/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.532 | DEBUG    | __main__:trials:29 - Trial = 21640/30000 | Total reward = 56.43
2022-01-26 14:18:11.536 | DEBUG    | __main__:trials:24 - Trial = 21641/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.536 | DEBUG    | __main__:trials:29 - Trial = 21641/30000 | Total reward = 49.23
2022-01-26 14:18:11.541 | DEBUG    | __main__:trials:24 - Trial = 21642/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.542 | DEBUG    | __main__:trials:29 - Trial = 21642/30000 | Total reward = 39.32
2022-01-26 14:18:11.546 | DEBUG    | __main__:trials:26 - Trial = 21643/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.546 | DEBUG    | __main__:trials:29 - Trial = 21643/30000 | Total reward = 31.14
2022-01-26 14:18:11.550 | DEBUG    | __main__:trials:24 - Trial = 21644/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.551 | DEBUG    | __main__:trials:29 - Trial = 21644/30000 | Total reward = 52.93
2022-01-26 14:18:11.554 | DEBUG    | __main__:trials:24 - Trial = 21645/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.556 | DEBUG    | __main__:trials:29 - Trial = 21645/30000 | Total reward = 62.86
2022-01-26 14:18:11.559 | DEBUG    | __main__:trials:24 - Trial = 21646/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.559 | DEBUG    | __main__:trials:29 - Trial = 21646/30000 | Total reward = 59.19
2022-01-26 14:18:11.563 | DEBUG    | __main__:trials:24 - Trial = 21647/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.565 | DEBUG    | __main__:trials:29 - Trial = 21647/30000 | Total reward = 52.67
2022-01-26 14:18:11.568 | DEBUG    | __main__:trials:24 - Trial = 21648/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.569 | DEBUG    | __main__:trials:29 - Trial = 21648/30000 | Total reward = 41.67
2022-01-26 14:18:11.572 | DEBUG    | __main__:trials:24 - Trial = 21649/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.574 | DEBUG    | __main__:trials:29 - Trial = 21649/30000 | Total reward = 39.57
2022-01-26 14:18:11.578 | DEBUG    | __main__:trials:24 - Trial = 21650/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.578 | DEBUG    | __main__:trials:29 - Trial = 21650/30000 | Total reward = 39.54
2022-01-26 14:18:11.582 | DEBUG    | __main__:trials:24 - Trial = 21651/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.584 | DEBUG    | __main__:trials:29 - Trial = 21651/30000 | Total reward = 33.03
2022-01-26 14:18:11.587 | DEBUG    | __main__:trials:24 - Trial = 21652/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.588 | DEBUG    | __main__:trials:29 - Trial = 21652/30000 | Total reward = 47.30
2022-01-26 14:18:11.591 | DEBUG    | __main__:trials:24 - Trial = 21653/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.593 | DEBUG    | __main__:trials:29 - Trial = 21653/30000 | Total reward = 49.35
2022-01-26 14:18:11.597 | DEBUG    | __main__:trials:24 - Trial = 21654/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.598 | DEBUG    | __main__:trials:29 - Trial = 21654/30000 | Total reward = 47.51
2022-01-26 14:18:11.601 | DEBUG    | __main__:trials:24 - Trial = 21655/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.603 | DEBUG    | __main__:trials:29 - Trial = 21655/30000 | Total reward = 32.17
2022-01-26 14:18:11.606 | DEBUG    | __main__:trials:24 - Trial = 21656/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.608 | DEBUG    | __main__:trials:29 - Trial = 21656/30000 | Total reward = 37.41
2022-01-26 14:18:11.611 | DEBUG    | __main__:trials:24 - Trial = 21657/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.612 | DEBUG    | __main__:trials:29 - Trial = 21657/30000 | Total reward = 36.22
2022-01-26 14:18:11.615 | DEBUG    | __main__:trials:24 - Trial = 21658/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.617 | DEBUG    | __main__:trials:29 - Trial = 21658/30000 | Total reward = 34.15
2022-01-26 14:18:11.620 | DEBUG    | __main__:trials:24 - Trial = 21659/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.621 | DEBUG    | __main__:trials:29 - Trial = 21659/30000 | Total reward = 36.82
2022-01-26 14:18:11.625 | DEBUG    | __main__:trials:24 - Trial = 21660/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.626 | DEBUG    | __main__:trials:29 - Trial = 21660/30000 | Total reward = 37.16
2022-01-26 14:18:11.630 | DEBUG    | __main__:trials:24 - Trial = 21661/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.631 | DEBUG    | __main__:trials:29 - Trial = 21661/30000 | Total reward = 42.33
2022-01-26 14:18:11.634 | DEBUG    | __main__:trials:24 - Trial = 21662/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.636 | DEBUG    | __main__:trials:29 - Trial = 21662/30000 | Total reward = 60.28
2022-01-26 14:18:11.639 | DEBUG    | __main__:trials:24 - Trial = 21663/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.641 | DEBUG    | __main__:trials:29 - Trial = 21663/30000 | Total reward = 35.97
2022-01-26 14:18:11.643 | DEBUG    | __main__:trials:26 - Trial = 21664/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.644 | DEBUG    | __main__:trials:29 - Trial = 21664/30000 | Total reward = 29.74
2022-01-26 14:18:11.647 | DEBUG    | __main__:trials:24 - Trial = 21665/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.648 | DEBUG    | __main__:trials:29 - Trial = 21665/30000 | Total reward = 37.43
2022-01-26 14:18:11.651 | DEBUG    | __main__:trials:24 - Trial = 21666/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.653 | DEBUG    | __main__:trials:29 - Trial = 21666/30000 | Total reward = 39.18
2022-01-26 14:18:11.656 | DEBUG    | __main__:trials:24 - Trial = 21667/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.658 | DEBUG    | __main__:trials:29 - Trial = 21667/30000 | Total reward = 43.92
2022-01-26 14:18:11.662 | DEBUG    | __main__:trials:24 - Trial = 21668/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.662 | DEBUG    | __main__:trials:29 - Trial = 21668/30000 | Total reward = 34.33
2022-01-26 14:18:11.666 | DEBUG    | __main__:trials:24 - Trial = 21669/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.667 | DEBUG    | __main__:trials:29 - Trial = 21669/30000 | Total reward = 39.57
2022-01-26 14:18:11.671 | DEBUG    | __main__:trials:26 - Trial = 21670/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.673 | DEBUG    | __main__:trials:29 - Trial = 21670/30000 | Total reward = 20.86
2022-01-26 14:18:11.676 | DEBUG    | __main__:trials:24 - Trial = 21671/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.676 | DEBUG    | __main__:trials:29 - Trial = 21671/30000 | Total reward = 41.67
2022-01-26 14:18:11.680 | DEBUG    | __main__:trials:24 - Trial = 21672/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.681 | DEBUG    | __main__:trials:29 - Trial = 21672/30000 | Total reward = 39.88
2022-01-26 14:18:11.684 | DEBUG    | __main__:trials:24 - Trial = 21673/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.685 | DEBUG    | __main__:trials:29 - Trial = 21673/30000 | Total reward = 39.53
2022-01-26 14:18:11.689 | DEBUG    | __main__:trials:24 - Trial = 21674/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.690 | DEBUG    | __main__:trials:29 - Trial = 21674/30000 | Total reward = 36.75
2022-01-26 14:18:11.694 | DEBUG    | __main__:trials:24 - Trial = 21675/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.695 | DEBUG    | __main__:trials:29 - Trial = 21675/30000 | Total reward = 38.34
2022-01-26 14:18:11.698 | DEBUG    | __main__:trials:24 - Trial = 21676/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.699 | DEBUG    | __main__:trials:29 - Trial = 21676/30000 | Total reward = 55.45
2022-01-26 14:18:11.703 | DEBUG    | __main__:trials:24 - Trial = 21677/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.704 | DEBUG    | __main__:trials:29 - Trial = 21677/30000 | Total reward = 64.23
2022-01-26 14:18:11.708 | DEBUG    | __main__:trials:26 - Trial = 21678/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.709 | DEBUG    | __main__:trials:29 - Trial = 21678/30000 | Total reward = 28.69
2022-01-26 14:18:11.712 | DEBUG    | __main__:trials:24 - Trial = 21679/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.714 | DEBUG    | __main__:trials:29 - Trial = 21679/30000 | Total reward = 28.98
2022-01-26 14:18:11.717 | DEBUG    | __main__:trials:24 - Trial = 21680/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.718 | DEBUG    | __main__:trials:29 - Trial = 21680/30000 | Total reward = 55.65
2022-01-26 14:18:11.722 | DEBUG    | __main__:trials:24 - Trial = 21681/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.723 | DEBUG    | __main__:trials:29 - Trial = 21681/30000 | Total reward = 36.99
2022-01-26 14:18:11.726 | DEBUG    | __main__:trials:24 - Trial = 21682/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.727 | DEBUG    | __main__:trials:29 - Trial = 21682/30000 | Total reward = 44.55
2022-01-26 14:18:11.731 | DEBUG    | __main__:trials:24 - Trial = 21683/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.732 | DEBUG    | __main__:trials:29 - Trial = 21683/30000 | Total reward = 43.17
2022-01-26 14:18:11.735 | DEBUG    | __main__:trials:24 - Trial = 21684/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.737 | DEBUG    | __main__:trials:29 - Trial = 21684/30000 | Total reward = 38.01
2022-01-26 14:18:11.740 | DEBUG    | __main__:trials:24 - Trial = 21685/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.742 | DEBUG    | __main__:trials:29 - Trial = 21685/30000 | Total reward = 34.80
2022-01-26 14:18:11.745 | DEBUG    | __main__:trials:24 - Trial = 21686/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.746 | DEBUG    | __main__:trials:29 - Trial = 21686/30000 | Total reward = 57.01
2022-01-26 14:18:11.749 | DEBUG    | __main__:trials:24 - Trial = 21687/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.750 | DEBUG    | __main__:trials:29 - Trial = 21687/30000 | Total reward = 41.62
2022-01-26 14:18:11.753 | DEBUG    | __main__:trials:24 - Trial = 21688/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.754 | DEBUG    | __main__:trials:29 - Trial = 21688/30000 | Total reward = 53.55
2022-01-26 14:18:11.757 | DEBUG    | __main__:trials:24 - Trial = 21689/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.759 | DEBUG    | __main__:trials:29 - Trial = 21689/30000 | Total reward = 30.44
2022-01-26 14:18:11.762 | DEBUG    | __main__:trials:24 - Trial = 21690/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.764 | DEBUG    | __main__:trials:29 - Trial = 21690/30000 | Total reward = 52.06
2022-01-26 14:18:11.767 | DEBUG    | __main__:trials:24 - Trial = 21691/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.769 | DEBUG    | __main__:trials:29 - Trial = 21691/30000 | Total reward = 37.02
2022-01-26 14:18:11.772 | DEBUG    | __main__:trials:24 - Trial = 21692/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.773 | DEBUG    | __main__:trials:29 - Trial = 21692/30000 | Total reward = 56.30
2022-01-26 14:18:11.776 | DEBUG    | __main__:trials:24 - Trial = 21693/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.777 | DEBUG    | __main__:trials:29 - Trial = 21693/30000 | Total reward = 37.86
2022-01-26 14:18:11.780 | DEBUG    | __main__:trials:24 - Trial = 21694/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.782 | DEBUG    | __main__:trials:29 - Trial = 21694/30000 | Total reward = 39.57
2022-01-26 14:18:11.786 | DEBUG    | __main__:trials:24 - Trial = 21695/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.787 | DEBUG    | __main__:trials:29 - Trial = 21695/30000 | Total reward = 50.74
2022-01-26 14:18:11.790 | DEBUG    | __main__:trials:26 - Trial = 21696/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.792 | DEBUG    | __main__:trials:29 - Trial = 21696/30000 | Total reward = 26.64
2022-01-26 14:18:11.795 | DEBUG    | __main__:trials:24 - Trial = 21697/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.795 | DEBUG    | __main__:trials:29 - Trial = 21697/30000 | Total reward = 40.60
2022-01-26 14:18:11.799 | DEBUG    | __main__:trials:24 - Trial = 21698/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.800 | DEBUG    | __main__:trials:29 - Trial = 21698/30000 | Total reward = 59.86
2022-01-26 14:18:11.803 | DEBUG    | __main__:trials:24 - Trial = 21699/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.805 | DEBUG    | __main__:trials:29 - Trial = 21699/30000 | Total reward = 50.86
2022-01-26 14:18:11.808 | DEBUG    | __main__:trials:24 - Trial = 21700/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.810 | DEBUG    | __main__:trials:29 - Trial = 21700/30000 | Total reward = 52.71
2022-01-26 14:18:11.813 | DEBUG    | __main__:trials:24 - Trial = 21701/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.814 | DEBUG    | __main__:trials:29 - Trial = 21701/30000 | Total reward = 46.34
2022-01-26 14:18:11.817 | DEBUG    | __main__:trials:24 - Trial = 21702/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.819 | DEBUG    | __main__:trials:29 - Trial = 21702/30000 | Total reward = 54.42
2022-01-26 14:18:11.822 | DEBUG    | __main__:trials:24 - Trial = 21703/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.824 | DEBUG    | __main__:trials:29 - Trial = 21703/30000 | Total reward = 41.24
2022-01-26 14:18:11.827 | DEBUG    | __main__:trials:24 - Trial = 21704/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.829 | DEBUG    | __main__:trials:29 - Trial = 21704/30000 | Total reward = 51.97
2022-01-26 14:18:11.832 | DEBUG    | __main__:trials:24 - Trial = 21705/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.834 | DEBUG    | __main__:trials:29 - Trial = 21705/30000 | Total reward = 37.22
2022-01-26 14:18:11.836 | DEBUG    | __main__:trials:24 - Trial = 21706/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.837 | DEBUG    | __main__:trials:29 - Trial = 21706/30000 | Total reward = 32.80
2022-01-26 14:18:11.841 | DEBUG    | __main__:trials:24 - Trial = 21707/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.841 | DEBUG    | __main__:trials:29 - Trial = 21707/30000 | Total reward = 37.86
2022-01-26 14:18:11.845 | DEBUG    | __main__:trials:24 - Trial = 21708/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.846 | DEBUG    | __main__:trials:29 - Trial = 21708/30000 | Total reward = 36.95
2022-01-26 14:18:11.849 | DEBUG    | __main__:trials:24 - Trial = 21709/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.850 | DEBUG    | __main__:trials:29 - Trial = 21709/30000 | Total reward = 58.98
2022-01-26 14:18:11.853 | DEBUG    | __main__:trials:24 - Trial = 21710/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.854 | DEBUG    | __main__:trials:29 - Trial = 21710/30000 | Total reward = 54.75
2022-01-26 14:18:11.858 | DEBUG    | __main__:trials:26 - Trial = 21711/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.859 | DEBUG    | __main__:trials:29 - Trial = 21711/30000 | Total reward = 27.43
2022-01-26 14:18:11.862 | DEBUG    | __main__:trials:24 - Trial = 21712/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.862 | DEBUG    | __main__:trials:29 - Trial = 21712/30000 | Total reward = 37.63
2022-01-26 14:18:11.866 | DEBUG    | __main__:trials:24 - Trial = 21713/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.867 | DEBUG    | __main__:trials:29 - Trial = 21713/30000 | Total reward = 43.89
2022-01-26 14:18:11.871 | DEBUG    | __main__:trials:24 - Trial = 21714/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.871 | DEBUG    | __main__:trials:29 - Trial = 21714/30000 | Total reward = 37.48
2022-01-26 14:18:11.875 | DEBUG    | __main__:trials:24 - Trial = 21715/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.875 | DEBUG    | __main__:trials:29 - Trial = 21715/30000 | Total reward = 35.79
2022-01-26 14:18:11.879 | DEBUG    | __main__:trials:24 - Trial = 21716/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.880 | DEBUG    | __main__:trials:29 - Trial = 21716/30000 | Total reward = 34.77
2022-01-26 14:18:11.883 | DEBUG    | __main__:trials:24 - Trial = 21717/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.885 | DEBUG    | __main__:trials:29 - Trial = 21717/30000 | Total reward = 48.45
2022-01-26 14:18:11.889 | DEBUG    | __main__:trials:24 - Trial = 21718/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.890 | DEBUG    | __main__:trials:29 - Trial = 21718/30000 | Total reward = 39.35
2022-01-26 14:18:11.894 | DEBUG    | __main__:trials:24 - Trial = 21719/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.895 | DEBUG    | __main__:trials:29 - Trial = 21719/30000 | Total reward = 37.66
2022-01-26 14:18:11.899 | DEBUG    | __main__:trials:24 - Trial = 21720/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.900 | DEBUG    | __main__:trials:29 - Trial = 21720/30000 | Total reward = 39.84
2022-01-26 14:18:11.903 | DEBUG    | __main__:trials:24 - Trial = 21721/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.905 | DEBUG    | __main__:trials:29 - Trial = 21721/30000 | Total reward = 34.44
2022-01-26 14:18:11.909 | DEBUG    | __main__:trials:24 - Trial = 21722/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.910 | DEBUG    | __main__:trials:29 - Trial = 21722/30000 | Total reward = 34.63
2022-01-26 14:18:11.914 | DEBUG    | __main__:trials:24 - Trial = 21723/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.914 | DEBUG    | __main__:trials:29 - Trial = 21723/30000 | Total reward = 35.42
2022-01-26 14:18:11.919 | DEBUG    | __main__:trials:24 - Trial = 21724/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.921 | DEBUG    | __main__:trials:29 - Trial = 21724/30000 | Total reward = 31.47
2022-01-26 14:18:11.923 | DEBUG    | __main__:trials:26 - Trial = 21725/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.925 | DEBUG    | __main__:trials:29 - Trial = 21725/30000 | Total reward = 24.30
2022-01-26 14:18:11.929 | DEBUG    | __main__:trials:24 - Trial = 21726/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.930 | DEBUG    | __main__:trials:29 - Trial = 21726/30000 | Total reward = 51.18
2022-01-26 14:18:11.933 | DEBUG    | __main__:trials:24 - Trial = 21727/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.934 | DEBUG    | __main__:trials:29 - Trial = 21727/30000 | Total reward = 52.10
2022-01-26 14:18:11.937 | DEBUG    | __main__:trials:24 - Trial = 21728/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.938 | DEBUG    | __main__:trials:29 - Trial = 21728/30000 | Total reward = 53.23
2022-01-26 14:18:11.941 | DEBUG    | __main__:trials:24 - Trial = 21729/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.943 | DEBUG    | __main__:trials:29 - Trial = 21729/30000 | Total reward = 56.64
2022-01-26 14:18:11.947 | DEBUG    | __main__:trials:24 - Trial = 21730/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.948 | DEBUG    | __main__:trials:29 - Trial = 21730/30000 | Total reward = 50.62
2022-01-26 14:18:11.952 | DEBUG    | __main__:trials:24 - Trial = 21731/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.953 | DEBUG    | __main__:trials:29 - Trial = 21731/30000 | Total reward = 53.55
2022-01-26 14:18:11.957 | DEBUG    | __main__:trials:26 - Trial = 21732/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.958 | DEBUG    | __main__:trials:29 - Trial = 21732/30000 | Total reward = 29.55
2022-01-26 14:18:11.962 | DEBUG    | __main__:trials:24 - Trial = 21733/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.963 | DEBUG    | __main__:trials:29 - Trial = 21733/30000 | Total reward = 40.89
2022-01-26 14:18:11.967 | DEBUG    | __main__:trials:24 - Trial = 21734/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.967 | DEBUG    | __main__:trials:29 - Trial = 21734/30000 | Total reward = 53.55
2022-01-26 14:18:11.972 | DEBUG    | __main__:trials:26 - Trial = 21735/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:11.973 | DEBUG    | __main__:trials:29 - Trial = 21735/30000 | Total reward = 24.59
2022-01-26 14:18:11.977 | DEBUG    | __main__:trials:24 - Trial = 21736/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.979 | DEBUG    | __main__:trials:29 - Trial = 21736/30000 | Total reward = 33.66
2022-01-26 14:18:11.982 | DEBUG    | __main__:trials:24 - Trial = 21737/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.983 | DEBUG    | __main__:trials:29 - Trial = 21737/30000 | Total reward = 51.16
2022-01-26 14:18:11.986 | DEBUG    | __main__:trials:24 - Trial = 21738/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.988 | DEBUG    | __main__:trials:29 - Trial = 21738/30000 | Total reward = 50.72
2022-01-26 14:18:11.992 | DEBUG    | __main__:trials:24 - Trial = 21739/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.993 | DEBUG    | __main__:trials:29 - Trial = 21739/30000 | Total reward = 41.66
2022-01-26 14:18:11.996 | DEBUG    | __main__:trials:24 - Trial = 21740/30000 | Max number of steps (20) reached
2022-01-26 14:18:11.998 | DEBUG    | __main__:trials:29 - Trial = 21740/30000 | Total reward = 53.23
2022-01-26 14:18:12.000 | DEBUG    | __main__:trials:24 - Trial = 21741/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.001 | DEBUG    | __main__:trials:29 - Trial = 21741/30000 | Total reward = 49.59
2022-01-26 14:18:12.005 | DEBUG    | __main__:trials:24 - Trial = 21742/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.006 | DEBUG    | __main__:trials:29 - Trial = 21742/30000 | Total reward = 47.98
2022-01-26 14:18:12.009 | DEBUG    | __main__:trials:26 - Trial = 21743/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.010 | DEBUG    | __main__:trials:29 - Trial = 21743/30000 | Total reward = 29.43
2022-01-26 14:18:12.014 | DEBUG    | __main__:trials:24 - Trial = 21744/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.016 | DEBUG    | __main__:trials:29 - Trial = 21744/30000 | Total reward = 52.91
2022-01-26 14:18:12.019 | DEBUG    | __main__:trials:24 - Trial = 21745/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.020 | DEBUG    | __main__:trials:29 - Trial = 21745/30000 | Total reward = 56.48
2022-01-26 14:18:12.024 | DEBUG    | __main__:trials:24 - Trial = 21746/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.025 | DEBUG    | __main__:trials:29 - Trial = 21746/30000 | Total reward = 47.31
2022-01-26 14:18:12.029 | DEBUG    | __main__:trials:24 - Trial = 21747/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.029 | DEBUG    | __main__:trials:29 - Trial = 21747/30000 | Total reward = 26.55
2022-01-26 14:18:12.033 | DEBUG    | __main__:trials:24 - Trial = 21748/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.034 | DEBUG    | __main__:trials:29 - Trial = 21748/30000 | Total reward = 43.58
2022-01-26 14:18:12.038 | DEBUG    | __main__:trials:24 - Trial = 21749/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.039 | DEBUG    | __main__:trials:29 - Trial = 21749/30000 | Total reward = 50.68
2022-01-26 14:18:12.042 | DEBUG    | __main__:trials:24 - Trial = 21750/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.043 | DEBUG    | __main__:trials:29 - Trial = 21750/30000 | Total reward = 46.49
2022-01-26 14:18:12.046 | DEBUG    | __main__:trials:24 - Trial = 21751/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.048 | DEBUG    | __main__:trials:29 - Trial = 21751/30000 | Total reward = 54.47
2022-01-26 14:18:12.052 | DEBUG    | __main__:trials:24 - Trial = 21752/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.053 | DEBUG    | __main__:trials:29 - Trial = 21752/30000 | Total reward = 58.64
2022-01-26 14:18:12.058 | DEBUG    | __main__:trials:24 - Trial = 21753/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.060 | DEBUG    | __main__:trials:29 - Trial = 21753/30000 | Total reward = 57.87
2022-01-26 14:18:12.063 | DEBUG    | __main__:trials:24 - Trial = 21754/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.065 | DEBUG    | __main__:trials:29 - Trial = 21754/30000 | Total reward = 39.70
2022-01-26 14:18:12.068 | DEBUG    | __main__:trials:24 - Trial = 21755/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.069 | DEBUG    | __main__:trials:29 - Trial = 21755/30000 | Total reward = 42.48
2022-01-26 14:18:12.073 | DEBUG    | __main__:trials:24 - Trial = 21756/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.073 | DEBUG    | __main__:trials:29 - Trial = 21756/30000 | Total reward = 58.21
2022-01-26 14:18:12.077 | DEBUG    | __main__:trials:24 - Trial = 21757/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.078 | DEBUG    | __main__:trials:29 - Trial = 21757/30000 | Total reward = 52.27
2022-01-26 14:18:12.081 | DEBUG    | __main__:trials:24 - Trial = 21758/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.082 | DEBUG    | __main__:trials:29 - Trial = 21758/30000 | Total reward = 36.36
2022-01-26 14:18:12.086 | DEBUG    | __main__:trials:24 - Trial = 21759/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.086 | DEBUG    | __main__:trials:29 - Trial = 21759/30000 | Total reward = 48.33
2022-01-26 14:18:12.090 | DEBUG    | __main__:trials:24 - Trial = 21760/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.092 | DEBUG    | __main__:trials:29 - Trial = 21760/30000 | Total reward = 42.13
2022-01-26 14:18:12.095 | DEBUG    | __main__:trials:24 - Trial = 21761/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.097 | DEBUG    | __main__:trials:29 - Trial = 21761/30000 | Total reward = 57.03
2022-01-26 14:18:12.100 | DEBUG    | __main__:trials:24 - Trial = 21762/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.100 | DEBUG    | __main__:trials:29 - Trial = 21762/30000 | Total reward = 47.96
2022-01-26 14:18:12.104 | DEBUG    | __main__:trials:24 - Trial = 21763/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.106 | DEBUG    | __main__:trials:29 - Trial = 21763/30000 | Total reward = 59.60
2022-01-26 14:18:12.109 | DEBUG    | __main__:trials:24 - Trial = 21764/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.110 | DEBUG    | __main__:trials:29 - Trial = 21764/30000 | Total reward = 49.62
2022-01-26 14:18:12.114 | DEBUG    | __main__:trials:24 - Trial = 21765/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.114 | DEBUG    | __main__:trials:29 - Trial = 21765/30000 | Total reward = 56.66
2022-01-26 14:18:12.118 | DEBUG    | __main__:trials:24 - Trial = 21766/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.119 | DEBUG    | __main__:trials:29 - Trial = 21766/30000 | Total reward = 54.12
2022-01-26 14:18:12.123 | DEBUG    | __main__:trials:24 - Trial = 21767/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.124 | DEBUG    | __main__:trials:29 - Trial = 21767/30000 | Total reward = 43.08
2022-01-26 14:18:12.128 | DEBUG    | __main__:trials:24 - Trial = 21768/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.128 | DEBUG    | __main__:trials:29 - Trial = 21768/30000 | Total reward = 57.02
2022-01-26 14:18:12.132 | DEBUG    | __main__:trials:24 - Trial = 21769/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.133 | DEBUG    | __main__:trials:29 - Trial = 21769/30000 | Total reward = 50.43
2022-01-26 14:18:12.136 | DEBUG    | __main__:trials:24 - Trial = 21770/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.137 | DEBUG    | __main__:trials:29 - Trial = 21770/30000 | Total reward = 54.53
2022-01-26 14:18:12.141 | DEBUG    | __main__:trials:24 - Trial = 21771/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.142 | DEBUG    | __main__:trials:29 - Trial = 21771/30000 | Total reward = 59.04
2022-01-26 14:18:12.145 | DEBUG    | __main__:trials:24 - Trial = 21772/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.146 | DEBUG    | __main__:trials:29 - Trial = 21772/30000 | Total reward = 43.85
2022-01-26 14:18:12.150 | DEBUG    | __main__:trials:24 - Trial = 21773/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.151 | DEBUG    | __main__:trials:29 - Trial = 21773/30000 | Total reward = 52.99
2022-01-26 14:18:12.155 | DEBUG    | __main__:trials:24 - Trial = 21774/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.157 | DEBUG    | __main__:trials:29 - Trial = 21774/30000 | Total reward = 52.23
2022-01-26 14:18:12.160 | DEBUG    | __main__:trials:24 - Trial = 21775/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.162 | DEBUG    | __main__:trials:29 - Trial = 21775/30000 | Total reward = 40.56
2022-01-26 14:18:12.165 | DEBUG    | __main__:trials:24 - Trial = 21776/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.166 | DEBUG    | __main__:trials:29 - Trial = 21776/30000 | Total reward = 56.65
2022-01-26 14:18:12.169 | DEBUG    | __main__:trials:24 - Trial = 21777/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.170 | DEBUG    | __main__:trials:29 - Trial = 21777/30000 | Total reward = 26.53
2022-01-26 14:18:12.173 | DEBUG    | __main__:trials:24 - Trial = 21778/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.174 | DEBUG    | __main__:trials:29 - Trial = 21778/30000 | Total reward = 43.98
2022-01-26 14:18:12.178 | DEBUG    | __main__:trials:24 - Trial = 21779/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.180 | DEBUG    | __main__:trials:29 - Trial = 21779/30000 | Total reward = 42.49
2022-01-26 14:18:12.183 | DEBUG    | __main__:trials:24 - Trial = 21780/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.185 | DEBUG    | __main__:trials:29 - Trial = 21780/30000 | Total reward = 33.42
2022-01-26 14:18:12.188 | DEBUG    | __main__:trials:24 - Trial = 21781/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.189 | DEBUG    | __main__:trials:29 - Trial = 21781/30000 | Total reward = 32.67
2022-01-26 14:18:12.192 | DEBUG    | __main__:trials:24 - Trial = 21782/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.194 | DEBUG    | __main__:trials:29 - Trial = 21782/30000 | Total reward = 47.04
2022-01-26 14:18:12.198 | DEBUG    | __main__:trials:24 - Trial = 21783/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.199 | DEBUG    | __main__:trials:29 - Trial = 21783/30000 | Total reward = 42.81
2022-01-26 14:18:12.202 | DEBUG    | __main__:trials:24 - Trial = 21784/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.204 | DEBUG    | __main__:trials:29 - Trial = 21784/30000 | Total reward = 39.61
2022-01-26 14:18:12.207 | DEBUG    | __main__:trials:24 - Trial = 21785/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.208 | DEBUG    | __main__:trials:29 - Trial = 21785/30000 | Total reward = 39.80
2022-01-26 14:18:12.212 | DEBUG    | __main__:trials:24 - Trial = 21786/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.212 | DEBUG    | __main__:trials:29 - Trial = 21786/30000 | Total reward = 34.00
2022-01-26 14:18:12.216 | DEBUG    | __main__:trials:24 - Trial = 21787/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.218 | DEBUG    | __main__:trials:29 - Trial = 21787/30000 | Total reward = 40.89
2022-01-26 14:18:12.221 | DEBUG    | __main__:trials:24 - Trial = 21788/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.222 | DEBUG    | __main__:trials:29 - Trial = 21788/30000 | Total reward = 49.22
2022-01-26 14:18:12.225 | DEBUG    | __main__:trials:24 - Trial = 21789/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.226 | DEBUG    | __main__:trials:29 - Trial = 21789/30000 | Total reward = 37.75
2022-01-26 14:18:12.230 | DEBUG    | __main__:trials:24 - Trial = 21790/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.231 | DEBUG    | __main__:trials:29 - Trial = 21790/30000 | Total reward = 46.45
2022-01-26 14:18:12.234 | DEBUG    | __main__:trials:26 - Trial = 21791/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.236 | DEBUG    | __main__:trials:29 - Trial = 21791/30000 | Total reward = 17.74
2022-01-26 14:18:12.239 | DEBUG    | __main__:trials:24 - Trial = 21792/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.239 | DEBUG    | __main__:trials:29 - Trial = 21792/30000 | Total reward = 39.57
2022-01-26 14:18:12.243 | DEBUG    | __main__:trials:24 - Trial = 21793/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.243 | DEBUG    | __main__:trials:29 - Trial = 21793/30000 | Total reward = 35.75
2022-01-26 14:18:12.247 | DEBUG    | __main__:trials:26 - Trial = 21794/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.248 | DEBUG    | __main__:trials:29 - Trial = 21794/30000 | Total reward = 22.48
2022-01-26 14:18:12.251 | DEBUG    | __main__:trials:26 - Trial = 21795/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.252 | DEBUG    | __main__:trials:29 - Trial = 21795/30000 | Total reward = 21.36
2022-01-26 14:18:12.255 | DEBUG    | __main__:trials:24 - Trial = 21796/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.257 | DEBUG    | __main__:trials:29 - Trial = 21796/30000 | Total reward = 33.87
2022-01-26 14:18:12.261 | DEBUG    | __main__:trials:24 - Trial = 21797/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.262 | DEBUG    | __main__:trials:29 - Trial = 21797/30000 | Total reward = 53.96
2022-01-26 14:18:12.265 | DEBUG    | __main__:trials:24 - Trial = 21798/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.266 | DEBUG    | __main__:trials:29 - Trial = 21798/30000 | Total reward = 44.02
2022-01-26 14:18:12.270 | DEBUG    | __main__:trials:24 - Trial = 21799/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.271 | DEBUG    | __main__:trials:29 - Trial = 21799/30000 | Total reward = 48.21
2022-01-26 14:18:12.273 | DEBUG    | __main__:trials:26 - Trial = 21800/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.274 | DEBUG    | __main__:trials:29 - Trial = 21800/30000 | Total reward = 13.16
2022-01-26 14:18:12.277 | DEBUG    | __main__:trials:26 - Trial = 21801/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.278 | DEBUG    | __main__:trials:29 - Trial = 21801/30000 | Total reward = 30.98
2022-01-26 14:18:12.281 | DEBUG    | __main__:trials:24 - Trial = 21802/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.283 | DEBUG    | __main__:trials:29 - Trial = 21802/30000 | Total reward = 34.69
2022-01-26 14:18:12.286 | DEBUG    | __main__:trials:24 - Trial = 21803/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.287 | DEBUG    | __main__:trials:29 - Trial = 21803/30000 | Total reward = 29.21
2022-01-26 14:18:12.290 | DEBUG    | __main__:trials:24 - Trial = 21804/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.291 | DEBUG    | __main__:trials:29 - Trial = 21804/30000 | Total reward = 36.09
2022-01-26 14:18:12.294 | DEBUG    | __main__:trials:24 - Trial = 21805/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.296 | DEBUG    | __main__:trials:29 - Trial = 21805/30000 | Total reward = 39.92
2022-01-26 14:18:12.300 | DEBUG    | __main__:trials:24 - Trial = 21806/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.301 | DEBUG    | __main__:trials:29 - Trial = 21806/30000 | Total reward = 36.87
2022-01-26 14:18:12.305 | DEBUG    | __main__:trials:24 - Trial = 21807/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.307 | DEBUG    | __main__:trials:29 - Trial = 21807/30000 | Total reward = 41.34
2022-01-26 14:18:12.311 | DEBUG    | __main__:trials:24 - Trial = 21808/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.312 | DEBUG    | __main__:trials:29 - Trial = 21808/30000 | Total reward = 38.16
2022-01-26 14:18:12.315 | DEBUG    | __main__:trials:24 - Trial = 21809/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.316 | DEBUG    | __main__:trials:29 - Trial = 21809/30000 | Total reward = 40.35
2022-01-26 14:18:12.320 | DEBUG    | __main__:trials:24 - Trial = 21810/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.322 | DEBUG    | __main__:trials:29 - Trial = 21810/30000 | Total reward = 40.54
2022-01-26 14:18:12.326 | DEBUG    | __main__:trials:24 - Trial = 21811/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.327 | DEBUG    | __main__:trials:29 - Trial = 21811/30000 | Total reward = 47.22
2022-01-26 14:18:12.330 | DEBUG    | __main__:trials:24 - Trial = 21812/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.332 | DEBUG    | __main__:trials:29 - Trial = 21812/30000 | Total reward = 53.54
2022-01-26 14:18:12.335 | DEBUG    | __main__:trials:24 - Trial = 21813/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.336 | DEBUG    | __main__:trials:29 - Trial = 21813/30000 | Total reward = 53.30
2022-01-26 14:18:12.339 | DEBUG    | __main__:trials:24 - Trial = 21814/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.341 | DEBUG    | __main__:trials:29 - Trial = 21814/30000 | Total reward = 52.12
2022-01-26 14:18:12.344 | DEBUG    | __main__:trials:24 - Trial = 21815/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.346 | DEBUG    | __main__:trials:29 - Trial = 21815/30000 | Total reward = 43.22
2022-01-26 14:18:12.349 | DEBUG    | __main__:trials:24 - Trial = 21816/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.350 | DEBUG    | __main__:trials:29 - Trial = 21816/30000 | Total reward = 47.96
2022-01-26 14:18:12.353 | DEBUG    | __main__:trials:24 - Trial = 21817/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.353 | DEBUG    | __main__:trials:29 - Trial = 21817/30000 | Total reward = 32.42
2022-01-26 14:18:12.357 | DEBUG    | __main__:trials:24 - Trial = 21818/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.358 | DEBUG    | __main__:trials:29 - Trial = 21818/30000 | Total reward = 47.60
2022-01-26 14:18:12.362 | DEBUG    | __main__:trials:24 - Trial = 21819/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.363 | DEBUG    | __main__:trials:29 - Trial = 21819/30000 | Total reward = 48.52
2022-01-26 14:18:12.367 | DEBUG    | __main__:trials:24 - Trial = 21820/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.368 | DEBUG    | __main__:trials:29 - Trial = 21820/30000 | Total reward = 48.68
2022-01-26 14:18:12.371 | DEBUG    | __main__:trials:24 - Trial = 21821/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.373 | DEBUG    | __main__:trials:29 - Trial = 21821/30000 | Total reward = 48.82
2022-01-26 14:18:12.376 | DEBUG    | __main__:trials:24 - Trial = 21822/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.378 | DEBUG    | __main__:trials:29 - Trial = 21822/30000 | Total reward = 41.44
2022-01-26 14:18:12.381 | DEBUG    | __main__:trials:24 - Trial = 21823/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.381 | DEBUG    | __main__:trials:29 - Trial = 21823/30000 | Total reward = 31.96
2022-01-26 14:18:12.385 | DEBUG    | __main__:trials:24 - Trial = 21824/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.385 | DEBUG    | __main__:trials:29 - Trial = 21824/30000 | Total reward = 51.07
2022-01-26 14:18:12.388 | DEBUG    | __main__:trials:24 - Trial = 21825/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.390 | DEBUG    | __main__:trials:29 - Trial = 21825/30000 | Total reward = 49.09
2022-01-26 14:18:12.394 | DEBUG    | __main__:trials:24 - Trial = 21826/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.395 | DEBUG    | __main__:trials:29 - Trial = 21826/30000 | Total reward = 42.52
2022-01-26 14:18:12.399 | DEBUG    | __main__:trials:24 - Trial = 21827/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.400 | DEBUG    | __main__:trials:29 - Trial = 21827/30000 | Total reward = 37.88
2022-01-26 14:18:12.404 | DEBUG    | __main__:trials:24 - Trial = 21828/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.405 | DEBUG    | __main__:trials:29 - Trial = 21828/30000 | Total reward = 52.47
2022-01-26 14:18:12.408 | DEBUG    | __main__:trials:24 - Trial = 21829/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.410 | DEBUG    | __main__:trials:29 - Trial = 21829/30000 | Total reward = 53.94
2022-01-26 14:18:12.413 | DEBUG    | __main__:trials:24 - Trial = 21830/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.414 | DEBUG    | __main__:trials:29 - Trial = 21830/30000 | Total reward = 36.19
2022-01-26 14:18:12.417 | DEBUG    | __main__:trials:24 - Trial = 21831/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.419 | DEBUG    | __main__:trials:29 - Trial = 21831/30000 | Total reward = 34.69
2022-01-26 14:18:12.422 | DEBUG    | __main__:trials:24 - Trial = 21832/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.423 | DEBUG    | __main__:trials:29 - Trial = 21832/30000 | Total reward = 47.21
2022-01-26 14:18:12.427 | DEBUG    | __main__:trials:24 - Trial = 21833/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.428 | DEBUG    | __main__:trials:29 - Trial = 21833/30000 | Total reward = 37.51
2022-01-26 14:18:12.431 | DEBUG    | __main__:trials:24 - Trial = 21834/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.433 | DEBUG    | __main__:trials:29 - Trial = 21834/30000 | Total reward = 34.87
2022-01-26 14:18:12.436 | DEBUG    | __main__:trials:24 - Trial = 21835/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.437 | DEBUG    | __main__:trials:29 - Trial = 21835/30000 | Total reward = 29.63
2022-01-26 14:18:12.440 | DEBUG    | __main__:trials:24 - Trial = 21836/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.442 | DEBUG    | __main__:trials:29 - Trial = 21836/30000 | Total reward = 38.55
2022-01-26 14:18:12.445 | DEBUG    | __main__:trials:26 - Trial = 21837/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.446 | DEBUG    | __main__:trials:29 - Trial = 21837/30000 | Total reward = 32.34
2022-01-26 14:18:12.449 | DEBUG    | __main__:trials:24 - Trial = 21838/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.450 | DEBUG    | __main__:trials:29 - Trial = 21838/30000 | Total reward = 47.43
2022-01-26 14:18:12.454 | DEBUG    | __main__:trials:24 - Trial = 21839/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.455 | DEBUG    | __main__:trials:29 - Trial = 21839/30000 | Total reward = 50.48
2022-01-26 14:18:12.458 | DEBUG    | __main__:trials:24 - Trial = 21840/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.460 | DEBUG    | __main__:trials:29 - Trial = 21840/30000 | Total reward = 39.64
2022-01-26 14:18:12.463 | DEBUG    | __main__:trials:24 - Trial = 21841/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.464 | DEBUG    | __main__:trials:29 - Trial = 21841/30000 | Total reward = 49.32
2022-01-26 14:18:12.468 | DEBUG    | __main__:trials:24 - Trial = 21842/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.469 | DEBUG    | __main__:trials:29 - Trial = 21842/30000 | Total reward = 48.56
2022-01-26 14:18:12.472 | DEBUG    | __main__:trials:26 - Trial = 21843/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.473 | DEBUG    | __main__:trials:29 - Trial = 21843/30000 | Total reward = 24.61
2022-01-26 14:18:12.477 | DEBUG    | __main__:trials:24 - Trial = 21844/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.478 | DEBUG    | __main__:trials:29 - Trial = 21844/30000 | Total reward = 56.25
2022-01-26 14:18:12.481 | DEBUG    | __main__:trials:24 - Trial = 21845/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.482 | DEBUG    | __main__:trials:29 - Trial = 21845/30000 | Total reward = 43.68
2022-01-26 14:18:12.486 | DEBUG    | __main__:trials:24 - Trial = 21846/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.488 | DEBUG    | __main__:trials:29 - Trial = 21846/30000 | Total reward = 48.41
2022-01-26 14:18:12.491 | DEBUG    | __main__:trials:24 - Trial = 21847/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.493 | DEBUG    | __main__:trials:29 - Trial = 21847/30000 | Total reward = 42.63
2022-01-26 14:18:12.497 | DEBUG    | __main__:trials:24 - Trial = 21848/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.498 | DEBUG    | __main__:trials:29 - Trial = 21848/30000 | Total reward = 41.86
2022-01-26 14:18:12.501 | DEBUG    | __main__:trials:24 - Trial = 21849/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.503 | DEBUG    | __main__:trials:29 - Trial = 21849/30000 | Total reward = 43.64
2022-01-26 14:18:12.507 | DEBUG    | __main__:trials:24 - Trial = 21850/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.509 | DEBUG    | __main__:trials:29 - Trial = 21850/30000 | Total reward = 34.11
2022-01-26 14:18:12.512 | DEBUG    | __main__:trials:24 - Trial = 21851/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.514 | DEBUG    | __main__:trials:29 - Trial = 21851/30000 | Total reward = 29.58
2022-01-26 14:18:12.517 | DEBUG    | __main__:trials:24 - Trial = 21852/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.519 | DEBUG    | __main__:trials:29 - Trial = 21852/30000 | Total reward = 38.52
2022-01-26 14:18:12.522 | DEBUG    | __main__:trials:24 - Trial = 21853/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.524 | DEBUG    | __main__:trials:29 - Trial = 21853/30000 | Total reward = 41.31
2022-01-26 14:18:12.528 | DEBUG    | __main__:trials:24 - Trial = 21854/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.529 | DEBUG    | __main__:trials:29 - Trial = 21854/30000 | Total reward = 47.26
2022-01-26 14:18:12.533 | DEBUG    | __main__:trials:24 - Trial = 21855/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.533 | DEBUG    | __main__:trials:29 - Trial = 21855/30000 | Total reward = 51.59
2022-01-26 14:18:12.537 | DEBUG    | __main__:trials:24 - Trial = 21856/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.538 | DEBUG    | __main__:trials:29 - Trial = 21856/30000 | Total reward = 62.31
2022-01-26 14:18:12.541 | DEBUG    | __main__:trials:24 - Trial = 21857/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.543 | DEBUG    | __main__:trials:29 - Trial = 21857/30000 | Total reward = 41.95
2022-01-26 14:18:12.547 | DEBUG    | __main__:trials:24 - Trial = 21858/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.548 | DEBUG    | __main__:trials:29 - Trial = 21858/30000 | Total reward = 42.83
2022-01-26 14:18:12.551 | DEBUG    | __main__:trials:26 - Trial = 21859/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.552 | DEBUG    | __main__:trials:29 - Trial = 21859/30000 | Total reward = 30.94
2022-01-26 14:18:12.555 | DEBUG    | __main__:trials:24 - Trial = 21860/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.557 | DEBUG    | __main__:trials:29 - Trial = 21860/30000 | Total reward = 36.15
2022-01-26 14:18:12.560 | DEBUG    | __main__:trials:24 - Trial = 21861/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.561 | DEBUG    | __main__:trials:29 - Trial = 21861/30000 | Total reward = 49.65
2022-01-26 14:18:12.565 | DEBUG    | __main__:trials:24 - Trial = 21862/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.566 | DEBUG    | __main__:trials:29 - Trial = 21862/30000 | Total reward = 47.25
2022-01-26 14:18:12.569 | DEBUG    | __main__:trials:24 - Trial = 21863/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.571 | DEBUG    | __main__:trials:29 - Trial = 21863/30000 | Total reward = 58.36
2022-01-26 14:18:12.574 | DEBUG    | __main__:trials:24 - Trial = 21864/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.576 | DEBUG    | __main__:trials:29 - Trial = 21864/30000 | Total reward = 50.98
2022-01-26 14:18:12.579 | DEBUG    | __main__:trials:24 - Trial = 21865/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.580 | DEBUG    | __main__:trials:29 - Trial = 21865/30000 | Total reward = 37.92
2022-01-26 14:18:12.584 | DEBUG    | __main__:trials:24 - Trial = 21866/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.586 | DEBUG    | __main__:trials:29 - Trial = 21866/30000 | Total reward = 34.92
2022-01-26 14:18:12.590 | DEBUG    | __main__:trials:24 - Trial = 21867/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.591 | DEBUG    | __main__:trials:29 - Trial = 21867/30000 | Total reward = 23.48
2022-01-26 14:18:12.594 | DEBUG    | __main__:trials:24 - Trial = 21868/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.596 | DEBUG    | __main__:trials:29 - Trial = 21868/30000 | Total reward = 59.34
2022-01-26 14:18:12.599 | DEBUG    | __main__:trials:24 - Trial = 21869/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.601 | DEBUG    | __main__:trials:29 - Trial = 21869/30000 | Total reward = 67.03
2022-01-26 14:18:12.604 | DEBUG    | __main__:trials:24 - Trial = 21870/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.604 | DEBUG    | __main__:trials:29 - Trial = 21870/30000 | Total reward = 44.29
2022-01-26 14:18:12.608 | DEBUG    | __main__:trials:24 - Trial = 21871/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.610 | DEBUG    | __main__:trials:29 - Trial = 21871/30000 | Total reward = 43.28
2022-01-26 14:18:12.613 | DEBUG    | __main__:trials:24 - Trial = 21872/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.614 | DEBUG    | __main__:trials:29 - Trial = 21872/30000 | Total reward = 44.75
2022-01-26 14:18:12.617 | DEBUG    | __main__:trials:24 - Trial = 21873/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.618 | DEBUG    | __main__:trials:29 - Trial = 21873/30000 | Total reward = 53.33
2022-01-26 14:18:12.622 | DEBUG    | __main__:trials:24 - Trial = 21874/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.622 | DEBUG    | __main__:trials:29 - Trial = 21874/30000 | Total reward = 36.18
2022-01-26 14:18:12.626 | DEBUG    | __main__:trials:24 - Trial = 21875/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.627 | DEBUG    | __main__:trials:29 - Trial = 21875/30000 | Total reward = 32.17
2022-01-26 14:18:12.631 | DEBUG    | __main__:trials:24 - Trial = 21876/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.631 | DEBUG    | __main__:trials:29 - Trial = 21876/30000 | Total reward = 31.18
2022-01-26 14:18:12.635 | DEBUG    | __main__:trials:24 - Trial = 21877/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.636 | DEBUG    | __main__:trials:29 - Trial = 21877/30000 | Total reward = 36.32
2022-01-26 14:18:12.640 | DEBUG    | __main__:trials:24 - Trial = 21878/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.642 | DEBUG    | __main__:trials:29 - Trial = 21878/30000 | Total reward = 42.23
2022-01-26 14:18:12.646 | DEBUG    | __main__:trials:24 - Trial = 21879/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.646 | DEBUG    | __main__:trials:29 - Trial = 21879/30000 | Total reward = 36.10
2022-01-26 14:18:12.651 | DEBUG    | __main__:trials:24 - Trial = 21880/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.652 | DEBUG    | __main__:trials:29 - Trial = 21880/30000 | Total reward = 42.42
2022-01-26 14:18:12.655 | DEBUG    | __main__:trials:24 - Trial = 21881/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.657 | DEBUG    | __main__:trials:29 - Trial = 21881/30000 | Total reward = 31.71
2022-01-26 14:18:12.660 | DEBUG    | __main__:trials:24 - Trial = 21882/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.662 | DEBUG    | __main__:trials:29 - Trial = 21882/30000 | Total reward = 46.06
2022-01-26 14:18:12.665 | DEBUG    | __main__:trials:24 - Trial = 21883/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.667 | DEBUG    | __main__:trials:29 - Trial = 21883/30000 | Total reward = 38.79
2022-01-26 14:18:12.669 | DEBUG    | __main__:trials:24 - Trial = 21884/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.670 | DEBUG    | __main__:trials:29 - Trial = 21884/30000 | Total reward = 43.45
2022-01-26 14:18:12.674 | DEBUG    | __main__:trials:24 - Trial = 21885/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.674 | DEBUG    | __main__:trials:29 - Trial = 21885/30000 | Total reward = 31.54
2022-01-26 14:18:12.678 | DEBUG    | __main__:trials:24 - Trial = 21886/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.679 | DEBUG    | __main__:trials:29 - Trial = 21886/30000 | Total reward = 34.71
2022-01-26 14:18:12.682 | DEBUG    | __main__:trials:26 - Trial = 21887/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.684 | DEBUG    | __main__:trials:29 - Trial = 21887/30000 | Total reward = 23.41
2022-01-26 14:18:12.687 | DEBUG    | __main__:trials:26 - Trial = 21888/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.689 | DEBUG    | __main__:trials:29 - Trial = 21888/30000 | Total reward = 26.62
2022-01-26 14:18:12.692 | DEBUG    | __main__:trials:24 - Trial = 21889/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.692 | DEBUG    | __main__:trials:29 - Trial = 21889/30000 | Total reward = 30.00
2022-01-26 14:18:12.696 | DEBUG    | __main__:trials:24 - Trial = 21890/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.698 | DEBUG    | __main__:trials:29 - Trial = 21890/30000 | Total reward = 47.82
2022-01-26 14:18:12.702 | DEBUG    | __main__:trials:24 - Trial = 21891/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.704 | DEBUG    | __main__:trials:29 - Trial = 21891/30000 | Total reward = 44.24
2022-01-26 14:18:12.707 | DEBUG    | __main__:trials:24 - Trial = 21892/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.708 | DEBUG    | __main__:trials:29 - Trial = 21892/30000 | Total reward = 32.33
2022-01-26 14:18:12.712 | DEBUG    | __main__:trials:24 - Trial = 21893/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.713 | DEBUG    | __main__:trials:29 - Trial = 21893/30000 | Total reward = 45.63
2022-01-26 14:18:12.716 | DEBUG    | __main__:trials:24 - Trial = 21894/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.718 | DEBUG    | __main__:trials:29 - Trial = 21894/30000 | Total reward = 35.61
2022-01-26 14:18:12.721 | DEBUG    | __main__:trials:26 - Trial = 21895/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.723 | DEBUG    | __main__:trials:29 - Trial = 21895/30000 | Total reward = 32.45
2022-01-26 14:18:12.726 | DEBUG    | __main__:trials:24 - Trial = 21896/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.727 | DEBUG    | __main__:trials:29 - Trial = 21896/30000 | Total reward = 51.62
2022-01-26 14:18:12.731 | DEBUG    | __main__:trials:24 - Trial = 21897/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.731 | DEBUG    | __main__:trials:29 - Trial = 21897/30000 | Total reward = 34.70
2022-01-26 14:18:12.735 | DEBUG    | __main__:trials:24 - Trial = 21898/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.737 | DEBUG    | __main__:trials:29 - Trial = 21898/30000 | Total reward = 32.60
2022-01-26 14:18:12.741 | DEBUG    | __main__:trials:24 - Trial = 21899/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.742 | DEBUG    | __main__:trials:29 - Trial = 21899/30000 | Total reward = 47.60
2022-01-26 14:18:12.746 | DEBUG    | __main__:trials:24 - Trial = 21900/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.747 | DEBUG    | __main__:trials:29 - Trial = 21900/30000 | Total reward = 38.28
2022-01-26 14:18:12.751 | DEBUG    | __main__:trials:24 - Trial = 21901/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.752 | DEBUG    | __main__:trials:29 - Trial = 21901/30000 | Total reward = 40.08
2022-01-26 14:18:12.755 | DEBUG    | __main__:trials:24 - Trial = 21902/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.757 | DEBUG    | __main__:trials:29 - Trial = 21902/30000 | Total reward = 50.57
2022-01-26 14:18:12.760 | DEBUG    | __main__:trials:24 - Trial = 21903/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.761 | DEBUG    | __main__:trials:29 - Trial = 21903/30000 | Total reward = 41.59
2022-01-26 14:18:12.765 | DEBUG    | __main__:trials:24 - Trial = 21904/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.766 | DEBUG    | __main__:trials:29 - Trial = 21904/30000 | Total reward = 31.05
2022-01-26 14:18:12.769 | DEBUG    | __main__:trials:24 - Trial = 21905/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.770 | DEBUG    | __main__:trials:29 - Trial = 21905/30000 | Total reward = 36.74
2022-01-26 14:18:12.773 | DEBUG    | __main__:trials:24 - Trial = 21906/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.774 | DEBUG    | __main__:trials:29 - Trial = 21906/30000 | Total reward = 26.37
2022-01-26 14:18:12.778 | DEBUG    | __main__:trials:24 - Trial = 21907/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.780 | DEBUG    | __main__:trials:29 - Trial = 21907/30000 | Total reward = 32.85
2022-01-26 14:18:12.783 | DEBUG    | __main__:trials:24 - Trial = 21908/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.784 | DEBUG    | __main__:trials:29 - Trial = 21908/30000 | Total reward = 38.77
2022-01-26 14:18:12.788 | DEBUG    | __main__:trials:24 - Trial = 21909/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.790 | DEBUG    | __main__:trials:29 - Trial = 21909/30000 | Total reward = 29.57
2022-01-26 14:18:12.793 | DEBUG    | __main__:trials:24 - Trial = 21910/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.794 | DEBUG    | __main__:trials:29 - Trial = 21910/30000 | Total reward = 37.07
2022-01-26 14:18:12.797 | DEBUG    | __main__:trials:24 - Trial = 21911/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.798 | DEBUG    | __main__:trials:29 - Trial = 21911/30000 | Total reward = 38.30
2022-01-26 14:18:12.802 | DEBUG    | __main__:trials:24 - Trial = 21912/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.802 | DEBUG    | __main__:trials:29 - Trial = 21912/30000 | Total reward = 41.36
2022-01-26 14:18:12.806 | DEBUG    | __main__:trials:24 - Trial = 21913/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.808 | DEBUG    | __main__:trials:29 - Trial = 21913/30000 | Total reward = 39.03
2022-01-26 14:18:12.811 | DEBUG    | __main__:trials:24 - Trial = 21914/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.812 | DEBUG    | __main__:trials:29 - Trial = 21914/30000 | Total reward = 45.10
2022-01-26 14:18:12.816 | DEBUG    | __main__:trials:24 - Trial = 21915/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.817 | DEBUG    | __main__:trials:29 - Trial = 21915/30000 | Total reward = 50.60
2022-01-26 14:18:12.820 | DEBUG    | __main__:trials:24 - Trial = 21916/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.822 | DEBUG    | __main__:trials:29 - Trial = 21916/30000 | Total reward = 39.33
2022-01-26 14:18:12.825 | DEBUG    | __main__:trials:24 - Trial = 21917/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.826 | DEBUG    | __main__:trials:29 - Trial = 21917/30000 | Total reward = 38.56
2022-01-26 14:18:12.830 | DEBUG    | __main__:trials:24 - Trial = 21918/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.831 | DEBUG    | __main__:trials:29 - Trial = 21918/30000 | Total reward = 37.26
2022-01-26 14:18:12.834 | DEBUG    | __main__:trials:24 - Trial = 21919/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.836 | DEBUG    | __main__:trials:29 - Trial = 21919/30000 | Total reward = 43.99
2022-01-26 14:18:12.840 | DEBUG    | __main__:trials:24 - Trial = 21920/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.840 | DEBUG    | __main__:trials:29 - Trial = 21920/30000 | Total reward = 34.76
2022-01-26 14:18:12.844 | DEBUG    | __main__:trials:24 - Trial = 21921/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.845 | DEBUG    | __main__:trials:29 - Trial = 21921/30000 | Total reward = 38.01
2022-01-26 14:18:12.848 | DEBUG    | __main__:trials:24 - Trial = 21922/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.849 | DEBUG    | __main__:trials:29 - Trial = 21922/30000 | Total reward = 38.46
2022-01-26 14:18:12.853 | DEBUG    | __main__:trials:24 - Trial = 21923/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.853 | DEBUG    | __main__:trials:29 - Trial = 21923/30000 | Total reward = 34.80
2022-01-26 14:18:12.857 | DEBUG    | __main__:trials:24 - Trial = 21924/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.858 | DEBUG    | __main__:trials:29 - Trial = 21924/30000 | Total reward = 36.69
2022-01-26 14:18:12.861 | DEBUG    | __main__:trials:24 - Trial = 21925/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.862 | DEBUG    | __main__:trials:29 - Trial = 21925/30000 | Total reward = 26.67
2022-01-26 14:18:12.864 | DEBUG    | __main__:trials:26 - Trial = 21926/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.865 | DEBUG    | __main__:trials:29 - Trial = 21926/30000 | Total reward = 15.91
2022-01-26 14:18:12.868 | DEBUG    | __main__:trials:24 - Trial = 21927/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.869 | DEBUG    | __main__:trials:29 - Trial = 21927/30000 | Total reward = 38.34
2022-01-26 14:18:12.873 | DEBUG    | __main__:trials:24 - Trial = 21928/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.874 | DEBUG    | __main__:trials:29 - Trial = 21928/30000 | Total reward = 20.63
2022-01-26 14:18:12.877 | DEBUG    | __main__:trials:24 - Trial = 21929/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.879 | DEBUG    | __main__:trials:29 - Trial = 21929/30000 | Total reward = 29.79
2022-01-26 14:18:12.882 | DEBUG    | __main__:trials:24 - Trial = 21930/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.883 | DEBUG    | __main__:trials:29 - Trial = 21930/30000 | Total reward = 39.88
2022-01-26 14:18:12.887 | DEBUG    | __main__:trials:24 - Trial = 21931/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.888 | DEBUG    | __main__:trials:29 - Trial = 21931/30000 | Total reward = 33.45
2022-01-26 14:18:12.892 | DEBUG    | __main__:trials:24 - Trial = 21932/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.894 | DEBUG    | __main__:trials:29 - Trial = 21932/30000 | Total reward = 38.91
2022-01-26 14:18:12.897 | DEBUG    | __main__:trials:24 - Trial = 21933/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.898 | DEBUG    | __main__:trials:29 - Trial = 21933/30000 | Total reward = 36.22
2022-01-26 14:18:12.902 | DEBUG    | __main__:trials:24 - Trial = 21934/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.903 | DEBUG    | __main__:trials:29 - Trial = 21934/30000 | Total reward = 39.62
2022-01-26 14:18:12.907 | DEBUG    | __main__:trials:24 - Trial = 21935/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.909 | DEBUG    | __main__:trials:29 - Trial = 21935/30000 | Total reward = 37.55
2022-01-26 14:18:12.912 | DEBUG    | __main__:trials:24 - Trial = 21936/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.913 | DEBUG    | __main__:trials:29 - Trial = 21936/30000 | Total reward = 40.41
2022-01-26 14:18:12.918 | DEBUG    | __main__:trials:24 - Trial = 21937/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.918 | DEBUG    | __main__:trials:29 - Trial = 21937/30000 | Total reward = 37.09
2022-01-26 14:18:12.923 | DEBUG    | __main__:trials:24 - Trial = 21938/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.925 | DEBUG    | __main__:trials:29 - Trial = 21938/30000 | Total reward = 50.19
2022-01-26 14:18:12.928 | DEBUG    | __main__:trials:24 - Trial = 21939/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.930 | DEBUG    | __main__:trials:29 - Trial = 21939/30000 | Total reward = 32.11
2022-01-26 14:18:12.934 | DEBUG    | __main__:trials:24 - Trial = 21940/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.935 | DEBUG    | __main__:trials:29 - Trial = 21940/30000 | Total reward = 38.66
2022-01-26 14:18:12.939 | DEBUG    | __main__:trials:24 - Trial = 21941/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.940 | DEBUG    | __main__:trials:29 - Trial = 21941/30000 | Total reward = 28.68
2022-01-26 14:18:12.943 | DEBUG    | __main__:trials:26 - Trial = 21942/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:12.945 | DEBUG    | __main__:trials:29 - Trial = 21942/30000 | Total reward = 36.23
2022-01-26 14:18:12.948 | DEBUG    | __main__:trials:24 - Trial = 21943/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.950 | DEBUG    | __main__:trials:29 - Trial = 21943/30000 | Total reward = 36.12
2022-01-26 14:18:12.953 | DEBUG    | __main__:trials:24 - Trial = 21944/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.954 | DEBUG    | __main__:trials:29 - Trial = 21944/30000 | Total reward = 42.36
2022-01-26 14:18:12.959 | DEBUG    | __main__:trials:24 - Trial = 21945/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.962 | DEBUG    | __main__:trials:29 - Trial = 21945/30000 | Total reward = 39.46
2022-01-26 14:18:12.966 | DEBUG    | __main__:trials:24 - Trial = 21946/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.967 | DEBUG    | __main__:trials:29 - Trial = 21946/30000 | Total reward = 35.04
2022-01-26 14:18:12.971 | DEBUG    | __main__:trials:24 - Trial = 21947/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.972 | DEBUG    | __main__:trials:29 - Trial = 21947/30000 | Total reward = 34.42
2022-01-26 14:18:12.976 | DEBUG    | __main__:trials:24 - Trial = 21948/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.978 | DEBUG    | __main__:trials:29 - Trial = 21948/30000 | Total reward = 38.47
2022-01-26 14:18:12.982 | DEBUG    | __main__:trials:24 - Trial = 21949/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.983 | DEBUG    | __main__:trials:29 - Trial = 21949/30000 | Total reward = 39.57
2022-01-26 14:18:12.987 | DEBUG    | __main__:trials:24 - Trial = 21950/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.988 | DEBUG    | __main__:trials:29 - Trial = 21950/30000 | Total reward = 33.96
2022-01-26 14:18:12.992 | DEBUG    | __main__:trials:24 - Trial = 21951/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.994 | DEBUG    | __main__:trials:29 - Trial = 21951/30000 | Total reward = 34.80
2022-01-26 14:18:12.997 | DEBUG    | __main__:trials:24 - Trial = 21952/30000 | Max number of steps (20) reached
2022-01-26 14:18:12.999 | DEBUG    | __main__:trials:29 - Trial = 21952/30000 | Total reward = 52.55
2022-01-26 14:18:13.003 | DEBUG    | __main__:trials:24 - Trial = 21953/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.003 | DEBUG    | __main__:trials:29 - Trial = 21953/30000 | Total reward = 35.70
2022-01-26 14:18:13.008 | DEBUG    | __main__:trials:24 - Trial = 21954/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.009 | DEBUG    | __main__:trials:29 - Trial = 21954/30000 | Total reward = 47.64
2022-01-26 14:18:13.012 | DEBUG    | __main__:trials:24 - Trial = 21955/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.013 | DEBUG    | __main__:trials:29 - Trial = 21955/30000 | Total reward = 39.64
2022-01-26 14:18:13.018 | DEBUG    | __main__:trials:24 - Trial = 21956/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.019 | DEBUG    | __main__:trials:29 - Trial = 21956/30000 | Total reward = 37.36
2022-01-26 14:18:13.022 | DEBUG    | __main__:trials:24 - Trial = 21957/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.024 | DEBUG    | __main__:trials:29 - Trial = 21957/30000 | Total reward = 34.40
2022-01-26 14:18:13.027 | DEBUG    | __main__:trials:24 - Trial = 21958/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.029 | DEBUG    | __main__:trials:29 - Trial = 21958/30000 | Total reward = 44.23
2022-01-26 14:18:13.033 | DEBUG    | __main__:trials:24 - Trial = 21959/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.035 | DEBUG    | __main__:trials:29 - Trial = 21959/30000 | Total reward = 37.34
2022-01-26 14:18:13.038 | DEBUG    | __main__:trials:24 - Trial = 21960/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.040 | DEBUG    | __main__:trials:29 - Trial = 21960/30000 | Total reward = 38.82
2022-01-26 14:18:13.043 | DEBUG    | __main__:trials:24 - Trial = 21961/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.045 | DEBUG    | __main__:trials:29 - Trial = 21961/30000 | Total reward = 39.44
2022-01-26 14:18:13.048 | DEBUG    | __main__:trials:24 - Trial = 21962/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.050 | DEBUG    | __main__:trials:29 - Trial = 21962/30000 | Total reward = 39.64
2022-01-26 14:18:13.052 | DEBUG    | __main__:trials:24 - Trial = 21963/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.054 | DEBUG    | __main__:trials:29 - Trial = 21963/30000 | Total reward = 38.00
2022-01-26 14:18:13.057 | DEBUG    | __main__:trials:24 - Trial = 21964/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.059 | DEBUG    | __main__:trials:29 - Trial = 21964/30000 | Total reward = 43.68
2022-01-26 14:18:13.063 | DEBUG    | __main__:trials:24 - Trial = 21965/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.063 | DEBUG    | __main__:trials:29 - Trial = 21965/30000 | Total reward = 38.61
2022-01-26 14:18:13.066 | DEBUG    | __main__:trials:26 - Trial = 21966/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.068 | DEBUG    | __main__:trials:29 - Trial = 21966/30000 | Total reward = 18.10
2022-01-26 14:18:13.071 | DEBUG    | __main__:trials:24 - Trial = 21967/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.072 | DEBUG    | __main__:trials:29 - Trial = 21967/30000 | Total reward = 31.43
2022-01-26 14:18:13.075 | DEBUG    | __main__:trials:24 - Trial = 21968/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.076 | DEBUG    | __main__:trials:29 - Trial = 21968/30000 | Total reward = 36.60
2022-01-26 14:18:13.079 | DEBUG    | __main__:trials:24 - Trial = 21969/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.081 | DEBUG    | __main__:trials:29 - Trial = 21969/30000 | Total reward = 41.09
2022-01-26 14:18:13.084 | DEBUG    | __main__:trials:24 - Trial = 21970/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.086 | DEBUG    | __main__:trials:29 - Trial = 21970/30000 | Total reward = 38.23
2022-01-26 14:18:13.089 | DEBUG    | __main__:trials:24 - Trial = 21971/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.089 | DEBUG    | __main__:trials:29 - Trial = 21971/30000 | Total reward = 39.30
2022-01-26 14:18:13.092 | DEBUG    | __main__:trials:24 - Trial = 21972/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.093 | DEBUG    | __main__:trials:29 - Trial = 21972/30000 | Total reward = 44.33
2022-01-26 14:18:13.097 | DEBUG    | __main__:trials:24 - Trial = 21973/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.097 | DEBUG    | __main__:trials:29 - Trial = 21973/30000 | Total reward = 51.32
2022-01-26 14:18:13.101 | DEBUG    | __main__:trials:24 - Trial = 21974/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.102 | DEBUG    | __main__:trials:29 - Trial = 21974/30000 | Total reward = 49.14
2022-01-26 14:18:13.105 | DEBUG    | __main__:trials:24 - Trial = 21975/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.106 | DEBUG    | __main__:trials:29 - Trial = 21975/30000 | Total reward = 35.47
2022-01-26 14:18:13.110 | DEBUG    | __main__:trials:24 - Trial = 21976/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.110 | DEBUG    | __main__:trials:29 - Trial = 21976/30000 | Total reward = 52.01
2022-01-26 14:18:13.114 | DEBUG    | __main__:trials:24 - Trial = 21977/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.116 | DEBUG    | __main__:trials:29 - Trial = 21977/30000 | Total reward = 35.25
2022-01-26 14:18:13.119 | DEBUG    | __main__:trials:24 - Trial = 21978/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.120 | DEBUG    | __main__:trials:29 - Trial = 21978/30000 | Total reward = 36.80
2022-01-26 14:18:13.123 | DEBUG    | __main__:trials:24 - Trial = 21979/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.125 | DEBUG    | __main__:trials:29 - Trial = 21979/30000 | Total reward = 38.05
2022-01-26 14:18:13.128 | DEBUG    | __main__:trials:24 - Trial = 21980/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.129 | DEBUG    | __main__:trials:29 - Trial = 21980/30000 | Total reward = 38.01
2022-01-26 14:18:13.133 | DEBUG    | __main__:trials:24 - Trial = 21981/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.133 | DEBUG    | __main__:trials:29 - Trial = 21981/30000 | Total reward = 36.27
2022-01-26 14:18:13.137 | DEBUG    | __main__:trials:24 - Trial = 21982/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.138 | DEBUG    | __main__:trials:29 - Trial = 21982/30000 | Total reward = 39.33
2022-01-26 14:18:13.141 | DEBUG    | __main__:trials:24 - Trial = 21983/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.143 | DEBUG    | __main__:trials:29 - Trial = 21983/30000 | Total reward = 36.91
2022-01-26 14:18:13.146 | DEBUG    | __main__:trials:24 - Trial = 21984/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.148 | DEBUG    | __main__:trials:29 - Trial = 21984/30000 | Total reward = 38.11
2022-01-26 14:18:13.151 | DEBUG    | __main__:trials:24 - Trial = 21985/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.153 | DEBUG    | __main__:trials:29 - Trial = 21985/30000 | Total reward = 36.61
2022-01-26 14:18:13.156 | DEBUG    | __main__:trials:24 - Trial = 21986/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.157 | DEBUG    | __main__:trials:29 - Trial = 21986/30000 | Total reward = 29.51
2022-01-26 14:18:13.160 | DEBUG    | __main__:trials:24 - Trial = 21987/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.162 | DEBUG    | __main__:trials:29 - Trial = 21987/30000 | Total reward = 39.56
2022-01-26 14:18:13.165 | DEBUG    | __main__:trials:24 - Trial = 21988/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.166 | DEBUG    | __main__:trials:29 - Trial = 21988/30000 | Total reward = 41.96
2022-01-26 14:18:13.170 | DEBUG    | __main__:trials:24 - Trial = 21989/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.171 | DEBUG    | __main__:trials:29 - Trial = 21989/30000 | Total reward = 34.44
2022-01-26 14:18:13.175 | DEBUG    | __main__:trials:24 - Trial = 21990/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.177 | DEBUG    | __main__:trials:29 - Trial = 21990/30000 | Total reward = 36.79
2022-01-26 14:18:13.180 | DEBUG    | __main__:trials:24 - Trial = 21991/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.182 | DEBUG    | __main__:trials:29 - Trial = 21991/30000 | Total reward = 35.56
2022-01-26 14:18:13.186 | DEBUG    | __main__:trials:24 - Trial = 21992/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.186 | DEBUG    | __main__:trials:29 - Trial = 21992/30000 | Total reward = 47.56
2022-01-26 14:18:13.191 | DEBUG    | __main__:trials:24 - Trial = 21993/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.192 | DEBUG    | __main__:trials:29 - Trial = 21993/30000 | Total reward = 34.11
2022-01-26 14:18:13.195 | DEBUG    | __main__:trials:24 - Trial = 21994/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.196 | DEBUG    | __main__:trials:29 - Trial = 21994/30000 | Total reward = 30.79
2022-01-26 14:18:13.199 | DEBUG    | __main__:trials:24 - Trial = 21995/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.200 | DEBUG    | __main__:trials:29 - Trial = 21995/30000 | Total reward = 43.24
2022-01-26 14:18:13.204 | DEBUG    | __main__:trials:24 - Trial = 21996/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.205 | DEBUG    | __main__:trials:29 - Trial = 21996/30000 | Total reward = 31.34
2022-01-26 14:18:13.208 | DEBUG    | __main__:trials:24 - Trial = 21997/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.210 | DEBUG    | __main__:trials:29 - Trial = 21997/30000 | Total reward = 58.15
2022-01-26 14:18:13.213 | DEBUG    | __main__:trials:24 - Trial = 21998/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.213 | DEBUG    | __main__:trials:29 - Trial = 21998/30000 | Total reward = 44.72
2022-01-26 14:18:13.217 | DEBUG    | __main__:trials:24 - Trial = 21999/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.217 | DEBUG    | __main__:trials:29 - Trial = 21999/30000 | Total reward = 38.61
2022-01-26 14:18:13.221 | DEBUG    | __main__:trials:26 - Trial = 22000/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.221 | DEBUG    | __main__:trials:29 - Trial = 22000/30000 | Total reward = 37.26
2022-01-26 14:18:13.225 | DEBUG    | __main__:trials:26 - Trial = 22001/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.226 | DEBUG    | __main__:trials:29 - Trial = 22001/30000 | Total reward = 30.00
2022-01-26 14:18:13.229 | DEBUG    | __main__:trials:24 - Trial = 22002/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.230 | DEBUG    | __main__:trials:29 - Trial = 22002/30000 | Total reward = 33.74
2022-01-26 14:18:13.233 | DEBUG    | __main__:trials:24 - Trial = 22003/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.234 | DEBUG    | __main__:trials:29 - Trial = 22003/30000 | Total reward = 38.27
2022-01-26 14:18:13.237 | DEBUG    | __main__:trials:24 - Trial = 22004/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.239 | DEBUG    | __main__:trials:29 - Trial = 22004/30000 | Total reward = 39.64
2022-01-26 14:18:13.242 | DEBUG    | __main__:trials:24 - Trial = 22005/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.242 | DEBUG    | __main__:trials:29 - Trial = 22005/30000 | Total reward = 42.54
2022-01-26 14:18:13.246 | DEBUG    | __main__:trials:24 - Trial = 22006/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.247 | DEBUG    | __main__:trials:29 - Trial = 22006/30000 | Total reward = 38.27
2022-01-26 14:18:13.250 | DEBUG    | __main__:trials:24 - Trial = 22007/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.251 | DEBUG    | __main__:trials:29 - Trial = 22007/30000 | Total reward = 39.57
2022-01-26 14:18:13.255 | DEBUG    | __main__:trials:24 - Trial = 22008/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.257 | DEBUG    | __main__:trials:29 - Trial = 22008/30000 | Total reward = 51.82
2022-01-26 14:18:13.260 | DEBUG    | __main__:trials:24 - Trial = 22009/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.261 | DEBUG    | __main__:trials:29 - Trial = 22009/30000 | Total reward = 34.49
2022-01-26 14:18:13.264 | DEBUG    | __main__:trials:24 - Trial = 22010/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.265 | DEBUG    | __main__:trials:29 - Trial = 22010/30000 | Total reward = 39.66
2022-01-26 14:18:13.269 | DEBUG    | __main__:trials:24 - Trial = 22011/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.270 | DEBUG    | __main__:trials:29 - Trial = 22011/30000 | Total reward = 39.76
2022-01-26 14:18:13.273 | DEBUG    | __main__:trials:26 - Trial = 22012/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.274 | DEBUG    | __main__:trials:29 - Trial = 22012/30000 | Total reward = 34.01
2022-01-26 14:18:13.277 | DEBUG    | __main__:trials:24 - Trial = 22013/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.277 | DEBUG    | __main__:trials:29 - Trial = 22013/30000 | Total reward = 36.17
2022-01-26 14:18:13.282 | DEBUG    | __main__:trials:24 - Trial = 22014/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.282 | DEBUG    | __main__:trials:29 - Trial = 22014/30000 | Total reward = 52.53
2022-01-26 14:18:13.286 | DEBUG    | __main__:trials:24 - Trial = 22015/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.287 | DEBUG    | __main__:trials:29 - Trial = 22015/30000 | Total reward = 39.64
2022-01-26 14:18:13.291 | DEBUG    | __main__:trials:24 - Trial = 22016/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.293 | DEBUG    | __main__:trials:29 - Trial = 22016/30000 | Total reward = 38.70
2022-01-26 14:18:13.296 | DEBUG    | __main__:trials:24 - Trial = 22017/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.297 | DEBUG    | __main__:trials:29 - Trial = 22017/30000 | Total reward = 35.19
2022-01-26 14:18:13.301 | DEBUG    | __main__:trials:26 - Trial = 22018/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.301 | DEBUG    | __main__:trials:29 - Trial = 22018/30000 | Total reward = 36.38
2022-01-26 14:18:13.305 | DEBUG    | __main__:trials:26 - Trial = 22019/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.305 | DEBUG    | __main__:trials:29 - Trial = 22019/30000 | Total reward = 38.32
2022-01-26 14:18:13.309 | DEBUG    | __main__:trials:24 - Trial = 22020/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.311 | DEBUG    | __main__:trials:29 - Trial = 22020/30000 | Total reward = 39.68
2022-01-26 14:18:13.314 | DEBUG    | __main__:trials:24 - Trial = 22021/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.314 | DEBUG    | __main__:trials:29 - Trial = 22021/30000 | Total reward = 28.45
2022-01-26 14:18:13.318 | DEBUG    | __main__:trials:24 - Trial = 22022/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.320 | DEBUG    | __main__:trials:29 - Trial = 22022/30000 | Total reward = 34.56
2022-01-26 14:18:13.322 | DEBUG    | __main__:trials:24 - Trial = 22023/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.323 | DEBUG    | __main__:trials:29 - Trial = 22023/30000 | Total reward = 33.11
2022-01-26 14:18:13.327 | DEBUG    | __main__:trials:24 - Trial = 22024/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.328 | DEBUG    | __main__:trials:29 - Trial = 22024/30000 | Total reward = 36.73
2022-01-26 14:18:13.331 | DEBUG    | __main__:trials:24 - Trial = 22025/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.332 | DEBUG    | __main__:trials:29 - Trial = 22025/30000 | Total reward = 30.74
2022-01-26 14:18:13.335 | DEBUG    | __main__:trials:24 - Trial = 22026/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.336 | DEBUG    | __main__:trials:29 - Trial = 22026/30000 | Total reward = 33.72
2022-01-26 14:18:13.340 | DEBUG    | __main__:trials:24 - Trial = 22027/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.341 | DEBUG    | __main__:trials:29 - Trial = 22027/30000 | Total reward = 41.32
2022-01-26 14:18:13.345 | DEBUG    | __main__:trials:24 - Trial = 22028/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.345 | DEBUG    | __main__:trials:29 - Trial = 22028/30000 | Total reward = 39.57
2022-01-26 14:18:13.349 | DEBUG    | __main__:trials:24 - Trial = 22029/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.350 | DEBUG    | __main__:trials:29 - Trial = 22029/30000 | Total reward = 39.64
2022-01-26 14:18:13.353 | DEBUG    | __main__:trials:24 - Trial = 22030/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.354 | DEBUG    | __main__:trials:29 - Trial = 22030/30000 | Total reward = 38.61
2022-01-26 14:18:13.357 | DEBUG    | __main__:trials:24 - Trial = 22031/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.359 | DEBUG    | __main__:trials:29 - Trial = 22031/30000 | Total reward = 45.65
2022-01-26 14:18:13.362 | DEBUG    | __main__:trials:26 - Trial = 22032/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.362 | DEBUG    | __main__:trials:29 - Trial = 22032/30000 | Total reward = 28.04
2022-01-26 14:18:13.366 | DEBUG    | __main__:trials:24 - Trial = 22033/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.367 | DEBUG    | __main__:trials:29 - Trial = 22033/30000 | Total reward = 30.87
2022-01-26 14:18:13.370 | DEBUG    | __main__:trials:24 - Trial = 22034/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.371 | DEBUG    | __main__:trials:29 - Trial = 22034/30000 | Total reward = 39.19
2022-01-26 14:18:13.374 | DEBUG    | __main__:trials:26 - Trial = 22035/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.374 | DEBUG    | __main__:trials:29 - Trial = 22035/30000 | Total reward = 16.05
2022-01-26 14:18:13.377 | DEBUG    | __main__:trials:24 - Trial = 22036/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.378 | DEBUG    | __main__:trials:29 - Trial = 22036/30000 | Total reward = 37.22
2022-01-26 14:18:13.381 | DEBUG    | __main__:trials:26 - Trial = 22037/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.383 | DEBUG    | __main__:trials:29 - Trial = 22037/30000 | Total reward = 38.63
2022-01-26 14:18:13.386 | DEBUG    | __main__:trials:24 - Trial = 22038/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.388 | DEBUG    | __main__:trials:29 - Trial = 22038/30000 | Total reward = 33.71
2022-01-26 14:18:13.391 | DEBUG    | __main__:trials:24 - Trial = 22039/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.392 | DEBUG    | __main__:trials:29 - Trial = 22039/30000 | Total reward = 39.41
2022-01-26 14:18:13.395 | DEBUG    | __main__:trials:24 - Trial = 22040/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.397 | DEBUG    | __main__:trials:29 - Trial = 22040/30000 | Total reward = 34.56
2022-01-26 14:18:13.400 | DEBUG    | __main__:trials:24 - Trial = 22041/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.401 | DEBUG    | __main__:trials:29 - Trial = 22041/30000 | Total reward = 42.39
2022-01-26 14:18:13.404 | DEBUG    | __main__:trials:24 - Trial = 22042/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.406 | DEBUG    | __main__:trials:29 - Trial = 22042/30000 | Total reward = 37.36
2022-01-26 14:18:13.409 | DEBUG    | __main__:trials:24 - Trial = 22043/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.410 | DEBUG    | __main__:trials:29 - Trial = 22043/30000 | Total reward = 39.95
2022-01-26 14:18:13.414 | DEBUG    | __main__:trials:24 - Trial = 22044/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.415 | DEBUG    | __main__:trials:29 - Trial = 22044/30000 | Total reward = 39.85
2022-01-26 14:18:13.418 | DEBUG    | __main__:trials:24 - Trial = 22045/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.419 | DEBUG    | __main__:trials:29 - Trial = 22045/30000 | Total reward = 37.58
2022-01-26 14:18:13.422 | DEBUG    | __main__:trials:24 - Trial = 22046/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.423 | DEBUG    | __main__:trials:29 - Trial = 22046/30000 | Total reward = 30.78
2022-01-26 14:18:13.426 | DEBUG    | __main__:trials:24 - Trial = 22047/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.428 | DEBUG    | __main__:trials:29 - Trial = 22047/30000 | Total reward = 37.27
2022-01-26 14:18:13.431 | DEBUG    | __main__:trials:26 - Trial = 22048/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.433 | DEBUG    | __main__:trials:29 - Trial = 22048/30000 | Total reward = 24.41
2022-01-26 14:18:13.436 | DEBUG    | __main__:trials:24 - Trial = 22049/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.436 | DEBUG    | __main__:trials:29 - Trial = 22049/30000 | Total reward = 34.76
2022-01-26 14:18:13.441 | DEBUG    | __main__:trials:24 - Trial = 22050/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.441 | DEBUG    | __main__:trials:29 - Trial = 22050/30000 | Total reward = 41.00
2022-01-26 14:18:13.445 | DEBUG    | __main__:trials:24 - Trial = 22051/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.445 | DEBUG    | __main__:trials:29 - Trial = 22051/30000 | Total reward = 37.92
2022-01-26 14:18:13.449 | DEBUG    | __main__:trials:24 - Trial = 22052/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.450 | DEBUG    | __main__:trials:29 - Trial = 22052/30000 | Total reward = 36.40
2022-01-26 14:18:13.453 | DEBUG    | __main__:trials:24 - Trial = 22053/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.454 | DEBUG    | __main__:trials:29 - Trial = 22053/30000 | Total reward = 51.81
2022-01-26 14:18:13.457 | DEBUG    | __main__:trials:24 - Trial = 22054/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.458 | DEBUG    | __main__:trials:29 - Trial = 22054/30000 | Total reward = 37.07
2022-01-26 14:18:13.461 | DEBUG    | __main__:trials:24 - Trial = 22055/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.463 | DEBUG    | __main__:trials:29 - Trial = 22055/30000 | Total reward = 52.57
2022-01-26 14:18:13.467 | DEBUG    | __main__:trials:24 - Trial = 22056/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.467 | DEBUG    | __main__:trials:29 - Trial = 22056/30000 | Total reward = 42.44
2022-01-26 14:18:13.471 | DEBUG    | __main__:trials:24 - Trial = 22057/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.473 | DEBUG    | __main__:trials:29 - Trial = 22057/30000 | Total reward = 32.88
2022-01-26 14:18:13.475 | DEBUG    | __main__:trials:24 - Trial = 22058/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.476 | DEBUG    | __main__:trials:29 - Trial = 22058/30000 | Total reward = 30.36
2022-01-26 14:18:13.479 | DEBUG    | __main__:trials:26 - Trial = 22059/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.480 | DEBUG    | __main__:trials:29 - Trial = 22059/30000 | Total reward = 28.55
2022-01-26 14:18:13.483 | DEBUG    | __main__:trials:24 - Trial = 22060/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.484 | DEBUG    | __main__:trials:29 - Trial = 22060/30000 | Total reward = 41.57
2022-01-26 14:18:13.488 | DEBUG    | __main__:trials:24 - Trial = 22061/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.490 | DEBUG    | __main__:trials:29 - Trial = 22061/30000 | Total reward = 36.07
2022-01-26 14:18:13.493 | DEBUG    | __main__:trials:24 - Trial = 22062/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.494 | DEBUG    | __main__:trials:29 - Trial = 22062/30000 | Total reward = 30.57
2022-01-26 14:18:13.497 | DEBUG    | __main__:trials:24 - Trial = 22063/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.498 | DEBUG    | __main__:trials:29 - Trial = 22063/30000 | Total reward = 36.68
2022-01-26 14:18:13.502 | DEBUG    | __main__:trials:24 - Trial = 22064/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.503 | DEBUG    | __main__:trials:29 - Trial = 22064/30000 | Total reward = 41.90
2022-01-26 14:18:13.506 | DEBUG    | __main__:trials:24 - Trial = 22065/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.507 | DEBUG    | __main__:trials:29 - Trial = 22065/30000 | Total reward = 33.50
2022-01-26 14:18:13.511 | DEBUG    | __main__:trials:24 - Trial = 22066/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.513 | DEBUG    | __main__:trials:29 - Trial = 22066/30000 | Total reward = 44.42
2022-01-26 14:18:13.515 | DEBUG    | __main__:trials:26 - Trial = 22067/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.516 | DEBUG    | __main__:trials:29 - Trial = 22067/30000 | Total reward = 24.72
2022-01-26 14:18:13.520 | DEBUG    | __main__:trials:24 - Trial = 22068/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.520 | DEBUG    | __main__:trials:29 - Trial = 22068/30000 | Total reward = 44.29
2022-01-26 14:18:13.525 | DEBUG    | __main__:trials:24 - Trial = 22069/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.526 | DEBUG    | __main__:trials:29 - Trial = 22069/30000 | Total reward = 32.69
2022-01-26 14:18:13.529 | DEBUG    | __main__:trials:24 - Trial = 22070/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.530 | DEBUG    | __main__:trials:29 - Trial = 22070/30000 | Total reward = 32.11
2022-01-26 14:18:13.533 | DEBUG    | __main__:trials:24 - Trial = 22071/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.535 | DEBUG    | __main__:trials:29 - Trial = 22071/30000 | Total reward = 42.53
2022-01-26 14:18:13.538 | DEBUG    | __main__:trials:24 - Trial = 22072/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.540 | DEBUG    | __main__:trials:29 - Trial = 22072/30000 | Total reward = 40.00
2022-01-26 14:18:13.543 | DEBUG    | __main__:trials:24 - Trial = 22073/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.543 | DEBUG    | __main__:trials:29 - Trial = 22073/30000 | Total reward = 36.70
2022-01-26 14:18:13.547 | DEBUG    | __main__:trials:24 - Trial = 22074/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.547 | DEBUG    | __main__:trials:29 - Trial = 22074/30000 | Total reward = 43.92
2022-01-26 14:18:13.551 | DEBUG    | __main__:trials:24 - Trial = 22075/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.551 | DEBUG    | __main__:trials:29 - Trial = 22075/30000 | Total reward = 33.89
2022-01-26 14:18:13.555 | DEBUG    | __main__:trials:24 - Trial = 22076/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.557 | DEBUG    | __main__:trials:29 - Trial = 22076/30000 | Total reward = 34.11
2022-01-26 14:18:13.560 | DEBUG    | __main__:trials:24 - Trial = 22077/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.560 | DEBUG    | __main__:trials:29 - Trial = 22077/30000 | Total reward = 40.64
2022-01-26 14:18:13.564 | DEBUG    | __main__:trials:26 - Trial = 22078/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.564 | DEBUG    | __main__:trials:29 - Trial = 22078/30000 | Total reward = 22.93
2022-01-26 14:18:13.568 | DEBUG    | __main__:trials:24 - Trial = 22079/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.568 | DEBUG    | __main__:trials:29 - Trial = 22079/30000 | Total reward = 35.78
2022-01-26 14:18:13.572 | DEBUG    | __main__:trials:24 - Trial = 22080/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.574 | DEBUG    | __main__:trials:29 - Trial = 22080/30000 | Total reward = 31.94
2022-01-26 14:18:13.577 | DEBUG    | __main__:trials:24 - Trial = 22081/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.578 | DEBUG    | __main__:trials:29 - Trial = 22081/30000 | Total reward = 33.67
2022-01-26 14:18:13.582 | DEBUG    | __main__:trials:24 - Trial = 22082/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.582 | DEBUG    | __main__:trials:29 - Trial = 22082/30000 | Total reward = 34.97
2022-01-26 14:18:13.585 | DEBUG    | __main__:trials:26 - Trial = 22083/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.587 | DEBUG    | __main__:trials:29 - Trial = 22083/30000 | Total reward = 19.50
2022-01-26 14:18:13.590 | DEBUG    | __main__:trials:26 - Trial = 22084/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.591 | DEBUG    | __main__:trials:29 - Trial = 22084/30000 | Total reward = 31.22
2022-01-26 14:18:13.594 | DEBUG    | __main__:trials:24 - Trial = 22085/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.595 | DEBUG    | __main__:trials:29 - Trial = 22085/30000 | Total reward = 41.47
2022-01-26 14:18:13.598 | DEBUG    | __main__:trials:24 - Trial = 22086/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.599 | DEBUG    | __main__:trials:29 - Trial = 22086/30000 | Total reward = 38.30
2022-01-26 14:18:13.603 | DEBUG    | __main__:trials:24 - Trial = 22087/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.604 | DEBUG    | __main__:trials:29 - Trial = 22087/30000 | Total reward = 33.16
2022-01-26 14:18:13.608 | DEBUG    | __main__:trials:24 - Trial = 22088/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.608 | DEBUG    | __main__:trials:29 - Trial = 22088/30000 | Total reward = 39.00
2022-01-26 14:18:13.612 | DEBUG    | __main__:trials:24 - Trial = 22089/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.612 | DEBUG    | __main__:trials:29 - Trial = 22089/30000 | Total reward = 38.25
2022-01-26 14:18:13.616 | DEBUG    | __main__:trials:24 - Trial = 22090/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.618 | DEBUG    | __main__:trials:29 - Trial = 22090/30000 | Total reward = 44.72
2022-01-26 14:18:13.621 | DEBUG    | __main__:trials:24 - Trial = 22091/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.621 | DEBUG    | __main__:trials:29 - Trial = 22091/30000 | Total reward = 47.94
2022-01-26 14:18:13.624 | DEBUG    | __main__:trials:26 - Trial = 22092/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.625 | DEBUG    | __main__:trials:29 - Trial = 22092/30000 | Total reward = 20.33
2022-01-26 14:18:13.629 | DEBUG    | __main__:trials:24 - Trial = 22093/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.630 | DEBUG    | __main__:trials:29 - Trial = 22093/30000 | Total reward = 33.41
2022-01-26 14:18:13.633 | DEBUG    | __main__:trials:24 - Trial = 22094/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.635 | DEBUG    | __main__:trials:29 - Trial = 22094/30000 | Total reward = 48.64
2022-01-26 14:18:13.637 | DEBUG    | __main__:trials:26 - Trial = 22095/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.638 | DEBUG    | __main__:trials:29 - Trial = 22095/30000 | Total reward = 25.42
2022-01-26 14:18:13.642 | DEBUG    | __main__:trials:24 - Trial = 22096/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.644 | DEBUG    | __main__:trials:29 - Trial = 22096/30000 | Total reward = 37.90
2022-01-26 14:18:13.646 | DEBUG    | __main__:trials:24 - Trial = 22097/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.647 | DEBUG    | __main__:trials:29 - Trial = 22097/30000 | Total reward = 37.37
2022-01-26 14:18:13.651 | DEBUG    | __main__:trials:24 - Trial = 22098/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.651 | DEBUG    | __main__:trials:29 - Trial = 22098/30000 | Total reward = 29.63
2022-01-26 14:18:13.655 | DEBUG    | __main__:trials:24 - Trial = 22099/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.656 | DEBUG    | __main__:trials:29 - Trial = 22099/30000 | Total reward = 37.14
2022-01-26 14:18:13.659 | DEBUG    | __main__:trials:24 - Trial = 22100/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.661 | DEBUG    | __main__:trials:29 - Trial = 22100/30000 | Total reward = 31.53
2022-01-26 14:18:13.664 | DEBUG    | __main__:trials:24 - Trial = 22101/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.665 | DEBUG    | __main__:trials:29 - Trial = 22101/30000 | Total reward = 39.72
2022-01-26 14:18:13.668 | DEBUG    | __main__:trials:24 - Trial = 22102/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.669 | DEBUG    | __main__:trials:29 - Trial = 22102/30000 | Total reward = 30.52
2022-01-26 14:18:13.672 | DEBUG    | __main__:trials:26 - Trial = 22103/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.673 | DEBUG    | __main__:trials:29 - Trial = 22103/30000 | Total reward = 23.55
2022-01-26 14:18:13.675 | DEBUG    | __main__:trials:24 - Trial = 22104/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.676 | DEBUG    | __main__:trials:29 - Trial = 22104/30000 | Total reward = 39.57
2022-01-26 14:18:13.679 | DEBUG    | __main__:trials:24 - Trial = 22105/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.680 | DEBUG    | __main__:trials:29 - Trial = 22105/30000 | Total reward = 40.79
2022-01-26 14:18:13.683 | DEBUG    | __main__:trials:24 - Trial = 22106/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.684 | DEBUG    | __main__:trials:29 - Trial = 22106/30000 | Total reward = 48.37
2022-01-26 14:18:13.687 | DEBUG    | __main__:trials:24 - Trial = 22107/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.688 | DEBUG    | __main__:trials:29 - Trial = 22107/30000 | Total reward = 36.24
2022-01-26 14:18:13.692 | DEBUG    | __main__:trials:24 - Trial = 22108/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.693 | DEBUG    | __main__:trials:29 - Trial = 22108/30000 | Total reward = 38.93
2022-01-26 14:18:13.697 | DEBUG    | __main__:trials:24 - Trial = 22109/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.697 | DEBUG    | __main__:trials:29 - Trial = 22109/30000 | Total reward = 39.03
2022-01-26 14:18:13.701 | DEBUG    | __main__:trials:24 - Trial = 22110/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.701 | DEBUG    | __main__:trials:29 - Trial = 22110/30000 | Total reward = 54.77
2022-01-26 14:18:13.705 | DEBUG    | __main__:trials:24 - Trial = 22111/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.706 | DEBUG    | __main__:trials:29 - Trial = 22111/30000 | Total reward = 46.13
2022-01-26 14:18:13.709 | DEBUG    | __main__:trials:24 - Trial = 22112/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.710 | DEBUG    | __main__:trials:29 - Trial = 22112/30000 | Total reward = 33.14
2022-01-26 14:18:13.713 | DEBUG    | __main__:trials:24 - Trial = 22113/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.715 | DEBUG    | __main__:trials:29 - Trial = 22113/30000 | Total reward = 39.79
2022-01-26 14:18:13.718 | DEBUG    | __main__:trials:24 - Trial = 22114/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.719 | DEBUG    | __main__:trials:29 - Trial = 22114/30000 | Total reward = 34.87
2022-01-26 14:18:13.722 | DEBUG    | __main__:trials:24 - Trial = 22115/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.723 | DEBUG    | __main__:trials:29 - Trial = 22115/30000 | Total reward = 48.96
2022-01-26 14:18:13.727 | DEBUG    | __main__:trials:24 - Trial = 22116/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.729 | DEBUG    | __main__:trials:29 - Trial = 22116/30000 | Total reward = 39.18
2022-01-26 14:18:13.732 | DEBUG    | __main__:trials:24 - Trial = 22117/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.733 | DEBUG    | __main__:trials:29 - Trial = 22117/30000 | Total reward = 48.73
2022-01-26 14:18:13.736 | DEBUG    | __main__:trials:24 - Trial = 22118/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.737 | DEBUG    | __main__:trials:29 - Trial = 22118/30000 | Total reward = 51.34
2022-01-26 14:18:13.740 | DEBUG    | __main__:trials:24 - Trial = 22119/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.741 | DEBUG    | __main__:trials:29 - Trial = 22119/30000 | Total reward = 54.66
2022-01-26 14:18:13.744 | DEBUG    | __main__:trials:24 - Trial = 22120/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.745 | DEBUG    | __main__:trials:29 - Trial = 22120/30000 | Total reward = 49.25
2022-01-26 14:18:13.748 | DEBUG    | __main__:trials:24 - Trial = 22121/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.750 | DEBUG    | __main__:trials:29 - Trial = 22121/30000 | Total reward = 37.77
2022-01-26 14:18:13.753 | DEBUG    | __main__:trials:26 - Trial = 22122/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.754 | DEBUG    | __main__:trials:29 - Trial = 22122/30000 | Total reward = 33.62
2022-01-26 14:18:13.757 | DEBUG    | __main__:trials:26 - Trial = 22123/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.758 | DEBUG    | __main__:trials:29 - Trial = 22123/30000 | Total reward = 30.62
2022-01-26 14:18:13.761 | DEBUG    | __main__:trials:24 - Trial = 22124/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.762 | DEBUG    | __main__:trials:29 - Trial = 22124/30000 | Total reward = 48.48
2022-01-26 14:18:13.765 | DEBUG    | __main__:trials:24 - Trial = 22125/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.766 | DEBUG    | __main__:trials:29 - Trial = 22125/30000 | Total reward = 44.75
2022-01-26 14:18:13.770 | DEBUG    | __main__:trials:24 - Trial = 22126/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.770 | DEBUG    | __main__:trials:29 - Trial = 22126/30000 | Total reward = 38.42
2022-01-26 14:18:13.773 | DEBUG    | __main__:trials:24 - Trial = 22127/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.774 | DEBUG    | __main__:trials:29 - Trial = 22127/30000 | Total reward = 50.25
2022-01-26 14:18:13.778 | DEBUG    | __main__:trials:24 - Trial = 22128/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.779 | DEBUG    | __main__:trials:29 - Trial = 22128/30000 | Total reward = 52.97
2022-01-26 14:18:13.782 | DEBUG    | __main__:trials:24 - Trial = 22129/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.784 | DEBUG    | __main__:trials:29 - Trial = 22129/30000 | Total reward = 51.39
2022-01-26 14:18:13.788 | DEBUG    | __main__:trials:24 - Trial = 22130/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.789 | DEBUG    | __main__:trials:29 - Trial = 22130/30000 | Total reward = 38.09
2022-01-26 14:18:13.792 | DEBUG    | __main__:trials:24 - Trial = 22131/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.794 | DEBUG    | __main__:trials:29 - Trial = 22131/30000 | Total reward = 36.71
2022-01-26 14:18:13.797 | DEBUG    | __main__:trials:24 - Trial = 22132/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.797 | DEBUG    | __main__:trials:29 - Trial = 22132/30000 | Total reward = 35.58
2022-01-26 14:18:13.801 | DEBUG    | __main__:trials:24 - Trial = 22133/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.801 | DEBUG    | __main__:trials:29 - Trial = 22133/30000 | Total reward = 33.50
2022-01-26 14:18:13.805 | DEBUG    | __main__:trials:24 - Trial = 22134/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.805 | DEBUG    | __main__:trials:29 - Trial = 22134/30000 | Total reward = 58.99
2022-01-26 14:18:13.809 | DEBUG    | __main__:trials:24 - Trial = 22135/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.809 | DEBUG    | __main__:trials:29 - Trial = 22135/30000 | Total reward = 41.34
2022-01-26 14:18:13.813 | DEBUG    | __main__:trials:24 - Trial = 22136/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.813 | DEBUG    | __main__:trials:29 - Trial = 22136/30000 | Total reward = 42.05
2022-01-26 14:18:13.817 | DEBUG    | __main__:trials:24 - Trial = 22137/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.817 | DEBUG    | __main__:trials:29 - Trial = 22137/30000 | Total reward = 31.32
2022-01-26 14:18:13.821 | DEBUG    | __main__:trials:24 - Trial = 22138/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.821 | DEBUG    | __main__:trials:29 - Trial = 22138/30000 | Total reward = 33.67
2022-01-26 14:18:13.825 | DEBUG    | __main__:trials:24 - Trial = 22139/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.827 | DEBUG    | __main__:trials:29 - Trial = 22139/30000 | Total reward = 39.60
2022-01-26 14:18:13.830 | DEBUG    | __main__:trials:24 - Trial = 22140/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.831 | DEBUG    | __main__:trials:29 - Trial = 22140/30000 | Total reward = 37.21
2022-01-26 14:18:13.834 | DEBUG    | __main__:trials:24 - Trial = 22141/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.835 | DEBUG    | __main__:trials:29 - Trial = 22141/30000 | Total reward = 39.00
2022-01-26 14:18:13.839 | DEBUG    | __main__:trials:24 - Trial = 22142/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.840 | DEBUG    | __main__:trials:29 - Trial = 22142/30000 | Total reward = 33.97
2022-01-26 14:18:13.843 | DEBUG    | __main__:trials:24 - Trial = 22143/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.844 | DEBUG    | __main__:trials:29 - Trial = 22143/30000 | Total reward = 38.65
2022-01-26 14:18:13.847 | DEBUG    | __main__:trials:26 - Trial = 22144/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.848 | DEBUG    | __main__:trials:29 - Trial = 22144/30000 | Total reward = 21.01
2022-01-26 14:18:13.851 | DEBUG    | __main__:trials:24 - Trial = 22145/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.852 | DEBUG    | __main__:trials:29 - Trial = 22145/30000 | Total reward = 33.91
2022-01-26 14:18:13.855 | DEBUG    | __main__:trials:26 - Trial = 22146/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.856 | DEBUG    | __main__:trials:29 - Trial = 22146/30000 | Total reward = 35.46
2022-01-26 14:18:13.861 | DEBUG    | __main__:trials:24 - Trial = 22147/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.862 | DEBUG    | __main__:trials:29 - Trial = 22147/30000 | Total reward = 38.25
2022-01-26 14:18:13.865 | DEBUG    | __main__:trials:24 - Trial = 22148/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.866 | DEBUG    | __main__:trials:29 - Trial = 22148/30000 | Total reward = 35.69
2022-01-26 14:18:13.869 | DEBUG    | __main__:trials:26 - Trial = 22149/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:13.870 | DEBUG    | __main__:trials:29 - Trial = 22149/30000 | Total reward = 31.02
2022-01-26 14:18:13.873 | DEBUG    | __main__:trials:24 - Trial = 22150/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.874 | DEBUG    | __main__:trials:29 - Trial = 22150/30000 | Total reward = 49.06
2022-01-26 14:18:13.878 | DEBUG    | __main__:trials:24 - Trial = 22151/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.880 | DEBUG    | __main__:trials:29 - Trial = 22151/30000 | Total reward = 48.55
2022-01-26 14:18:13.883 | DEBUG    | __main__:trials:24 - Trial = 22152/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.883 | DEBUG    | __main__:trials:29 - Trial = 22152/30000 | Total reward = 41.79
2022-01-26 14:18:13.887 | DEBUG    | __main__:trials:24 - Trial = 22153/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.887 | DEBUG    | __main__:trials:29 - Trial = 22153/30000 | Total reward = 46.06
2022-01-26 14:18:13.892 | DEBUG    | __main__:trials:24 - Trial = 22154/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.893 | DEBUG    | __main__:trials:29 - Trial = 22154/30000 | Total reward = 36.00
2022-01-26 14:18:13.896 | DEBUG    | __main__:trials:24 - Trial = 22155/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.897 | DEBUG    | __main__:trials:29 - Trial = 22155/30000 | Total reward = 41.66
2022-01-26 14:18:13.900 | DEBUG    | __main__:trials:24 - Trial = 22156/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.901 | DEBUG    | __main__:trials:29 - Trial = 22156/30000 | Total reward = 58.15
2022-01-26 14:18:13.904 | DEBUG    | __main__:trials:24 - Trial = 22157/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.906 | DEBUG    | __main__:trials:29 - Trial = 22157/30000 | Total reward = 39.45
2022-01-26 14:18:13.909 | DEBUG    | __main__:trials:24 - Trial = 22158/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.910 | DEBUG    | __main__:trials:29 - Trial = 22158/30000 | Total reward = 30.17
2022-01-26 14:18:13.913 | DEBUG    | __main__:trials:24 - Trial = 22159/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.914 | DEBUG    | __main__:trials:29 - Trial = 22159/30000 | Total reward = 49.15
2022-01-26 14:18:13.917 | DEBUG    | __main__:trials:24 - Trial = 22160/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.918 | DEBUG    | __main__:trials:29 - Trial = 22160/30000 | Total reward = 37.94
2022-01-26 14:18:13.922 | DEBUG    | __main__:trials:24 - Trial = 22161/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.923 | DEBUG    | __main__:trials:29 - Trial = 22161/30000 | Total reward = 52.09
2022-01-26 14:18:13.927 | DEBUG    | __main__:trials:24 - Trial = 22162/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.928 | DEBUG    | __main__:trials:29 - Trial = 22162/30000 | Total reward = 37.77
2022-01-26 14:18:13.932 | DEBUG    | __main__:trials:24 - Trial = 22163/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.933 | DEBUG    | __main__:trials:29 - Trial = 22163/30000 | Total reward = 38.24
2022-01-26 14:18:13.936 | DEBUG    | __main__:trials:24 - Trial = 22164/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.937 | DEBUG    | __main__:trials:29 - Trial = 22164/30000 | Total reward = 35.66
2022-01-26 14:18:13.941 | DEBUG    | __main__:trials:24 - Trial = 22165/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.943 | DEBUG    | __main__:trials:29 - Trial = 22165/30000 | Total reward = 47.11
2022-01-26 14:18:13.946 | DEBUG    | __main__:trials:24 - Trial = 22166/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.947 | DEBUG    | __main__:trials:29 - Trial = 22166/30000 | Total reward = 66.84
2022-01-26 14:18:13.951 | DEBUG    | __main__:trials:24 - Trial = 22167/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.952 | DEBUG    | __main__:trials:29 - Trial = 22167/30000 | Total reward = 35.27
2022-01-26 14:18:13.956 | DEBUG    | __main__:trials:24 - Trial = 22168/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.957 | DEBUG    | __main__:trials:29 - Trial = 22168/30000 | Total reward = 44.76
2022-01-26 14:18:13.961 | DEBUG    | __main__:trials:24 - Trial = 22169/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.963 | DEBUG    | __main__:trials:29 - Trial = 22169/30000 | Total reward = 46.60
2022-01-26 14:18:13.967 | DEBUG    | __main__:trials:24 - Trial = 22170/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.968 | DEBUG    | __main__:trials:29 - Trial = 22170/30000 | Total reward = 46.91
2022-01-26 14:18:13.972 | DEBUG    | __main__:trials:24 - Trial = 22171/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.973 | DEBUG    | __main__:trials:29 - Trial = 22171/30000 | Total reward = 41.99
2022-01-26 14:18:13.977 | DEBUG    | __main__:trials:24 - Trial = 22172/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.978 | DEBUG    | __main__:trials:29 - Trial = 22172/30000 | Total reward = 32.01
2022-01-26 14:18:13.982 | DEBUG    | __main__:trials:24 - Trial = 22173/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.984 | DEBUG    | __main__:trials:29 - Trial = 22173/30000 | Total reward = 37.31
2022-01-26 14:18:13.988 | DEBUG    | __main__:trials:24 - Trial = 22174/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.990 | DEBUG    | __main__:trials:29 - Trial = 22174/30000 | Total reward = 38.11
2022-01-26 14:18:13.993 | DEBUG    | __main__:trials:24 - Trial = 22175/30000 | Max number of steps (20) reached
2022-01-26 14:18:13.995 | DEBUG    | __main__:trials:29 - Trial = 22175/30000 | Total reward = 39.81
2022-01-26 14:18:13.999 | DEBUG    | __main__:trials:24 - Trial = 22176/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.000 | DEBUG    | __main__:trials:29 - Trial = 22176/30000 | Total reward = 37.04
2022-01-26 14:18:14.004 | DEBUG    | __main__:trials:24 - Trial = 22177/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.006 | DEBUG    | __main__:trials:29 - Trial = 22177/30000 | Total reward = 38.89
2022-01-26 14:18:14.009 | DEBUG    | __main__:trials:24 - Trial = 22178/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.010 | DEBUG    | __main__:trials:29 - Trial = 22178/30000 | Total reward = 19.82
2022-01-26 14:18:14.015 | DEBUG    | __main__:trials:24 - Trial = 22179/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.016 | DEBUG    | __main__:trials:29 - Trial = 22179/30000 | Total reward = 36.21
2022-01-26 14:18:14.020 | DEBUG    | __main__:trials:24 - Trial = 22180/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.022 | DEBUG    | __main__:trials:29 - Trial = 22180/30000 | Total reward = 39.89
2022-01-26 14:18:14.025 | DEBUG    | __main__:trials:24 - Trial = 22181/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.027 | DEBUG    | __main__:trials:29 - Trial = 22181/30000 | Total reward = 42.24
2022-01-26 14:18:14.030 | DEBUG    | __main__:trials:24 - Trial = 22182/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.032 | DEBUG    | __main__:trials:29 - Trial = 22182/30000 | Total reward = 41.54
2022-01-26 14:18:14.035 | DEBUG    | __main__:trials:24 - Trial = 22183/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.037 | DEBUG    | __main__:trials:29 - Trial = 22183/30000 | Total reward = 43.55
2022-01-26 14:18:14.040 | DEBUG    | __main__:trials:24 - Trial = 22184/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.042 | DEBUG    | __main__:trials:29 - Trial = 22184/30000 | Total reward = 38.73
2022-01-26 14:18:14.045 | DEBUG    | __main__:trials:24 - Trial = 22185/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.047 | DEBUG    | __main__:trials:29 - Trial = 22185/30000 | Total reward = 54.31
2022-01-26 14:18:14.050 | DEBUG    | __main__:trials:24 - Trial = 22186/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.052 | DEBUG    | __main__:trials:29 - Trial = 22186/30000 | Total reward = 43.82
2022-01-26 14:18:14.055 | DEBUG    | __main__:trials:24 - Trial = 22187/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.056 | DEBUG    | __main__:trials:29 - Trial = 22187/30000 | Total reward = 51.94
2022-01-26 14:18:14.061 | DEBUG    | __main__:trials:24 - Trial = 22188/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.062 | DEBUG    | __main__:trials:29 - Trial = 22188/30000 | Total reward = 39.31
2022-01-26 14:18:14.065 | DEBUG    | __main__:trials:24 - Trial = 22189/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.066 | DEBUG    | __main__:trials:29 - Trial = 22189/30000 | Total reward = 43.18
2022-01-26 14:18:14.069 | DEBUG    | __main__:trials:24 - Trial = 22190/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.070 | DEBUG    | __main__:trials:29 - Trial = 22190/30000 | Total reward = 49.92
2022-01-26 14:18:14.074 | DEBUG    | __main__:trials:24 - Trial = 22191/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.075 | DEBUG    | __main__:trials:29 - Trial = 22191/30000 | Total reward = 45.20
2022-01-26 14:18:14.079 | DEBUG    | __main__:trials:24 - Trial = 22192/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.079 | DEBUG    | __main__:trials:29 - Trial = 22192/30000 | Total reward = 31.57
2022-01-26 14:18:14.084 | DEBUG    | __main__:trials:24 - Trial = 22193/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.084 | DEBUG    | __main__:trials:29 - Trial = 22193/30000 | Total reward = 34.50
2022-01-26 14:18:14.088 | DEBUG    | __main__:trials:24 - Trial = 22194/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.090 | DEBUG    | __main__:trials:29 - Trial = 22194/30000 | Total reward = 38.62
2022-01-26 14:18:14.093 | DEBUG    | __main__:trials:24 - Trial = 22195/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.095 | DEBUG    | __main__:trials:29 - Trial = 22195/30000 | Total reward = 38.01
2022-01-26 14:18:14.099 | DEBUG    | __main__:trials:24 - Trial = 22196/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.100 | DEBUG    | __main__:trials:29 - Trial = 22196/30000 | Total reward = 50.61
2022-01-26 14:18:14.103 | DEBUG    | __main__:trials:24 - Trial = 22197/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.105 | DEBUG    | __main__:trials:29 - Trial = 22197/30000 | Total reward = 45.75
2022-01-26 14:18:14.109 | DEBUG    | __main__:trials:24 - Trial = 22198/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.109 | DEBUG    | __main__:trials:29 - Trial = 22198/30000 | Total reward = 48.02
2022-01-26 14:18:14.113 | DEBUG    | __main__:trials:24 - Trial = 22199/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.115 | DEBUG    | __main__:trials:29 - Trial = 22199/30000 | Total reward = 38.94
2022-01-26 14:18:14.119 | DEBUG    | __main__:trials:24 - Trial = 22200/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.120 | DEBUG    | __main__:trials:29 - Trial = 22200/30000 | Total reward = 40.77
2022-01-26 14:18:14.123 | DEBUG    | __main__:trials:24 - Trial = 22201/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.125 | DEBUG    | __main__:trials:29 - Trial = 22201/30000 | Total reward = 43.43
2022-01-26 14:18:14.129 | DEBUG    | __main__:trials:24 - Trial = 22202/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.130 | DEBUG    | __main__:trials:29 - Trial = 22202/30000 | Total reward = 29.80
2022-01-26 14:18:14.134 | DEBUG    | __main__:trials:24 - Trial = 22203/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.136 | DEBUG    | __main__:trials:29 - Trial = 22203/30000 | Total reward = 43.50
2022-01-26 14:18:14.140 | DEBUG    | __main__:trials:24 - Trial = 22204/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.141 | DEBUG    | __main__:trials:29 - Trial = 22204/30000 | Total reward = 27.76
2022-01-26 14:18:14.144 | DEBUG    | __main__:trials:24 - Trial = 22205/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.145 | DEBUG    | __main__:trials:29 - Trial = 22205/30000 | Total reward = 34.34
2022-01-26 14:18:14.150 | DEBUG    | __main__:trials:24 - Trial = 22206/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.151 | DEBUG    | __main__:trials:29 - Trial = 22206/30000 | Total reward = 33.77
2022-01-26 14:18:14.154 | DEBUG    | __main__:trials:24 - Trial = 22207/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.156 | DEBUG    | __main__:trials:29 - Trial = 22207/30000 | Total reward = 44.98
2022-01-26 14:18:14.160 | DEBUG    | __main__:trials:24 - Trial = 22208/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.162 | DEBUG    | __main__:trials:29 - Trial = 22208/30000 | Total reward = 39.95
2022-01-26 14:18:14.165 | DEBUG    | __main__:trials:24 - Trial = 22209/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.166 | DEBUG    | __main__:trials:29 - Trial = 22209/30000 | Total reward = 42.15
2022-01-26 14:18:14.170 | DEBUG    | __main__:trials:24 - Trial = 22210/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.172 | DEBUG    | __main__:trials:29 - Trial = 22210/30000 | Total reward = 29.26
2022-01-26 14:18:14.176 | DEBUG    | __main__:trials:24 - Trial = 22211/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.177 | DEBUG    | __main__:trials:29 - Trial = 22211/30000 | Total reward = 41.12
2022-01-26 14:18:14.181 | DEBUG    | __main__:trials:26 - Trial = 22212/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.181 | DEBUG    | __main__:trials:29 - Trial = 22212/30000 | Total reward = 21.98
2022-01-26 14:18:14.186 | DEBUG    | __main__:trials:24 - Trial = 22213/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.187 | DEBUG    | __main__:trials:29 - Trial = 22213/30000 | Total reward = 40.32
2022-01-26 14:18:14.191 | DEBUG    | __main__:trials:24 - Trial = 22214/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.192 | DEBUG    | __main__:trials:29 - Trial = 22214/30000 | Total reward = 44.31
2022-01-26 14:18:14.195 | DEBUG    | __main__:trials:24 - Trial = 22215/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.197 | DEBUG    | __main__:trials:29 - Trial = 22215/30000 | Total reward = 41.07
2022-01-26 14:18:14.200 | DEBUG    | __main__:trials:24 - Trial = 22216/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.202 | DEBUG    | __main__:trials:29 - Trial = 22216/30000 | Total reward = 49.04
2022-01-26 14:18:14.205 | DEBUG    | __main__:trials:24 - Trial = 22217/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.207 | DEBUG    | __main__:trials:29 - Trial = 22217/30000 | Total reward = 34.41
2022-01-26 14:18:14.210 | DEBUG    | __main__:trials:24 - Trial = 22218/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.210 | DEBUG    | __main__:trials:29 - Trial = 22218/30000 | Total reward = 39.55
2022-01-26 14:18:14.214 | DEBUG    | __main__:trials:24 - Trial = 22219/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.215 | DEBUG    | __main__:trials:29 - Trial = 22219/30000 | Total reward = 35.33
2022-01-26 14:18:14.219 | DEBUG    | __main__:trials:24 - Trial = 22220/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.219 | DEBUG    | __main__:trials:29 - Trial = 22220/30000 | Total reward = 51.80
2022-01-26 14:18:14.223 | DEBUG    | __main__:trials:24 - Trial = 22221/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.225 | DEBUG    | __main__:trials:29 - Trial = 22221/30000 | Total reward = 38.44
2022-01-26 14:18:14.227 | DEBUG    | __main__:trials:24 - Trial = 22222/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.228 | DEBUG    | __main__:trials:29 - Trial = 22222/30000 | Total reward = 35.29
2022-01-26 14:18:14.232 | DEBUG    | __main__:trials:24 - Trial = 22223/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.233 | DEBUG    | __main__:trials:29 - Trial = 22223/30000 | Total reward = 38.10
2022-01-26 14:18:14.236 | DEBUG    | __main__:trials:24 - Trial = 22224/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.238 | DEBUG    | __main__:trials:29 - Trial = 22224/30000 | Total reward = 37.15
2022-01-26 14:18:14.242 | DEBUG    | __main__:trials:24 - Trial = 22225/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.243 | DEBUG    | __main__:trials:29 - Trial = 22225/30000 | Total reward = 34.06
2022-01-26 14:18:14.246 | DEBUG    | __main__:trials:24 - Trial = 22226/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.247 | DEBUG    | __main__:trials:29 - Trial = 22226/30000 | Total reward = 39.16
2022-01-26 14:18:14.250 | DEBUG    | __main__:trials:26 - Trial = 22227/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.251 | DEBUG    | __main__:trials:29 - Trial = 22227/30000 | Total reward = 27.17
2022-01-26 14:18:14.254 | DEBUG    | __main__:trials:24 - Trial = 22228/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.256 | DEBUG    | __main__:trials:29 - Trial = 22228/30000 | Total reward = 30.42
2022-01-26 14:18:14.259 | DEBUG    | __main__:trials:24 - Trial = 22229/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.261 | DEBUG    | __main__:trials:29 - Trial = 22229/30000 | Total reward = 62.13
2022-01-26 14:18:14.265 | DEBUG    | __main__:trials:24 - Trial = 22230/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.266 | DEBUG    | __main__:trials:29 - Trial = 22230/30000 | Total reward = 34.98
2022-01-26 14:18:14.269 | DEBUG    | __main__:trials:24 - Trial = 22231/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.270 | DEBUG    | __main__:trials:29 - Trial = 22231/30000 | Total reward = 39.85
2022-01-26 14:18:14.274 | DEBUG    | __main__:trials:24 - Trial = 22232/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.274 | DEBUG    | __main__:trials:29 - Trial = 22232/30000 | Total reward = 37.16
2022-01-26 14:18:14.278 | DEBUG    | __main__:trials:24 - Trial = 22233/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.278 | DEBUG    | __main__:trials:29 - Trial = 22233/30000 | Total reward = 40.99
2022-01-26 14:18:14.282 | DEBUG    | __main__:trials:24 - Trial = 22234/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.284 | DEBUG    | __main__:trials:29 - Trial = 22234/30000 | Total reward = 43.65
2022-01-26 14:18:14.288 | DEBUG    | __main__:trials:26 - Trial = 22235/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.289 | DEBUG    | __main__:trials:29 - Trial = 22235/30000 | Total reward = 37.11
2022-01-26 14:18:14.292 | DEBUG    | __main__:trials:24 - Trial = 22236/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.294 | DEBUG    | __main__:trials:29 - Trial = 22236/30000 | Total reward = 45.08
2022-01-26 14:18:14.297 | DEBUG    | __main__:trials:24 - Trial = 22237/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.298 | DEBUG    | __main__:trials:29 - Trial = 22237/30000 | Total reward = 34.13
2022-01-26 14:18:14.301 | DEBUG    | __main__:trials:24 - Trial = 22238/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.302 | DEBUG    | __main__:trials:29 - Trial = 22238/30000 | Total reward = 23.02
2022-01-26 14:18:14.305 | DEBUG    | __main__:trials:24 - Trial = 22239/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.307 | DEBUG    | __main__:trials:29 - Trial = 22239/30000 | Total reward = 35.85
2022-01-26 14:18:14.310 | DEBUG    | __main__:trials:24 - Trial = 22240/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.312 | DEBUG    | __main__:trials:29 - Trial = 22240/30000 | Total reward = 47.29
2022-01-26 14:18:14.315 | DEBUG    | __main__:trials:24 - Trial = 22241/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.316 | DEBUG    | __main__:trials:29 - Trial = 22241/30000 | Total reward = 44.93
2022-01-26 14:18:14.319 | DEBUG    | __main__:trials:24 - Trial = 22242/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.320 | DEBUG    | __main__:trials:29 - Trial = 22242/30000 | Total reward = 62.35
2022-01-26 14:18:14.323 | DEBUG    | __main__:trials:24 - Trial = 22243/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.325 | DEBUG    | __main__:trials:29 - Trial = 22243/30000 | Total reward = 45.98
2022-01-26 14:18:14.328 | DEBUG    | __main__:trials:24 - Trial = 22244/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.329 | DEBUG    | __main__:trials:29 - Trial = 22244/30000 | Total reward = 46.83
2022-01-26 14:18:14.332 | DEBUG    | __main__:trials:24 - Trial = 22245/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.334 | DEBUG    | __main__:trials:29 - Trial = 22245/30000 | Total reward = 27.02
2022-01-26 14:18:14.338 | DEBUG    | __main__:trials:24 - Trial = 22246/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.338 | DEBUG    | __main__:trials:29 - Trial = 22246/30000 | Total reward = 37.08
2022-01-26 14:18:14.342 | DEBUG    | __main__:trials:24 - Trial = 22247/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.344 | DEBUG    | __main__:trials:29 - Trial = 22247/30000 | Total reward = 39.58
2022-01-26 14:18:14.346 | DEBUG    | __main__:trials:24 - Trial = 22248/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.347 | DEBUG    | __main__:trials:29 - Trial = 22248/30000 | Total reward = 39.57
2022-01-26 14:18:14.351 | DEBUG    | __main__:trials:24 - Trial = 22249/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.352 | DEBUG    | __main__:trials:29 - Trial = 22249/30000 | Total reward = 43.02
2022-01-26 14:18:14.355 | DEBUG    | __main__:trials:24 - Trial = 22250/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.357 | DEBUG    | __main__:trials:29 - Trial = 22250/30000 | Total reward = 56.02
2022-01-26 14:18:14.360 | DEBUG    | __main__:trials:24 - Trial = 22251/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.361 | DEBUG    | __main__:trials:29 - Trial = 22251/30000 | Total reward = 44.35
2022-01-26 14:18:14.364 | DEBUG    | __main__:trials:24 - Trial = 22252/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.365 | DEBUG    | __main__:trials:29 - Trial = 22252/30000 | Total reward = 45.36
2022-01-26 14:18:14.368 | DEBUG    | __main__:trials:24 - Trial = 22253/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.370 | DEBUG    | __main__:trials:29 - Trial = 22253/30000 | Total reward = 46.73
2022-01-26 14:18:14.373 | DEBUG    | __main__:trials:24 - Trial = 22254/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.374 | DEBUG    | __main__:trials:29 - Trial = 22254/30000 | Total reward = 50.47
2022-01-26 14:18:14.377 | DEBUG    | __main__:trials:24 - Trial = 22255/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.378 | DEBUG    | __main__:trials:29 - Trial = 22255/30000 | Total reward = 35.25
2022-01-26 14:18:14.381 | DEBUG    | __main__:trials:24 - Trial = 22256/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.383 | DEBUG    | __main__:trials:29 - Trial = 22256/30000 | Total reward = 38.30
2022-01-26 14:18:14.385 | DEBUG    | __main__:trials:24 - Trial = 22257/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.387 | DEBUG    | __main__:trials:29 - Trial = 22257/30000 | Total reward = 46.01
2022-01-26 14:18:14.390 | DEBUG    | __main__:trials:24 - Trial = 22258/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.391 | DEBUG    | __main__:trials:29 - Trial = 22258/30000 | Total reward = 47.36
2022-01-26 14:18:14.394 | DEBUG    | __main__:trials:24 - Trial = 22259/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.396 | DEBUG    | __main__:trials:29 - Trial = 22259/30000 | Total reward = 32.29
2022-01-26 14:18:14.399 | DEBUG    | __main__:trials:24 - Trial = 22260/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.400 | DEBUG    | __main__:trials:29 - Trial = 22260/30000 | Total reward = 47.49
2022-01-26 14:18:14.403 | DEBUG    | __main__:trials:24 - Trial = 22261/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.404 | DEBUG    | __main__:trials:29 - Trial = 22261/30000 | Total reward = 49.55
2022-01-26 14:18:14.408 | DEBUG    | __main__:trials:24 - Trial = 22262/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.408 | DEBUG    | __main__:trials:29 - Trial = 22262/30000 | Total reward = 41.04
2022-01-26 14:18:14.412 | DEBUG    | __main__:trials:24 - Trial = 22263/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.412 | DEBUG    | __main__:trials:29 - Trial = 22263/30000 | Total reward = 45.23
2022-01-26 14:18:14.416 | DEBUG    | __main__:trials:24 - Trial = 22264/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.416 | DEBUG    | __main__:trials:29 - Trial = 22264/30000 | Total reward = 46.65
2022-01-26 14:18:14.420 | DEBUG    | __main__:trials:24 - Trial = 22265/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.420 | DEBUG    | __main__:trials:29 - Trial = 22265/30000 | Total reward = 50.58
2022-01-26 14:18:14.424 | DEBUG    | __main__:trials:24 - Trial = 22266/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.424 | DEBUG    | __main__:trials:29 - Trial = 22266/30000 | Total reward = 45.32
2022-01-26 14:18:14.428 | DEBUG    | __main__:trials:24 - Trial = 22267/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.429 | DEBUG    | __main__:trials:29 - Trial = 22267/30000 | Total reward = 57.65
2022-01-26 14:18:14.433 | DEBUG    | __main__:trials:24 - Trial = 22268/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.434 | DEBUG    | __main__:trials:29 - Trial = 22268/30000 | Total reward = 55.04
2022-01-26 14:18:14.437 | DEBUG    | __main__:trials:24 - Trial = 22269/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.438 | DEBUG    | __main__:trials:29 - Trial = 22269/30000 | Total reward = 41.10
2022-01-26 14:18:14.441 | DEBUG    | __main__:trials:24 - Trial = 22270/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.442 | DEBUG    | __main__:trials:29 - Trial = 22270/30000 | Total reward = 46.93
2022-01-26 14:18:14.446 | DEBUG    | __main__:trials:24 - Trial = 22271/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.448 | DEBUG    | __main__:trials:29 - Trial = 22271/30000 | Total reward = 49.85
2022-01-26 14:18:14.451 | DEBUG    | __main__:trials:24 - Trial = 22272/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.453 | DEBUG    | __main__:trials:29 - Trial = 22272/30000 | Total reward = 46.51
2022-01-26 14:18:14.456 | DEBUG    | __main__:trials:24 - Trial = 22273/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.457 | DEBUG    | __main__:trials:29 - Trial = 22273/30000 | Total reward = 45.52
2022-01-26 14:18:14.460 | DEBUG    | __main__:trials:24 - Trial = 22274/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.462 | DEBUG    | __main__:trials:29 - Trial = 22274/30000 | Total reward = 47.36
2022-01-26 14:18:14.466 | DEBUG    | __main__:trials:24 - Trial = 22275/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.467 | DEBUG    | __main__:trials:29 - Trial = 22275/30000 | Total reward = 48.68
2022-01-26 14:18:14.471 | DEBUG    | __main__:trials:24 - Trial = 22276/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.473 | DEBUG    | __main__:trials:29 - Trial = 22276/30000 | Total reward = 49.55
2022-01-26 14:18:14.476 | DEBUG    | __main__:trials:24 - Trial = 22277/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.477 | DEBUG    | __main__:trials:29 - Trial = 22277/30000 | Total reward = 49.68
2022-01-26 14:18:14.481 | DEBUG    | __main__:trials:24 - Trial = 22278/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.482 | DEBUG    | __main__:trials:29 - Trial = 22278/30000 | Total reward = 42.30
2022-01-26 14:18:14.486 | DEBUG    | __main__:trials:24 - Trial = 22279/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.487 | DEBUG    | __main__:trials:29 - Trial = 22279/30000 | Total reward = 35.00
2022-01-26 14:18:14.491 | DEBUG    | __main__:trials:24 - Trial = 22280/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.493 | DEBUG    | __main__:trials:29 - Trial = 22280/30000 | Total reward = 49.59
2022-01-26 14:18:14.496 | DEBUG    | __main__:trials:24 - Trial = 22281/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.497 | DEBUG    | __main__:trials:29 - Trial = 22281/30000 | Total reward = 65.59
2022-01-26 14:18:14.501 | DEBUG    | __main__:trials:24 - Trial = 22282/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.502 | DEBUG    | __main__:trials:29 - Trial = 22282/30000 | Total reward = 35.90
2022-01-26 14:18:14.507 | DEBUG    | __main__:trials:24 - Trial = 22283/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.507 | DEBUG    | __main__:trials:29 - Trial = 22283/30000 | Total reward = 31.21
2022-01-26 14:18:14.512 | DEBUG    | __main__:trials:24 - Trial = 22284/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.513 | DEBUG    | __main__:trials:29 - Trial = 22284/30000 | Total reward = 47.20
2022-01-26 14:18:14.517 | DEBUG    | __main__:trials:24 - Trial = 22285/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.518 | DEBUG    | __main__:trials:29 - Trial = 22285/30000 | Total reward = 47.30
2022-01-26 14:18:14.522 | DEBUG    | __main__:trials:24 - Trial = 22286/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.523 | DEBUG    | __main__:trials:29 - Trial = 22286/30000 | Total reward = 37.74
2022-01-26 14:18:14.527 | DEBUG    | __main__:trials:24 - Trial = 22287/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.528 | DEBUG    | __main__:trials:29 - Trial = 22287/30000 | Total reward = 29.25
2022-01-26 14:18:14.532 | DEBUG    | __main__:trials:24 - Trial = 22288/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.534 | DEBUG    | __main__:trials:29 - Trial = 22288/30000 | Total reward = 35.02
2022-01-26 14:18:14.537 | DEBUG    | __main__:trials:24 - Trial = 22289/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.538 | DEBUG    | __main__:trials:29 - Trial = 22289/30000 | Total reward = 39.60
2022-01-26 14:18:14.543 | DEBUG    | __main__:trials:24 - Trial = 22290/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.543 | DEBUG    | __main__:trials:29 - Trial = 22290/30000 | Total reward = 44.61
2022-01-26 14:18:14.548 | DEBUG    | __main__:trials:24 - Trial = 22291/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.549 | DEBUG    | __main__:trials:29 - Trial = 22291/30000 | Total reward = 48.09
2022-01-26 14:18:14.552 | DEBUG    | __main__:trials:24 - Trial = 22292/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.554 | DEBUG    | __main__:trials:29 - Trial = 22292/30000 | Total reward = 37.29
2022-01-26 14:18:14.557 | DEBUG    | __main__:trials:24 - Trial = 22293/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.558 | DEBUG    | __main__:trials:29 - Trial = 22293/30000 | Total reward = 42.97
2022-01-26 14:18:14.561 | DEBUG    | __main__:trials:24 - Trial = 22294/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.563 | DEBUG    | __main__:trials:29 - Trial = 22294/30000 | Total reward = 35.54
2022-01-26 14:18:14.566 | DEBUG    | __main__:trials:24 - Trial = 22295/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.567 | DEBUG    | __main__:trials:29 - Trial = 22295/30000 | Total reward = 50.89
2022-01-26 14:18:14.572 | DEBUG    | __main__:trials:24 - Trial = 22296/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.572 | DEBUG    | __main__:trials:29 - Trial = 22296/30000 | Total reward = 66.26
2022-01-26 14:18:14.577 | DEBUG    | __main__:trials:24 - Trial = 22297/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.578 | DEBUG    | __main__:trials:29 - Trial = 22297/30000 | Total reward = 47.20
2022-01-26 14:18:14.582 | DEBUG    | __main__:trials:24 - Trial = 22298/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.584 | DEBUG    | __main__:trials:29 - Trial = 22298/30000 | Total reward = 61.91
2022-01-26 14:18:14.587 | DEBUG    | __main__:trials:24 - Trial = 22299/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.588 | DEBUG    | __main__:trials:29 - Trial = 22299/30000 | Total reward = 49.68
2022-01-26 14:18:14.591 | DEBUG    | __main__:trials:24 - Trial = 22300/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.593 | DEBUG    | __main__:trials:29 - Trial = 22300/30000 | Total reward = 53.38
2022-01-26 14:18:14.596 | DEBUG    | __main__:trials:24 - Trial = 22301/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.598 | DEBUG    | __main__:trials:29 - Trial = 22301/30000 | Total reward = 35.15
2022-01-26 14:18:14.602 | DEBUG    | __main__:trials:24 - Trial = 22302/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.604 | DEBUG    | __main__:trials:29 - Trial = 22302/30000 | Total reward = 53.58
2022-01-26 14:18:14.608 | DEBUG    | __main__:trials:24 - Trial = 22303/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.609 | DEBUG    | __main__:trials:29 - Trial = 22303/30000 | Total reward = 47.99
2022-01-26 14:18:14.613 | DEBUG    | __main__:trials:24 - Trial = 22304/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.614 | DEBUG    | __main__:trials:29 - Trial = 22304/30000 | Total reward = 39.26
2022-01-26 14:18:14.618 | DEBUG    | __main__:trials:24 - Trial = 22305/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.620 | DEBUG    | __main__:trials:29 - Trial = 22305/30000 | Total reward = 55.26
2022-01-26 14:18:14.624 | DEBUG    | __main__:trials:24 - Trial = 22306/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.625 | DEBUG    | __main__:trials:29 - Trial = 22306/30000 | Total reward = 43.41
2022-01-26 14:18:14.629 | DEBUG    | __main__:trials:24 - Trial = 22307/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.630 | DEBUG    | __main__:trials:29 - Trial = 22307/30000 | Total reward = 35.97
2022-01-26 14:18:14.634 | DEBUG    | __main__:trials:24 - Trial = 22308/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.635 | DEBUG    | __main__:trials:29 - Trial = 22308/30000 | Total reward = 40.12
2022-01-26 14:18:14.638 | DEBUG    | __main__:trials:26 - Trial = 22309/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.640 | DEBUG    | __main__:trials:29 - Trial = 22309/30000 | Total reward = 24.54
2022-01-26 14:18:14.644 | DEBUG    | __main__:trials:24 - Trial = 22310/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.645 | DEBUG    | __main__:trials:29 - Trial = 22310/30000 | Total reward = 46.07
2022-01-26 14:18:14.649 | DEBUG    | __main__:trials:24 - Trial = 22311/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.651 | DEBUG    | __main__:trials:29 - Trial = 22311/30000 | Total reward = 38.14
2022-01-26 14:18:14.655 | DEBUG    | __main__:trials:24 - Trial = 22312/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.656 | DEBUG    | __main__:trials:29 - Trial = 22312/30000 | Total reward = 38.34
2022-01-26 14:18:14.660 | DEBUG    | __main__:trials:24 - Trial = 22313/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.661 | DEBUG    | __main__:trials:29 - Trial = 22313/30000 | Total reward = 48.37
2022-01-26 14:18:14.665 | DEBUG    | __main__:trials:24 - Trial = 22314/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.666 | DEBUG    | __main__:trials:29 - Trial = 22314/30000 | Total reward = 34.07
2022-01-26 14:18:14.670 | DEBUG    | __main__:trials:24 - Trial = 22315/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.671 | DEBUG    | __main__:trials:29 - Trial = 22315/30000 | Total reward = 36.81
2022-01-26 14:18:14.674 | DEBUG    | __main__:trials:24 - Trial = 22316/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.676 | DEBUG    | __main__:trials:29 - Trial = 22316/30000 | Total reward = 49.44
2022-01-26 14:18:14.680 | DEBUG    | __main__:trials:24 - Trial = 22317/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.681 | DEBUG    | __main__:trials:29 - Trial = 22317/30000 | Total reward = 56.32
2022-01-26 14:18:14.685 | DEBUG    | __main__:trials:24 - Trial = 22318/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.686 | DEBUG    | __main__:trials:29 - Trial = 22318/30000 | Total reward = 36.74
2022-01-26 14:18:14.690 | DEBUG    | __main__:trials:24 - Trial = 22319/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.692 | DEBUG    | __main__:trials:29 - Trial = 22319/30000 | Total reward = 47.10
2022-01-26 14:18:14.696 | DEBUG    | __main__:trials:24 - Trial = 22320/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.697 | DEBUG    | __main__:trials:29 - Trial = 22320/30000 | Total reward = 38.73
2022-01-26 14:18:14.700 | DEBUG    | __main__:trials:24 - Trial = 22321/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.702 | DEBUG    | __main__:trials:29 - Trial = 22321/30000 | Total reward = 27.68
2022-01-26 14:18:14.706 | DEBUG    | __main__:trials:24 - Trial = 22322/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.706 | DEBUG    | __main__:trials:29 - Trial = 22322/30000 | Total reward = 37.35
2022-01-26 14:18:14.711 | DEBUG    | __main__:trials:24 - Trial = 22323/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.713 | DEBUG    | __main__:trials:29 - Trial = 22323/30000 | Total reward = 36.05
2022-01-26 14:18:14.716 | DEBUG    | __main__:trials:24 - Trial = 22324/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.717 | DEBUG    | __main__:trials:29 - Trial = 22324/30000 | Total reward = 37.90
2022-01-26 14:18:14.721 | DEBUG    | __main__:trials:24 - Trial = 22325/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.722 | DEBUG    | __main__:trials:29 - Trial = 22325/30000 | Total reward = 44.05
2022-01-26 14:18:14.725 | DEBUG    | __main__:trials:24 - Trial = 22326/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.726 | DEBUG    | __main__:trials:29 - Trial = 22326/30000 | Total reward = 51.39
2022-01-26 14:18:14.730 | DEBUG    | __main__:trials:24 - Trial = 22327/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.731 | DEBUG    | __main__:trials:29 - Trial = 22327/30000 | Total reward = 40.29
2022-01-26 14:18:14.736 | DEBUG    | __main__:trials:24 - Trial = 22328/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.737 | DEBUG    | __main__:trials:29 - Trial = 22328/30000 | Total reward = 36.23
2022-01-26 14:18:14.741 | DEBUG    | __main__:trials:24 - Trial = 22329/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.743 | DEBUG    | __main__:trials:29 - Trial = 22329/30000 | Total reward = 42.79
2022-01-26 14:18:14.746 | DEBUG    | __main__:trials:24 - Trial = 22330/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.747 | DEBUG    | __main__:trials:29 - Trial = 22330/30000 | Total reward = 44.97
2022-01-26 14:18:14.750 | DEBUG    | __main__:trials:24 - Trial = 22331/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.752 | DEBUG    | __main__:trials:29 - Trial = 22331/30000 | Total reward = 36.87
2022-01-26 14:18:14.755 | DEBUG    | __main__:trials:24 - Trial = 22332/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.757 | DEBUG    | __main__:trials:29 - Trial = 22332/30000 | Total reward = 36.38
2022-01-26 14:18:14.760 | DEBUG    | __main__:trials:26 - Trial = 22333/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.762 | DEBUG    | __main__:trials:29 - Trial = 22333/30000 | Total reward = 25.67
2022-01-26 14:18:14.766 | DEBUG    | __main__:trials:24 - Trial = 22334/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.766 | DEBUG    | __main__:trials:29 - Trial = 22334/30000 | Total reward = 42.43
2022-01-26 14:18:14.771 | DEBUG    | __main__:trials:24 - Trial = 22335/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.773 | DEBUG    | __main__:trials:29 - Trial = 22335/30000 | Total reward = 57.17
2022-01-26 14:18:14.776 | DEBUG    | __main__:trials:24 - Trial = 22336/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.778 | DEBUG    | __main__:trials:29 - Trial = 22336/30000 | Total reward = 33.71
2022-01-26 14:18:14.782 | DEBUG    | __main__:trials:24 - Trial = 22337/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.783 | DEBUG    | __main__:trials:29 - Trial = 22337/30000 | Total reward = 37.94
2022-01-26 14:18:14.787 | DEBUG    | __main__:trials:24 - Trial = 22338/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.789 | DEBUG    | __main__:trials:29 - Trial = 22338/30000 | Total reward = 39.57
2022-01-26 14:18:14.792 | DEBUG    | __main__:trials:24 - Trial = 22339/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.793 | DEBUG    | __main__:trials:29 - Trial = 22339/30000 | Total reward = 36.03
2022-01-26 14:18:14.797 | DEBUG    | __main__:trials:24 - Trial = 22340/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.797 | DEBUG    | __main__:trials:29 - Trial = 22340/30000 | Total reward = 41.00
2022-01-26 14:18:14.802 | DEBUG    | __main__:trials:24 - Trial = 22341/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.802 | DEBUG    | __main__:trials:29 - Trial = 22341/30000 | Total reward = 45.70
2022-01-26 14:18:14.807 | DEBUG    | __main__:trials:24 - Trial = 22342/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.808 | DEBUG    | __main__:trials:29 - Trial = 22342/30000 | Total reward = 36.52
2022-01-26 14:18:14.812 | DEBUG    | __main__:trials:24 - Trial = 22343/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.813 | DEBUG    | __main__:trials:29 - Trial = 22343/30000 | Total reward = 39.57
2022-01-26 14:18:14.816 | DEBUG    | __main__:trials:24 - Trial = 22344/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.817 | DEBUG    | __main__:trials:29 - Trial = 22344/30000 | Total reward = 35.21
2022-01-26 14:18:14.821 | DEBUG    | __main__:trials:24 - Trial = 22345/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.822 | DEBUG    | __main__:trials:29 - Trial = 22345/30000 | Total reward = 30.01
2022-01-26 14:18:14.826 | DEBUG    | __main__:trials:24 - Trial = 22346/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.828 | DEBUG    | __main__:trials:29 - Trial = 22346/30000 | Total reward = 52.29
2022-01-26 14:18:14.831 | DEBUG    | __main__:trials:24 - Trial = 22347/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.832 | DEBUG    | __main__:trials:29 - Trial = 22347/30000 | Total reward = 33.36
2022-01-26 14:18:14.836 | DEBUG    | __main__:trials:24 - Trial = 22348/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.836 | DEBUG    | __main__:trials:29 - Trial = 22348/30000 | Total reward = 33.75
2022-01-26 14:18:14.840 | DEBUG    | __main__:trials:24 - Trial = 22349/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.841 | DEBUG    | __main__:trials:29 - Trial = 22349/30000 | Total reward = 47.70
2022-01-26 14:18:14.844 | DEBUG    | __main__:trials:26 - Trial = 22350/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.846 | DEBUG    | __main__:trials:29 - Trial = 22350/30000 | Total reward = 27.76
2022-01-26 14:18:14.850 | DEBUG    | __main__:trials:24 - Trial = 22351/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.851 | DEBUG    | __main__:trials:29 - Trial = 22351/30000 | Total reward = 48.57
2022-01-26 14:18:14.854 | DEBUG    | __main__:trials:24 - Trial = 22352/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.856 | DEBUG    | __main__:trials:29 - Trial = 22352/30000 | Total reward = 45.76
2022-01-26 14:18:14.859 | DEBUG    | __main__:trials:24 - Trial = 22353/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.861 | DEBUG    | __main__:trials:29 - Trial = 22353/30000 | Total reward = 32.48
2022-01-26 14:18:14.864 | DEBUG    | __main__:trials:24 - Trial = 22354/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.866 | DEBUG    | __main__:trials:29 - Trial = 22354/30000 | Total reward = 37.41
2022-01-26 14:18:14.870 | DEBUG    | __main__:trials:24 - Trial = 22355/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.870 | DEBUG    | __main__:trials:29 - Trial = 22355/30000 | Total reward = 39.98
2022-01-26 14:18:14.875 | DEBUG    | __main__:trials:24 - Trial = 22356/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.876 | DEBUG    | __main__:trials:29 - Trial = 22356/30000 | Total reward = 40.86
2022-01-26 14:18:14.879 | DEBUG    | __main__:trials:24 - Trial = 22357/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.881 | DEBUG    | __main__:trials:29 - Trial = 22357/30000 | Total reward = 38.68
2022-01-26 14:18:14.884 | DEBUG    | __main__:trials:24 - Trial = 22358/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.886 | DEBUG    | __main__:trials:29 - Trial = 22358/30000 | Total reward = 43.90
2022-01-26 14:18:14.889 | DEBUG    | __main__:trials:24 - Trial = 22359/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.890 | DEBUG    | __main__:trials:29 - Trial = 22359/30000 | Total reward = 38.77
2022-01-26 14:18:14.893 | DEBUG    | __main__:trials:24 - Trial = 22360/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.894 | DEBUG    | __main__:trials:29 - Trial = 22360/30000 | Total reward = 34.64
2022-01-26 14:18:14.898 | DEBUG    | __main__:trials:24 - Trial = 22361/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.899 | DEBUG    | __main__:trials:29 - Trial = 22361/30000 | Total reward = 38.80
2022-01-26 14:18:14.903 | DEBUG    | __main__:trials:24 - Trial = 22362/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.904 | DEBUG    | __main__:trials:29 - Trial = 22362/30000 | Total reward = 47.43
2022-01-26 14:18:14.908 | DEBUG    | __main__:trials:26 - Trial = 22363/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.909 | DEBUG    | __main__:trials:29 - Trial = 22363/30000 | Total reward = 30.94
2022-01-26 14:18:14.913 | DEBUG    | __main__:trials:24 - Trial = 22364/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.914 | DEBUG    | __main__:trials:29 - Trial = 22364/30000 | Total reward = 34.85
2022-01-26 14:18:14.918 | DEBUG    | __main__:trials:24 - Trial = 22365/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.920 | DEBUG    | __main__:trials:29 - Trial = 22365/30000 | Total reward = 34.42
2022-01-26 14:18:14.924 | DEBUG    | __main__:trials:24 - Trial = 22366/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.925 | DEBUG    | __main__:trials:29 - Trial = 22366/30000 | Total reward = 37.25
2022-01-26 14:18:14.929 | DEBUG    | __main__:trials:24 - Trial = 22367/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.931 | DEBUG    | __main__:trials:29 - Trial = 22367/30000 | Total reward = 35.32
2022-01-26 14:18:14.934 | DEBUG    | __main__:trials:24 - Trial = 22368/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.935 | DEBUG    | __main__:trials:29 - Trial = 22368/30000 | Total reward = 42.51
2022-01-26 14:18:14.938 | DEBUG    | __main__:trials:24 - Trial = 22369/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.940 | DEBUG    | __main__:trials:29 - Trial = 22369/30000 | Total reward = 36.43
2022-01-26 14:18:14.944 | DEBUG    | __main__:trials:24 - Trial = 22370/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.945 | DEBUG    | __main__:trials:29 - Trial = 22370/30000 | Total reward = 41.78
2022-01-26 14:18:14.949 | DEBUG    | __main__:trials:24 - Trial = 22371/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.951 | DEBUG    | __main__:trials:29 - Trial = 22371/30000 | Total reward = 41.38
2022-01-26 14:18:14.954 | DEBUG    | __main__:trials:24 - Trial = 22372/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.956 | DEBUG    | __main__:trials:29 - Trial = 22372/30000 | Total reward = 56.51
2022-01-26 14:18:14.959 | DEBUG    | __main__:trials:24 - Trial = 22373/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.961 | DEBUG    | __main__:trials:29 - Trial = 22373/30000 | Total reward = 39.18
2022-01-26 14:18:14.964 | DEBUG    | __main__:trials:26 - Trial = 22374/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:14.966 | DEBUG    | __main__:trials:29 - Trial = 22374/30000 | Total reward = 25.27
2022-01-26 14:18:14.969 | DEBUG    | __main__:trials:24 - Trial = 22375/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.970 | DEBUG    | __main__:trials:29 - Trial = 22375/30000 | Total reward = 61.55
2022-01-26 14:18:14.975 | DEBUG    | __main__:trials:24 - Trial = 22376/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.976 | DEBUG    | __main__:trials:29 - Trial = 22376/30000 | Total reward = 35.33
2022-01-26 14:18:14.979 | DEBUG    | __main__:trials:24 - Trial = 22377/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.981 | DEBUG    | __main__:trials:29 - Trial = 22377/30000 | Total reward = 39.57
2022-01-26 14:18:14.984 | DEBUG    | __main__:trials:24 - Trial = 22378/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.986 | DEBUG    | __main__:trials:29 - Trial = 22378/30000 | Total reward = 52.71
2022-01-26 14:18:14.989 | DEBUG    | __main__:trials:24 - Trial = 22379/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.990 | DEBUG    | __main__:trials:29 - Trial = 22379/30000 | Total reward = 40.31
2022-01-26 14:18:14.994 | DEBUG    | __main__:trials:24 - Trial = 22380/30000 | Max number of steps (20) reached
2022-01-26 14:18:14.996 | DEBUG    | __main__:trials:29 - Trial = 22380/30000 | Total reward = 44.22
2022-01-26 14:18:15.000 | DEBUG    | __main__:trials:24 - Trial = 22381/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.001 | DEBUG    | __main__:trials:29 - Trial = 22381/30000 | Total reward = 34.35
2022-01-26 14:18:15.005 | DEBUG    | __main__:trials:24 - Trial = 22382/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.007 | DEBUG    | __main__:trials:29 - Trial = 22382/30000 | Total reward = 32.42
2022-01-26 14:18:15.011 | DEBUG    | __main__:trials:24 - Trial = 22383/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.012 | DEBUG    | __main__:trials:29 - Trial = 22383/30000 | Total reward = 32.63
2022-01-26 14:18:15.016 | DEBUG    | __main__:trials:24 - Trial = 22384/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.018 | DEBUG    | __main__:trials:29 - Trial = 22384/30000 | Total reward = 47.42
2022-01-26 14:18:15.022 | DEBUG    | __main__:trials:24 - Trial = 22385/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.023 | DEBUG    | __main__:trials:29 - Trial = 22385/30000 | Total reward = 32.08
2022-01-26 14:18:15.026 | DEBUG    | __main__:trials:24 - Trial = 22386/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.028 | DEBUG    | __main__:trials:29 - Trial = 22386/30000 | Total reward = 34.64
2022-01-26 14:18:15.032 | DEBUG    | __main__:trials:24 - Trial = 22387/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.032 | DEBUG    | __main__:trials:29 - Trial = 22387/30000 | Total reward = 36.52
2022-01-26 14:18:15.037 | DEBUG    | __main__:trials:24 - Trial = 22388/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.038 | DEBUG    | __main__:trials:29 - Trial = 22388/30000 | Total reward = 41.44
2022-01-26 14:18:15.042 | DEBUG    | __main__:trials:24 - Trial = 22389/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.043 | DEBUG    | __main__:trials:29 - Trial = 22389/30000 | Total reward = 34.66
2022-01-26 14:18:15.047 | DEBUG    | __main__:trials:24 - Trial = 22390/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.048 | DEBUG    | __main__:trials:29 - Trial = 22390/30000 | Total reward = 44.35
2022-01-26 14:18:15.052 | DEBUG    | __main__:trials:24 - Trial = 22391/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.054 | DEBUG    | __main__:trials:29 - Trial = 22391/30000 | Total reward = 44.68
2022-01-26 14:18:15.057 | DEBUG    | __main__:trials:24 - Trial = 22392/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.059 | DEBUG    | __main__:trials:29 - Trial = 22392/30000 | Total reward = 32.73
2022-01-26 14:18:15.062 | DEBUG    | __main__:trials:24 - Trial = 22393/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.064 | DEBUG    | __main__:trials:29 - Trial = 22393/30000 | Total reward = 38.60
2022-01-26 14:18:15.067 | DEBUG    | __main__:trials:24 - Trial = 22394/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.069 | DEBUG    | __main__:trials:29 - Trial = 22394/30000 | Total reward = 34.71
2022-01-26 14:18:15.072 | DEBUG    | __main__:trials:24 - Trial = 22395/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.073 | DEBUG    | __main__:trials:29 - Trial = 22395/30000 | Total reward = 26.71
2022-01-26 14:18:15.076 | DEBUG    | __main__:trials:24 - Trial = 22396/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.078 | DEBUG    | __main__:trials:29 - Trial = 22396/30000 | Total reward = 42.10
2022-01-26 14:18:15.082 | DEBUG    | __main__:trials:24 - Trial = 22397/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.083 | DEBUG    | __main__:trials:29 - Trial = 22397/30000 | Total reward = 46.34
2022-01-26 14:18:15.087 | DEBUG    | __main__:trials:24 - Trial = 22398/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.088 | DEBUG    | __main__:trials:29 - Trial = 22398/30000 | Total reward = 40.09
2022-01-26 14:18:15.092 | DEBUG    | __main__:trials:24 - Trial = 22399/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.094 | DEBUG    | __main__:trials:29 - Trial = 22399/30000 | Total reward = 32.24
2022-01-26 14:18:15.097 | DEBUG    | __main__:trials:24 - Trial = 22400/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.099 | DEBUG    | __main__:trials:29 - Trial = 22400/30000 | Total reward = 52.41
2022-01-26 14:18:15.102 | DEBUG    | __main__:trials:24 - Trial = 22401/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.104 | DEBUG    | __main__:trials:29 - Trial = 22401/30000 | Total reward = 53.13
2022-01-26 14:18:15.107 | DEBUG    | __main__:trials:24 - Trial = 22402/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.108 | DEBUG    | __main__:trials:29 - Trial = 22402/30000 | Total reward = 49.38
2022-01-26 14:18:15.112 | DEBUG    | __main__:trials:24 - Trial = 22403/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.114 | DEBUG    | __main__:trials:29 - Trial = 22403/30000 | Total reward = 42.43
2022-01-26 14:18:15.117 | DEBUG    | __main__:trials:24 - Trial = 22404/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.118 | DEBUG    | __main__:trials:29 - Trial = 22404/30000 | Total reward = 40.14
2022-01-26 14:18:15.121 | DEBUG    | __main__:trials:24 - Trial = 22405/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.124 | DEBUG    | __main__:trials:29 - Trial = 22405/30000 | Total reward = 59.86
2022-01-26 14:18:15.126 | DEBUG    | __main__:trials:24 - Trial = 22406/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.128 | DEBUG    | __main__:trials:29 - Trial = 22406/30000 | Total reward = 32.27
2022-01-26 14:18:15.131 | DEBUG    | __main__:trials:24 - Trial = 22407/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.133 | DEBUG    | __main__:trials:29 - Trial = 22407/30000 | Total reward = 37.03
2022-01-26 14:18:15.136 | DEBUG    | __main__:trials:24 - Trial = 22408/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.137 | DEBUG    | __main__:trials:29 - Trial = 22408/30000 | Total reward = 33.09
2022-01-26 14:18:15.141 | DEBUG    | __main__:trials:24 - Trial = 22409/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.143 | DEBUG    | __main__:trials:29 - Trial = 22409/30000 | Total reward = 37.74
2022-01-26 14:18:15.146 | DEBUG    | __main__:trials:24 - Trial = 22410/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.148 | DEBUG    | __main__:trials:29 - Trial = 22410/30000 | Total reward = 42.31
2022-01-26 14:18:15.151 | DEBUG    | __main__:trials:26 - Trial = 22411/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:15.152 | DEBUG    | __main__:trials:29 - Trial = 22411/30000 | Total reward = 27.28
2022-01-26 14:18:15.156 | DEBUG    | __main__:trials:24 - Trial = 22412/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.157 | DEBUG    | __main__:trials:29 - Trial = 22412/30000 | Total reward = 56.81
2022-01-26 14:18:15.161 | DEBUG    | __main__:trials:24 - Trial = 22413/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.163 | DEBUG    | __main__:trials:29 - Trial = 22413/30000 | Total reward = 49.14
2022-01-26 14:18:15.166 | DEBUG    | __main__:trials:24 - Trial = 22414/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.167 | DEBUG    | __main__:trials:29 - Trial = 22414/30000 | Total reward = 35.59
2022-01-26 14:18:15.171 | DEBUG    | __main__:trials:24 - Trial = 22415/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.173 | DEBUG    | __main__:trials:29 - Trial = 22415/30000 | Total reward = 34.57
2022-01-26 14:18:15.176 | DEBUG    | __main__:trials:24 - Trial = 22416/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.178 | DEBUG    | __main__:trials:29 - Trial = 22416/30000 | Total reward = 41.79
2022-01-26 14:18:15.181 | DEBUG    | __main__:trials:24 - Trial = 22417/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.183 | DEBUG    | __main__:trials:29 - Trial = 22417/30000 | Total reward = 47.86
2022-01-26 14:18:15.187 | DEBUG    | __main__:trials:24 - Trial = 22418/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.187 | DEBUG    | __main__:trials:29 - Trial = 22418/30000 | Total reward = 54.47
2022-01-26 14:18:15.192 | DEBUG    | __main__:trials:24 - Trial = 22419/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.193 | DEBUG    | __main__:trials:29 - Trial = 22419/30000 | Total reward = 45.72
2022-01-26 14:18:15.196 | DEBUG    | __main__:trials:24 - Trial = 22420/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.198 | DEBUG    | __main__:trials:29 - Trial = 22420/30000 | Total reward = 48.25
2022-01-26 14:18:15.202 | DEBUG    | __main__:trials:24 - Trial = 22421/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.203 | DEBUG    | __main__:trials:29 - Trial = 22421/30000 | Total reward = 40.03
2022-01-26 14:18:15.206 | DEBUG    | __main__:trials:24 - Trial = 22422/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.208 | DEBUG    | __main__:trials:29 - Trial = 22422/30000 | Total reward = 20.44
2022-01-26 14:18:15.211 | DEBUG    | __main__:trials:24 - Trial = 22423/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.212 | DEBUG    | __main__:trials:29 - Trial = 22423/30000 | Total reward = 38.95
2022-01-26 14:18:15.216 | DEBUG    | __main__:trials:24 - Trial = 22424/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.217 | DEBUG    | __main__:trials:29 - Trial = 22424/30000 | Total reward = 45.81
2022-01-26 14:18:15.221 | DEBUG    | __main__:trials:24 - Trial = 22425/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.222 | DEBUG    | __main__:trials:29 - Trial = 22425/30000 | Total reward = 50.86
2022-01-26 14:18:15.227 | DEBUG    | __main__:trials:24 - Trial = 22426/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.228 | DEBUG    | __main__:trials:29 - Trial = 22426/30000 | Total reward = 32.04
2022-01-26 14:18:15.232 | DEBUG    | __main__:trials:24 - Trial = 22427/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.232 | DEBUG    | __main__:trials:29 - Trial = 22427/30000 | Total reward = 29.83
2022-01-26 14:18:15.236 | DEBUG    | __main__:trials:24 - Trial = 22428/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.237 | DEBUG    | __main__:trials:29 - Trial = 22428/30000 | Total reward = 49.67
2022-01-26 14:18:15.240 | DEBUG    | __main__:trials:24 - Trial = 22429/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.242 | DEBUG    | __main__:trials:29 - Trial = 22429/30000 | Total reward = 39.78
2022-01-26 14:18:15.245 | DEBUG    | __main__:trials:24 - Trial = 22430/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.246 | DEBUG    | __main__:trials:29 - Trial = 22430/30000 | Total reward = 34.28
2022-01-26 14:18:15.249 | DEBUG    | __main__:trials:24 - Trial = 22431/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.250 | DEBUG    | __main__:trials:29 - Trial = 22431/30000 | Total reward = 33.98
2022-01-26 14:18:15.254 | DEBUG    | __main__:trials:24 - Trial = 22432/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.254 | DEBUG    | __main__:trials:29 - Trial = 22432/30000 | Total reward = 47.34
2022-01-26 14:18:15.258 | DEBUG    | __main__:trials:24 - Trial = 22433/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.260 | DEBUG    | __main__:trials:29 - Trial = 22433/30000 | Total reward = 35.65
2022-01-26 14:18:15.263 | DEBUG    | __main__:trials:24 - Trial = 22434/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.264 | DEBUG    | __main__:trials:29 - Trial = 22434/30000 | Total reward = 39.30
2022-01-26 14:18:15.268 | DEBUG    | __main__:trials:24 - Trial = 22435/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.269 | DEBUG    | __main__:trials:29 - Trial = 22435/30000 | Total reward = 33.34
2022-01-26 14:18:15.273 | DEBUG    | __main__:trials:24 - Trial = 22436/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.274 | DEBUG    | __main__:trials:29 - Trial = 22436/30000 | Total reward = 32.46
2022-01-26 14:18:15.277 | DEBUG    | __main__:trials:24 - Trial = 22437/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.278 | DEBUG    | __main__:trials:29 - Trial = 22437/30000 | Total reward = 34.47
2022-01-26 14:18:15.283 | DEBUG    | __main__:trials:24 - Trial = 22438/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.284 | DEBUG    | __main__:trials:29 - Trial = 22438/30000 | Total reward = 43.19
2022-01-26 14:18:15.287 | DEBUG    | __main__:trials:24 - Trial = 22439/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.289 | DEBUG    | __main__:trials:29 - Trial = 22439/30000 | Total reward = 37.91
2022-01-26 14:18:15.292 | DEBUG    | __main__:trials:24 - Trial = 22440/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.294 | DEBUG    | __main__:trials:29 - Trial = 22440/30000 | Total reward = 30.12
2022-01-26 14:18:15.297 | DEBUG    | __main__:trials:24 - Trial = 22441/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.298 | DEBUG    | __main__:trials:29 - Trial = 22441/30000 | Total reward = 34.82
2022-01-26 14:18:15.302 | DEBUG    | __main__:trials:24 - Trial = 22442/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.304 | DEBUG    | __main__:trials:29 - Trial = 22442/30000 | Total reward = 36.75
2022-01-26 14:18:15.307 | DEBUG    | __main__:trials:24 - Trial = 22443/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.308 | DEBUG    | __main__:trials:29 - Trial = 22443/30000 | Total reward = 36.13
2022-01-26 14:18:15.311 | DEBUG    | __main__:trials:24 - Trial = 22444/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.313 | DEBUG    | __main__:trials:29 - Trial = 22444/30000 | Total reward = 37.48
2022-01-26 14:18:15.317 | DEBUG    | __main__:trials:24 - Trial = 22445/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.318 | DEBUG    | __main__:trials:29 - Trial = 22445/30000 | Total reward = 35.96
2022-01-26 14:18:15.322 | DEBUG    | __main__:trials:24 - Trial = 22446/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.324 | DEBUG    | __main__:trials:29 - Trial = 22446/30000 | Total reward = 39.21
2022-01-26 14:18:15.327 | DEBUG    | __main__:trials:24 - Trial = 22447/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.329 | DEBUG    | __main__:trials:29 - Trial = 22447/30000 | Total reward = 33.34
2022-01-26 14:18:15.332 | DEBUG    | __main__:trials:24 - Trial = 22448/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.334 | DEBUG    | __main__:trials:29 - Trial = 22448/30000 | Total reward = 40.44
2022-01-26 14:18:15.337 | DEBUG    | __main__:trials:24 - Trial = 22449/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.338 | DEBUG    | __main__:trials:29 - Trial = 22449/30000 | Total reward = 50.24
2022-01-26 14:18:15.343 | DEBUG    | __main__:trials:24 - Trial = 22450/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.344 | DEBUG    | __main__:trials:29 - Trial = 22450/30000 | Total reward = 26.61
2022-01-26 14:18:15.348 | DEBUG    | __main__:trials:24 - Trial = 22451/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.350 | DEBUG    | __main__:trials:29 - Trial = 22451/30000 | Total reward = 32.12
2022-01-26 14:18:15.353 | DEBUG    | __main__:trials:24 - Trial = 22452/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.354 | DEBUG    | __main__:trials:29 - Trial = 22452/30000 | Total reward = 34.73
2022-01-26 14:18:15.358 | DEBUG    | __main__:trials:24 - Trial = 22453/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.360 | DEBUG    | __main__:trials:29 - Trial = 22453/30000 | Total reward = 40.73
2022-01-26 14:18:15.363 | DEBUG    | __main__:trials:24 - Trial = 22454/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.364 | DEBUG    | __main__:trials:29 - Trial = 22454/30000 | Total reward = 41.01
2022-01-26 14:18:15.367 | DEBUG    | __main__:trials:24 - Trial = 22455/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.369 | DEBUG    | __main__:trials:29 - Trial = 22455/30000 | Total reward = 57.53
2022-01-26 14:18:15.372 | DEBUG    | __main__:trials:24 - Trial = 22456/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.374 | DEBUG    | __main__:trials:29 - Trial = 22456/30000 | Total reward = 39.59
2022-01-26 14:18:15.378 | DEBUG    | __main__:trials:24 - Trial = 22457/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.378 | DEBUG    | __main__:trials:29 - Trial = 22457/30000 | Total reward = 36.08
2022-01-26 14:18:15.382 | DEBUG    | __main__:trials:26 - Trial = 22458/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:15.383 | DEBUG    | __main__:trials:29 - Trial = 22458/30000 | Total reward = 25.54
2022-01-26 14:18:15.387 | DEBUG    | __main__:trials:24 - Trial = 22459/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.388 | DEBUG    | __main__:trials:29 - Trial = 22459/30000 | Total reward = 38.22
2022-01-26 14:18:15.392 | DEBUG    | __main__:trials:24 - Trial = 22460/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.393 | DEBUG    | __main__:trials:29 - Trial = 22460/30000 | Total reward = 36.42
2022-01-26 14:18:15.397 | DEBUG    | __main__:trials:24 - Trial = 22461/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.397 | DEBUG    | __main__:trials:29 - Trial = 22461/30000 | Total reward = 37.73
2022-01-26 14:18:15.401 | DEBUG    | __main__:trials:24 - Trial = 22462/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.401 | DEBUG    | __main__:trials:29 - Trial = 22462/30000 | Total reward = 53.26
2022-01-26 14:18:15.405 | DEBUG    | __main__:trials:24 - Trial = 22463/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.406 | DEBUG    | __main__:trials:29 - Trial = 22463/30000 | Total reward = 33.86
2022-01-26 14:18:15.409 | DEBUG    | __main__:trials:24 - Trial = 22464/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.411 | DEBUG    | __main__:trials:29 - Trial = 22464/30000 | Total reward = 33.95
2022-01-26 14:18:15.414 | DEBUG    | __main__:trials:24 - Trial = 22465/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.414 | DEBUG    | __main__:trials:29 - Trial = 22465/30000 | Total reward = 62.19
2022-01-26 14:18:15.418 | DEBUG    | __main__:trials:24 - Trial = 22466/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.419 | DEBUG    | __main__:trials:29 - Trial = 22466/30000 | Total reward = 64.67
2022-01-26 14:18:15.423 | DEBUG    | __main__:trials:24 - Trial = 22467/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.424 | DEBUG    | __main__:trials:29 - Trial = 22467/30000 | Total reward = 40.75
2022-01-26 14:18:15.427 | DEBUG    | __main__:trials:24 - Trial = 22468/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.429 | DEBUG    | __main__:trials:29 - Trial = 22468/30000 | Total reward = 39.41
2022-01-26 14:18:15.432 | DEBUG    | __main__:trials:24 - Trial = 22469/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.433 | DEBUG    | __main__:trials:29 - Trial = 22469/30000 | Total reward = 31.52
2022-01-26 14:18:15.436 | DEBUG    | __main__:trials:24 - Trial = 22470/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.438 | DEBUG    | __main__:trials:29 - Trial = 22470/30000 | Total reward = 52.72
2022-01-26 14:18:15.441 | DEBUG    | __main__:trials:24 - Trial = 22471/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.442 | DEBUG    | __main__:trials:29 - Trial = 22471/30000 | Total reward = 52.12
2022-01-26 14:18:15.446 | DEBUG    | __main__:trials:24 - Trial = 22472/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.448 | DEBUG    | __main__:trials:29 - Trial = 22472/30000 | Total reward = 39.50
2022-01-26 14:18:15.451 | DEBUG    | __main__:trials:24 - Trial = 22473/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.451 | DEBUG    | __main__:trials:29 - Trial = 22473/30000 | Total reward = 32.94
2022-01-26 14:18:15.455 | DEBUG    | __main__:trials:24 - Trial = 22474/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.457 | DEBUG    | __main__:trials:29 - Trial = 22474/30000 | Total reward = 33.15
2022-01-26 14:18:15.460 | DEBUG    | __main__:trials:24 - Trial = 22475/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.461 | DEBUG    | __main__:trials:29 - Trial = 22475/30000 | Total reward = 32.36
2022-01-26 14:18:15.464 | DEBUG    | __main__:trials:24 - Trial = 22476/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.466 | DEBUG    | __main__:trials:29 - Trial = 22476/30000 | Total reward = 62.45
2022-01-26 14:18:15.469 | DEBUG    | __main__:trials:24 - Trial = 22477/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.469 | DEBUG    | __main__:trials:29 - Trial = 22477/30000 | Total reward = 33.61
2022-01-26 14:18:15.473 | DEBUG    | __main__:trials:24 - Trial = 22478/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.474 | DEBUG    | __main__:trials:29 - Trial = 22478/30000 | Total reward = 42.86
2022-01-26 14:18:15.477 | DEBUG    | __main__:trials:24 - Trial = 22479/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.479 | DEBUG    | __main__:trials:29 - Trial = 22479/30000 | Total reward = 49.84
2022-01-26 14:18:15.482 | DEBUG    | __main__:trials:24 - Trial = 22480/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.483 | DEBUG    | __main__:trials:29 - Trial = 22480/30000 | Total reward = 36.46
2022-01-26 14:18:15.486 | DEBUG    | __main__:trials:24 - Trial = 22481/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.488 | DEBUG    | __main__:trials:29 - Trial = 22481/30000 | Total reward = 40.51
2022-01-26 14:18:15.491 | DEBUG    | __main__:trials:24 - Trial = 22482/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.492 | DEBUG    | __main__:trials:29 - Trial = 22482/30000 | Total reward = 37.86
2022-01-26 14:18:15.495 | DEBUG    | __main__:trials:24 - Trial = 22483/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.497 | DEBUG    | __main__:trials:29 - Trial = 22483/30000 | Total reward = 40.76
2022-01-26 14:18:15.500 | DEBUG    | __main__:trials:24 - Trial = 22484/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.502 | DEBUG    | __main__:trials:29 - Trial = 22484/30000 | Total reward = 44.45
2022-01-26 14:18:15.505 | DEBUG    | __main__:trials:24 - Trial = 22485/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.506 | DEBUG    | __main__:trials:29 - Trial = 22485/30000 | Total reward = 38.39
2022-01-26 14:18:15.509 | DEBUG    | __main__:trials:24 - Trial = 22486/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.510 | DEBUG    | __main__:trials:29 - Trial = 22486/30000 | Total reward = 38.25
2022-01-26 14:18:15.513 | DEBUG    | __main__:trials:24 - Trial = 22487/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.514 | DEBUG    | __main__:trials:29 - Trial = 22487/30000 | Total reward = 33.05
2022-01-26 14:18:15.517 | DEBUG    | __main__:trials:24 - Trial = 22488/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.518 | DEBUG    | __main__:trials:29 - Trial = 22488/30000 | Total reward = 54.27
2022-01-26 14:18:15.521 | DEBUG    | __main__:trials:24 - Trial = 22489/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.523 | DEBUG    | __main__:trials:29 - Trial = 22489/30000 | Total reward = 54.05
2022-01-26 14:18:15.527 | DEBUG    | __main__:trials:24 - Trial = 22490/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.528 | DEBUG    | __main__:trials:29 - Trial = 22490/30000 | Total reward = 34.53
2022-01-26 14:18:15.531 | DEBUG    | __main__:trials:24 - Trial = 22491/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.532 | DEBUG    | __main__:trials:29 - Trial = 22491/30000 | Total reward = 41.69
2022-01-26 14:18:15.536 | DEBUG    | __main__:trials:24 - Trial = 22492/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.537 | DEBUG    | __main__:trials:29 - Trial = 22492/30000 | Total reward = 35.32
2022-01-26 14:18:15.540 | DEBUG    | __main__:trials:24 - Trial = 22493/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.542 | DEBUG    | __main__:trials:29 - Trial = 22493/30000 | Total reward = 40.39
2022-01-26 14:18:15.545 | DEBUG    | __main__:trials:24 - Trial = 22494/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.546 | DEBUG    | __main__:trials:29 - Trial = 22494/30000 | Total reward = 41.01
2022-01-26 14:18:15.549 | DEBUG    | __main__:trials:24 - Trial = 22495/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.551 | DEBUG    | __main__:trials:29 - Trial = 22495/30000 | Total reward = 62.28
2022-01-26 14:18:15.554 | DEBUG    | __main__:trials:24 - Trial = 22496/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.555 | DEBUG    | __main__:trials:29 - Trial = 22496/30000 | Total reward = 52.03
2022-01-26 14:18:15.558 | DEBUG    | __main__:trials:24 - Trial = 22497/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.559 | DEBUG    | __main__:trials:29 - Trial = 22497/30000 | Total reward = 43.64
2022-01-26 14:18:15.563 | DEBUG    | __main__:trials:24 - Trial = 22498/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.564 | DEBUG    | __main__:trials:29 - Trial = 22498/30000 | Total reward = 36.64
2022-01-26 14:18:15.567 | DEBUG    | __main__:trials:24 - Trial = 22499/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.569 | DEBUG    | __main__:trials:29 - Trial = 22499/30000 | Total reward = 40.34
2022-01-26 14:18:15.572 | DEBUG    | __main__:trials:24 - Trial = 22500/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.574 | DEBUG    | __main__:trials:29 - Trial = 22500/30000 | Total reward = 40.48
2022-01-26 14:18:15.577 | DEBUG    | __main__:trials:24 - Trial = 22501/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.578 | DEBUG    | __main__:trials:29 - Trial = 22501/30000 | Total reward = 54.67
2022-01-26 14:18:15.582 | DEBUG    | __main__:trials:24 - Trial = 22502/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.583 | DEBUG    | __main__:trials:29 - Trial = 22502/30000 | Total reward = 52.70
2022-01-26 14:18:15.586 | DEBUG    | __main__:trials:24 - Trial = 22503/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.588 | DEBUG    | __main__:trials:29 - Trial = 22503/30000 | Total reward = 59.63
2022-01-26 14:18:15.590 | DEBUG    | __main__:trials:24 - Trial = 22504/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.591 | DEBUG    | __main__:trials:29 - Trial = 22504/30000 | Total reward = 55.96
2022-01-26 14:18:15.595 | DEBUG    | __main__:trials:24 - Trial = 22505/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.596 | DEBUG    | __main__:trials:29 - Trial = 22505/30000 | Total reward = 56.45
2022-01-26 14:18:15.599 | DEBUG    | __main__:trials:24 - Trial = 22506/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.601 | DEBUG    | __main__:trials:29 - Trial = 22506/30000 | Total reward = 56.28
2022-01-26 14:18:15.605 | DEBUG    | __main__:trials:24 - Trial = 22507/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.606 | DEBUG    | __main__:trials:29 - Trial = 22507/30000 | Total reward = 43.43
2022-01-26 14:18:15.609 | DEBUG    | __main__:trials:24 - Trial = 22508/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.610 | DEBUG    | __main__:trials:29 - Trial = 22508/30000 | Total reward = 63.56
2022-01-26 14:18:15.614 | DEBUG    | __main__:trials:24 - Trial = 22509/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.615 | DEBUG    | __main__:trials:29 - Trial = 22509/30000 | Total reward = 33.23
2022-01-26 14:18:15.618 | DEBUG    | __main__:trials:24 - Trial = 22510/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.619 | DEBUG    | __main__:trials:29 - Trial = 22510/30000 | Total reward = 52.52
2022-01-26 14:18:15.622 | DEBUG    | __main__:trials:26 - Trial = 22511/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:15.624 | DEBUG    | __main__:trials:29 - Trial = 22511/30000 | Total reward = 33.51
2022-01-26 14:18:15.628 | DEBUG    | __main__:trials:24 - Trial = 22512/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.629 | DEBUG    | __main__:trials:29 - Trial = 22512/30000 | Total reward = 41.77
2022-01-26 14:18:15.632 | DEBUG    | __main__:trials:24 - Trial = 22513/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.633 | DEBUG    | __main__:trials:29 - Trial = 22513/30000 | Total reward = 40.97
2022-01-26 14:18:15.636 | DEBUG    | __main__:trials:24 - Trial = 22514/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.637 | DEBUG    | __main__:trials:29 - Trial = 22514/30000 | Total reward = 39.95
2022-01-26 14:18:15.640 | DEBUG    | __main__:trials:24 - Trial = 22515/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.641 | DEBUG    | __main__:trials:29 - Trial = 22515/30000 | Total reward = 41.44
2022-01-26 14:18:15.644 | DEBUG    | __main__:trials:24 - Trial = 22516/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.646 | DEBUG    | __main__:trials:29 - Trial = 22516/30000 | Total reward = 42.40
2022-01-26 14:18:15.649 | DEBUG    | __main__:trials:24 - Trial = 22517/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.650 | DEBUG    | __main__:trials:29 - Trial = 22517/30000 | Total reward = 40.38
2022-01-26 14:18:15.653 | DEBUG    | __main__:trials:24 - Trial = 22518/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.654 | DEBUG    | __main__:trials:29 - Trial = 22518/30000 | Total reward = 37.05
2022-01-26 14:18:15.657 | DEBUG    | __main__:trials:24 - Trial = 22519/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.658 | DEBUG    | __main__:trials:29 - Trial = 22519/30000 | Total reward = 40.08
2022-01-26 14:18:15.661 | DEBUG    | __main__:trials:24 - Trial = 22520/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.662 | DEBUG    | __main__:trials:29 - Trial = 22520/30000 | Total reward = 39.68
2022-01-26 14:18:15.666 | DEBUG    | __main__:trials:24 - Trial = 22521/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.667 | DEBUG    | __main__:trials:29 - Trial = 22521/30000 | Total reward = 47.84
2022-01-26 14:18:15.670 | DEBUG    | __main__:trials:24 - Trial = 22522/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.672 | DEBUG    | __main__:trials:29 - Trial = 22522/30000 | Total reward = 39.87
2022-01-26 14:18:15.675 | DEBUG    | __main__:trials:24 - Trial = 22523/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.675 | DEBUG    | __main__:trials:29 - Trial = 22523/30000 | Total reward = 45.42
2022-01-26 14:18:15.679 | DEBUG    | __main__:trials:24 - Trial = 22524/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.681 | DEBUG    | __main__:trials:29 - Trial = 22524/30000 | Total reward = 40.39
2022-01-26 14:18:15.683 | DEBUG    | __main__:trials:24 - Trial = 22525/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.685 | DEBUG    | __main__:trials:29 - Trial = 22525/30000 | Total reward = 32.57
2022-01-26 14:18:15.688 | DEBUG    | __main__:trials:24 - Trial = 22526/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.690 | DEBUG    | __main__:trials:29 - Trial = 22526/30000 | Total reward = 41.05
2022-01-26 14:18:15.693 | DEBUG    | __main__:trials:24 - Trial = 22527/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.693 | DEBUG    | __main__:trials:29 - Trial = 22527/30000 | Total reward = 38.53
2022-01-26 14:18:15.697 | DEBUG    | __main__:trials:24 - Trial = 22528/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.698 | DEBUG    | __main__:trials:29 - Trial = 22528/30000 | Total reward = 42.68
2022-01-26 14:18:15.701 | DEBUG    | __main__:trials:24 - Trial = 22529/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.703 | DEBUG    | __main__:trials:29 - Trial = 22529/30000 | Total reward = 48.92
2022-01-26 14:18:15.707 | DEBUG    | __main__:trials:24 - Trial = 22530/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.707 | DEBUG    | __main__:trials:29 - Trial = 22530/30000 | Total reward = 43.29
2022-01-26 14:18:15.711 | DEBUG    | __main__:trials:24 - Trial = 22531/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.713 | DEBUG    | __main__:trials:29 - Trial = 22531/30000 | Total reward = 44.42
2022-01-26 14:18:15.715 | DEBUG    | __main__:trials:24 - Trial = 22532/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.716 | DEBUG    | __main__:trials:29 - Trial = 22532/30000 | Total reward = 44.22
2022-01-26 14:18:15.720 | DEBUG    | __main__:trials:24 - Trial = 22533/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.720 | DEBUG    | __main__:trials:29 - Trial = 22533/30000 | Total reward = 40.93
2022-01-26 14:18:15.724 | DEBUG    | __main__:trials:24 - Trial = 22534/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.725 | DEBUG    | __main__:trials:29 - Trial = 22534/30000 | Total reward = 36.07
2022-01-26 14:18:15.728 | DEBUG    | __main__:trials:24 - Trial = 22535/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.730 | DEBUG    | __main__:trials:29 - Trial = 22535/30000 | Total reward = 39.77
2022-01-26 14:18:15.733 | DEBUG    | __main__:trials:24 - Trial = 22536/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.734 | DEBUG    | __main__:trials:29 - Trial = 22536/30000 | Total reward = 52.18
2022-01-26 14:18:15.737 | DEBUG    | __main__:trials:24 - Trial = 22537/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.739 | DEBUG    | __main__:trials:29 - Trial = 22537/30000 | Total reward = 41.04
2022-01-26 14:18:15.742 | DEBUG    | __main__:trials:24 - Trial = 22538/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.742 | DEBUG    | __main__:trials:29 - Trial = 22538/30000 | Total reward = 39.49
2022-01-26 14:18:15.746 | DEBUG    | __main__:trials:24 - Trial = 22539/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.746 | DEBUG    | __main__:trials:29 - Trial = 22539/30000 | Total reward = 39.01
2022-01-26 14:18:15.750 | DEBUG    | __main__:trials:24 - Trial = 22540/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.752 | DEBUG    | __main__:trials:29 - Trial = 22540/30000 | Total reward = 39.88
2022-01-26 14:18:15.755 | DEBUG    | __main__:trials:24 - Trial = 22541/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.755 | DEBUG    | __main__:trials:29 - Trial = 22541/30000 | Total reward = 51.30
2022-01-26 14:18:15.759 | DEBUG    | __main__:trials:24 - Trial = 22542/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.761 | DEBUG    | __main__:trials:29 - Trial = 22542/30000 | Total reward = 40.03
2022-01-26 14:18:15.763 | DEBUG    | __main__:trials:24 - Trial = 22543/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.765 | DEBUG    | __main__:trials:29 - Trial = 22543/30000 | Total reward = 60.50
2022-01-26 14:18:15.768 | DEBUG    | __main__:trials:24 - Trial = 22544/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.771 | DEBUG    | __main__:trials:29 - Trial = 22544/30000 | Total reward = 40.63
2022-01-26 14:18:15.774 | DEBUG    | __main__:trials:24 - Trial = 22545/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.774 | DEBUG    | __main__:trials:29 - Trial = 22545/30000 | Total reward = 51.72
2022-01-26 14:18:15.778 | DEBUG    | __main__:trials:24 - Trial = 22546/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.780 | DEBUG    | __main__:trials:29 - Trial = 22546/30000 | Total reward = 62.57
2022-01-26 14:18:15.783 | DEBUG    | __main__:trials:24 - Trial = 22547/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.783 | DEBUG    | __main__:trials:29 - Trial = 22547/30000 | Total reward = 46.76
2022-01-26 14:18:15.787 | DEBUG    | __main__:trials:24 - Trial = 22548/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.788 | DEBUG    | __main__:trials:29 - Trial = 22548/30000 | Total reward = 39.49
2022-01-26 14:18:15.791 | DEBUG    | __main__:trials:24 - Trial = 22549/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.793 | DEBUG    | __main__:trials:29 - Trial = 22549/30000 | Total reward = 48.31
2022-01-26 14:18:15.796 | DEBUG    | __main__:trials:26 - Trial = 22550/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:15.797 | DEBUG    | __main__:trials:29 - Trial = 22550/30000 | Total reward = 23.95
2022-01-26 14:18:15.800 | DEBUG    | __main__:trials:24 - Trial = 22551/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.801 | DEBUG    | __main__:trials:29 - Trial = 22551/30000 | Total reward = 26.37
2022-01-26 14:18:15.804 | DEBUG    | __main__:trials:24 - Trial = 22552/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.805 | DEBUG    | __main__:trials:29 - Trial = 22552/30000 | Total reward = 42.30
2022-01-26 14:18:15.808 | DEBUG    | __main__:trials:24 - Trial = 22553/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.809 | DEBUG    | __main__:trials:29 - Trial = 22553/30000 | Total reward = 60.33
2022-01-26 14:18:15.812 | DEBUG    | __main__:trials:24 - Trial = 22554/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.814 | DEBUG    | __main__:trials:29 - Trial = 22554/30000 | Total reward = 35.90
2022-01-26 14:18:15.817 | DEBUG    | __main__:trials:24 - Trial = 22555/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.819 | DEBUG    | __main__:trials:29 - Trial = 22555/30000 | Total reward = 46.80
2022-01-26 14:18:15.823 | DEBUG    | __main__:trials:24 - Trial = 22556/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.824 | DEBUG    | __main__:trials:29 - Trial = 22556/30000 | Total reward = 49.85
2022-01-26 14:18:15.828 | DEBUG    | __main__:trials:24 - Trial = 22557/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.829 | DEBUG    | __main__:trials:29 - Trial = 22557/30000 | Total reward = 61.76
2022-01-26 14:18:15.833 | DEBUG    | __main__:trials:24 - Trial = 22558/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.834 | DEBUG    | __main__:trials:29 - Trial = 22558/30000 | Total reward = 38.15
2022-01-26 14:18:15.837 | DEBUG    | __main__:trials:24 - Trial = 22559/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.839 | DEBUG    | __main__:trials:29 - Trial = 22559/30000 | Total reward = 39.58
2022-01-26 14:18:15.843 | DEBUG    | __main__:trials:24 - Trial = 22560/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.845 | DEBUG    | __main__:trials:29 - Trial = 22560/30000 | Total reward = 36.57
2022-01-26 14:18:15.848 | DEBUG    | __main__:trials:24 - Trial = 22561/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.850 | DEBUG    | __main__:trials:29 - Trial = 22561/30000 | Total reward = 43.44
2022-01-26 14:18:15.854 | DEBUG    | __main__:trials:24 - Trial = 22562/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.855 | DEBUG    | __main__:trials:29 - Trial = 22562/30000 | Total reward = 68.35
2022-01-26 14:18:15.859 | DEBUG    | __main__:trials:24 - Trial = 22563/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.861 | DEBUG    | __main__:trials:29 - Trial = 22563/30000 | Total reward = 32.89
2022-01-26 14:18:15.864 | DEBUG    | __main__:trials:26 - Trial = 22564/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:15.865 | DEBUG    | __main__:trials:29 - Trial = 22564/30000 | Total reward = 25.89
2022-01-26 14:18:15.869 | DEBUG    | __main__:trials:24 - Trial = 22565/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.871 | DEBUG    | __main__:trials:29 - Trial = 22565/30000 | Total reward = 46.65
2022-01-26 14:18:15.875 | DEBUG    | __main__:trials:24 - Trial = 22566/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.875 | DEBUG    | __main__:trials:29 - Trial = 22566/30000 | Total reward = 36.87
2022-01-26 14:18:15.880 | DEBUG    | __main__:trials:24 - Trial = 22567/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.882 | DEBUG    | __main__:trials:29 - Trial = 22567/30000 | Total reward = 26.62
2022-01-26 14:18:15.885 | DEBUG    | __main__:trials:24 - Trial = 22568/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.887 | DEBUG    | __main__:trials:29 - Trial = 22568/30000 | Total reward = 61.28
2022-01-26 14:18:15.890 | DEBUG    | __main__:trials:24 - Trial = 22569/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.892 | DEBUG    | __main__:trials:29 - Trial = 22569/30000 | Total reward = 61.28
2022-01-26 14:18:15.895 | DEBUG    | __main__:trials:24 - Trial = 22570/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.896 | DEBUG    | __main__:trials:29 - Trial = 22570/30000 | Total reward = 39.51
2022-01-26 14:18:15.900 | DEBUG    | __main__:trials:24 - Trial = 22571/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.902 | DEBUG    | __main__:trials:29 - Trial = 22571/30000 | Total reward = 39.40
2022-01-26 14:18:15.905 | DEBUG    | __main__:trials:24 - Trial = 22572/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.906 | DEBUG    | __main__:trials:29 - Trial = 22572/30000 | Total reward = 36.15
2022-01-26 14:18:15.910 | DEBUG    | __main__:trials:24 - Trial = 22573/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.912 | DEBUG    | __main__:trials:29 - Trial = 22573/30000 | Total reward = 39.80
2022-01-26 14:18:15.916 | DEBUG    | __main__:trials:24 - Trial = 22574/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.918 | DEBUG    | __main__:trials:29 - Trial = 22574/30000 | Total reward = 43.35
2022-01-26 14:18:15.922 | DEBUG    | __main__:trials:24 - Trial = 22575/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.923 | DEBUG    | __main__:trials:29 - Trial = 22575/30000 | Total reward = 53.84
2022-01-26 14:18:15.927 | DEBUG    | __main__:trials:24 - Trial = 22576/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.928 | DEBUG    | __main__:trials:29 - Trial = 22576/30000 | Total reward = 40.69
2022-01-26 14:18:15.932 | DEBUG    | __main__:trials:24 - Trial = 22577/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.933 | DEBUG    | __main__:trials:29 - Trial = 22577/30000 | Total reward = 31.03
2022-01-26 14:18:15.936 | DEBUG    | __main__:trials:24 - Trial = 22578/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.938 | DEBUG    | __main__:trials:29 - Trial = 22578/30000 | Total reward = 45.58
2022-01-26 14:18:15.941 | DEBUG    | __main__:trials:24 - Trial = 22579/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.943 | DEBUG    | __main__:trials:29 - Trial = 22579/30000 | Total reward = 25.42
2022-01-26 14:18:15.947 | DEBUG    | __main__:trials:24 - Trial = 22580/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.948 | DEBUG    | __main__:trials:29 - Trial = 22580/30000 | Total reward = 40.21
2022-01-26 14:18:15.951 | DEBUG    | __main__:trials:24 - Trial = 22581/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.952 | DEBUG    | __main__:trials:29 - Trial = 22581/30000 | Total reward = 36.39
2022-01-26 14:18:15.956 | DEBUG    | __main__:trials:24 - Trial = 22582/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.957 | DEBUG    | __main__:trials:29 - Trial = 22582/30000 | Total reward = 46.23
2022-01-26 14:18:15.962 | DEBUG    | __main__:trials:24 - Trial = 22583/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.963 | DEBUG    | __main__:trials:29 - Trial = 22583/30000 | Total reward = 40.62
2022-01-26 14:18:15.966 | DEBUG    | __main__:trials:24 - Trial = 22584/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.968 | DEBUG    | __main__:trials:29 - Trial = 22584/30000 | Total reward = 38.53
2022-01-26 14:18:15.972 | DEBUG    | __main__:trials:24 - Trial = 22585/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.973 | DEBUG    | __main__:trials:29 - Trial = 22585/30000 | Total reward = 42.86
2022-01-26 14:18:15.977 | DEBUG    | __main__:trials:24 - Trial = 22586/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.979 | DEBUG    | __main__:trials:29 - Trial = 22586/30000 | Total reward = 32.82
2022-01-26 14:18:15.983 | DEBUG    | __main__:trials:24 - Trial = 22587/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.984 | DEBUG    | __main__:trials:29 - Trial = 22587/30000 | Total reward = 43.08
2022-01-26 14:18:15.988 | DEBUG    | __main__:trials:24 - Trial = 22588/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.990 | DEBUG    | __main__:trials:29 - Trial = 22588/30000 | Total reward = 42.63
2022-01-26 14:18:15.993 | DEBUG    | __main__:trials:24 - Trial = 22589/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.995 | DEBUG    | __main__:trials:29 - Trial = 22589/30000 | Total reward = 53.06
2022-01-26 14:18:15.999 | DEBUG    | __main__:trials:24 - Trial = 22590/30000 | Max number of steps (20) reached
2022-01-26 14:18:15.999 | DEBUG    | __main__:trials:29 - Trial = 22590/30000 | Total reward = 35.08
2022-01-26 14:18:16.004 | DEBUG    | __main__:trials:24 - Trial = 22591/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.005 | DEBUG    | __main__:trials:29 - Trial = 22591/30000 | Total reward = 47.19
2022-01-26 14:18:16.009 | DEBUG    | __main__:trials:24 - Trial = 22592/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.010 | DEBUG    | __main__:trials:29 - Trial = 22592/30000 | Total reward = 42.49
2022-01-26 14:18:16.013 | DEBUG    | __main__:trials:26 - Trial = 22593/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.015 | DEBUG    | __main__:trials:29 - Trial = 22593/30000 | Total reward = 20.07
2022-01-26 14:18:16.017 | DEBUG    | __main__:trials:26 - Trial = 22594/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.018 | DEBUG    | __main__:trials:29 - Trial = 22594/30000 | Total reward = 21.03
2022-01-26 14:18:16.021 | DEBUG    | __main__:trials:24 - Trial = 22595/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.023 | DEBUG    | __main__:trials:29 - Trial = 22595/30000 | Total reward = 39.85
2022-01-26 14:18:16.026 | DEBUG    | __main__:trials:24 - Trial = 22596/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.027 | DEBUG    | __main__:trials:29 - Trial = 22596/30000 | Total reward = 55.02
2022-01-26 14:18:16.031 | DEBUG    | __main__:trials:24 - Trial = 22597/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.032 | DEBUG    | __main__:trials:29 - Trial = 22597/30000 | Total reward = 47.03
2022-01-26 14:18:16.036 | DEBUG    | __main__:trials:24 - Trial = 22598/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.037 | DEBUG    | __main__:trials:29 - Trial = 22598/30000 | Total reward = 30.72
2022-01-26 14:18:16.041 | DEBUG    | __main__:trials:24 - Trial = 22599/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.043 | DEBUG    | __main__:trials:29 - Trial = 22599/30000 | Total reward = 50.75
2022-01-26 14:18:16.047 | DEBUG    | __main__:trials:26 - Trial = 22600/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.048 | DEBUG    | __main__:trials:29 - Trial = 22600/30000 | Total reward = 35.36
2022-01-26 14:18:16.052 | DEBUG    | __main__:trials:24 - Trial = 22601/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.053 | DEBUG    | __main__:trials:29 - Trial = 22601/30000 | Total reward = 34.92
2022-01-26 14:18:16.056 | DEBUG    | __main__:trials:24 - Trial = 22602/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.057 | DEBUG    | __main__:trials:29 - Trial = 22602/30000 | Total reward = 45.87
2022-01-26 14:18:16.062 | DEBUG    | __main__:trials:24 - Trial = 22603/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.063 | DEBUG    | __main__:trials:29 - Trial = 22603/30000 | Total reward = 37.25
2022-01-26 14:18:16.068 | DEBUG    | __main__:trials:24 - Trial = 22604/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.069 | DEBUG    | __main__:trials:29 - Trial = 22604/30000 | Total reward = 44.75
2022-01-26 14:18:16.072 | DEBUG    | __main__:trials:24 - Trial = 22605/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.074 | DEBUG    | __main__:trials:29 - Trial = 22605/30000 | Total reward = 53.43
2022-01-26 14:18:16.078 | DEBUG    | __main__:trials:24 - Trial = 22606/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.080 | DEBUG    | __main__:trials:29 - Trial = 22606/30000 | Total reward = 36.83
2022-01-26 14:18:16.083 | DEBUG    | __main__:trials:24 - Trial = 22607/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.084 | DEBUG    | __main__:trials:29 - Trial = 22607/30000 | Total reward = 38.75
2022-01-26 14:18:16.088 | DEBUG    | __main__:trials:24 - Trial = 22608/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.090 | DEBUG    | __main__:trials:29 - Trial = 22608/30000 | Total reward = 36.17
2022-01-26 14:18:16.094 | DEBUG    | __main__:trials:24 - Trial = 22609/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.095 | DEBUG    | __main__:trials:29 - Trial = 22609/30000 | Total reward = 39.29
2022-01-26 14:18:16.099 | DEBUG    | __main__:trials:24 - Trial = 22610/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.100 | DEBUG    | __main__:trials:29 - Trial = 22610/30000 | Total reward = 40.57
2022-01-26 14:18:16.104 | DEBUG    | __main__:trials:24 - Trial = 22611/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.105 | DEBUG    | __main__:trials:29 - Trial = 22611/30000 | Total reward = 40.64
2022-01-26 14:18:16.109 | DEBUG    | __main__:trials:24 - Trial = 22612/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.111 | DEBUG    | __main__:trials:29 - Trial = 22612/30000 | Total reward = 38.27
2022-01-26 14:18:16.114 | DEBUG    | __main__:trials:24 - Trial = 22613/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.115 | DEBUG    | __main__:trials:29 - Trial = 22613/30000 | Total reward = 42.92
2022-01-26 14:18:16.119 | DEBUG    | __main__:trials:24 - Trial = 22614/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.120 | DEBUG    | __main__:trials:29 - Trial = 22614/30000 | Total reward = 54.48
2022-01-26 14:18:16.124 | DEBUG    | __main__:trials:24 - Trial = 22615/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.126 | DEBUG    | __main__:trials:29 - Trial = 22615/30000 | Total reward = 62.24
2022-01-26 14:18:16.130 | DEBUG    | __main__:trials:24 - Trial = 22616/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.131 | DEBUG    | __main__:trials:29 - Trial = 22616/30000 | Total reward = 60.61
2022-01-26 14:18:16.135 | DEBUG    | __main__:trials:24 - Trial = 22617/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.136 | DEBUG    | __main__:trials:29 - Trial = 22617/30000 | Total reward = 34.36
2022-01-26 14:18:16.140 | DEBUG    | __main__:trials:24 - Trial = 22618/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.142 | DEBUG    | __main__:trials:29 - Trial = 22618/30000 | Total reward = 40.14
2022-01-26 14:18:16.146 | DEBUG    | __main__:trials:24 - Trial = 22619/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.147 | DEBUG    | __main__:trials:29 - Trial = 22619/30000 | Total reward = 38.28
2022-01-26 14:18:16.151 | DEBUG    | __main__:trials:24 - Trial = 22620/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.152 | DEBUG    | __main__:trials:29 - Trial = 22620/30000 | Total reward = 41.18
2022-01-26 14:18:16.156 | DEBUG    | __main__:trials:24 - Trial = 22621/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.158 | DEBUG    | __main__:trials:29 - Trial = 22621/30000 | Total reward = 29.19
2022-01-26 14:18:16.161 | DEBUG    | __main__:trials:24 - Trial = 22622/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.162 | DEBUG    | __main__:trials:29 - Trial = 22622/30000 | Total reward = 53.08
2022-01-26 14:18:16.166 | DEBUG    | __main__:trials:24 - Trial = 22623/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.167 | DEBUG    | __main__:trials:29 - Trial = 22623/30000 | Total reward = 26.30
2022-01-26 14:18:16.171 | DEBUG    | __main__:trials:24 - Trial = 22624/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.172 | DEBUG    | __main__:trials:29 - Trial = 22624/30000 | Total reward = 38.15
2022-01-26 14:18:16.176 | DEBUG    | __main__:trials:24 - Trial = 22625/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.177 | DEBUG    | __main__:trials:29 - Trial = 22625/30000 | Total reward = 33.26
2022-01-26 14:18:16.181 | DEBUG    | __main__:trials:24 - Trial = 22626/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.181 | DEBUG    | __main__:trials:29 - Trial = 22626/30000 | Total reward = 46.83
2022-01-26 14:18:16.186 | DEBUG    | __main__:trials:24 - Trial = 22627/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.186 | DEBUG    | __main__:trials:29 - Trial = 22627/30000 | Total reward = 38.90
2022-01-26 14:18:16.191 | DEBUG    | __main__:trials:24 - Trial = 22628/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.192 | DEBUG    | __main__:trials:29 - Trial = 22628/30000 | Total reward = 37.94
2022-01-26 14:18:16.196 | DEBUG    | __main__:trials:24 - Trial = 22629/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.197 | DEBUG    | __main__:trials:29 - Trial = 22629/30000 | Total reward = 37.28
2022-01-26 14:18:16.201 | DEBUG    | __main__:trials:24 - Trial = 22630/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.202 | DEBUG    | __main__:trials:29 - Trial = 22630/30000 | Total reward = 42.71
2022-01-26 14:18:16.207 | DEBUG    | __main__:trials:24 - Trial = 22631/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.208 | DEBUG    | __main__:trials:29 - Trial = 22631/30000 | Total reward = 53.62
2022-01-26 14:18:16.212 | DEBUG    | __main__:trials:24 - Trial = 22632/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.213 | DEBUG    | __main__:trials:29 - Trial = 22632/30000 | Total reward = 31.57
2022-01-26 14:18:16.216 | DEBUG    | __main__:trials:24 - Trial = 22633/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.217 | DEBUG    | __main__:trials:29 - Trial = 22633/30000 | Total reward = 41.50
2022-01-26 14:18:16.221 | DEBUG    | __main__:trials:24 - Trial = 22634/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.222 | DEBUG    | __main__:trials:29 - Trial = 22634/30000 | Total reward = 42.99
2022-01-26 14:18:16.226 | DEBUG    | __main__:trials:24 - Trial = 22635/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.227 | DEBUG    | __main__:trials:29 - Trial = 22635/30000 | Total reward = 41.96
2022-01-26 14:18:16.230 | DEBUG    | __main__:trials:24 - Trial = 22636/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.232 | DEBUG    | __main__:trials:29 - Trial = 22636/30000 | Total reward = 42.49
2022-01-26 14:18:16.235 | DEBUG    | __main__:trials:24 - Trial = 22637/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.237 | DEBUG    | __main__:trials:29 - Trial = 22637/30000 | Total reward = 49.66
2022-01-26 14:18:16.240 | DEBUG    | __main__:trials:24 - Trial = 22638/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.242 | DEBUG    | __main__:trials:29 - Trial = 22638/30000 | Total reward = 38.10
2022-01-26 14:18:16.246 | DEBUG    | __main__:trials:24 - Trial = 22639/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.246 | DEBUG    | __main__:trials:29 - Trial = 22639/30000 | Total reward = 31.31
2022-01-26 14:18:16.250 | DEBUG    | __main__:trials:24 - Trial = 22640/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.252 | DEBUG    | __main__:trials:29 - Trial = 22640/30000 | Total reward = 45.27
2022-01-26 14:18:16.256 | DEBUG    | __main__:trials:24 - Trial = 22641/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.257 | DEBUG    | __main__:trials:29 - Trial = 22641/30000 | Total reward = 40.50
2022-01-26 14:18:16.261 | DEBUG    | __main__:trials:24 - Trial = 22642/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.262 | DEBUG    | __main__:trials:29 - Trial = 22642/30000 | Total reward = 47.22
2022-01-26 14:18:16.266 | DEBUG    | __main__:trials:24 - Trial = 22643/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.268 | DEBUG    | __main__:trials:29 - Trial = 22643/30000 | Total reward = 40.66
2022-01-26 14:18:16.272 | DEBUG    | __main__:trials:24 - Trial = 22644/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.272 | DEBUG    | __main__:trials:29 - Trial = 22644/30000 | Total reward = 51.62
2022-01-26 14:18:16.276 | DEBUG    | __main__:trials:24 - Trial = 22645/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.277 | DEBUG    | __main__:trials:29 - Trial = 22645/30000 | Total reward = 41.08
2022-01-26 14:18:16.281 | DEBUG    | __main__:trials:24 - Trial = 22646/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.282 | DEBUG    | __main__:trials:29 - Trial = 22646/30000 | Total reward = 49.38
2022-01-26 14:18:16.286 | DEBUG    | __main__:trials:24 - Trial = 22647/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.288 | DEBUG    | __main__:trials:29 - Trial = 22647/30000 | Total reward = 35.10
2022-01-26 14:18:16.291 | DEBUG    | __main__:trials:24 - Trial = 22648/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.292 | DEBUG    | __main__:trials:29 - Trial = 22648/30000 | Total reward = 49.59
2022-01-26 14:18:16.296 | DEBUG    | __main__:trials:24 - Trial = 22649/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.298 | DEBUG    | __main__:trials:29 - Trial = 22649/30000 | Total reward = 26.12
2022-01-26 14:18:16.302 | DEBUG    | __main__:trials:24 - Trial = 22650/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.302 | DEBUG    | __main__:trials:29 - Trial = 22650/30000 | Total reward = 38.64
2022-01-26 14:18:16.307 | DEBUG    | __main__:trials:24 - Trial = 22651/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.309 | DEBUG    | __main__:trials:29 - Trial = 22651/30000 | Total reward = 28.05
2022-01-26 14:18:16.312 | DEBUG    | __main__:trials:24 - Trial = 22652/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.313 | DEBUG    | __main__:trials:29 - Trial = 22652/30000 | Total reward = 38.44
2022-01-26 14:18:16.317 | DEBUG    | __main__:trials:24 - Trial = 22653/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.319 | DEBUG    | __main__:trials:29 - Trial = 22653/30000 | Total reward = 49.47
2022-01-26 14:18:16.323 | DEBUG    | __main__:trials:24 - Trial = 22654/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.324 | DEBUG    | __main__:trials:29 - Trial = 22654/30000 | Total reward = 42.50
2022-01-26 14:18:16.328 | DEBUG    | __main__:trials:24 - Trial = 22655/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.329 | DEBUG    | __main__:trials:29 - Trial = 22655/30000 | Total reward = 37.09
2022-01-26 14:18:16.334 | DEBUG    | __main__:trials:24 - Trial = 22656/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.335 | DEBUG    | __main__:trials:29 - Trial = 22656/30000 | Total reward = 37.75
2022-01-26 14:18:16.339 | DEBUG    | __main__:trials:24 - Trial = 22657/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.341 | DEBUG    | __main__:trials:29 - Trial = 22657/30000 | Total reward = 39.83
2022-01-26 14:18:16.344 | DEBUG    | __main__:trials:24 - Trial = 22658/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.346 | DEBUG    | __main__:trials:29 - Trial = 22658/30000 | Total reward = 51.74
2022-01-26 14:18:16.350 | DEBUG    | __main__:trials:24 - Trial = 22659/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.351 | DEBUG    | __main__:trials:29 - Trial = 22659/30000 | Total reward = 49.30
2022-01-26 14:18:16.355 | DEBUG    | __main__:trials:24 - Trial = 22660/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.356 | DEBUG    | __main__:trials:29 - Trial = 22660/30000 | Total reward = 47.60
2022-01-26 14:18:16.360 | DEBUG    | __main__:trials:24 - Trial = 22661/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.361 | DEBUG    | __main__:trials:29 - Trial = 22661/30000 | Total reward = 44.21
2022-01-26 14:18:16.365 | DEBUG    | __main__:trials:24 - Trial = 22662/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.366 | DEBUG    | __main__:trials:29 - Trial = 22662/30000 | Total reward = 43.02
2022-01-26 14:18:16.370 | DEBUG    | __main__:trials:24 - Trial = 22663/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.371 | DEBUG    | __main__:trials:29 - Trial = 22663/30000 | Total reward = 46.01
2022-01-26 14:18:16.376 | DEBUG    | __main__:trials:24 - Trial = 22664/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.377 | DEBUG    | __main__:trials:29 - Trial = 22664/30000 | Total reward = 45.30
2022-01-26 14:18:16.380 | DEBUG    | __main__:trials:24 - Trial = 22665/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.382 | DEBUG    | __main__:trials:29 - Trial = 22665/30000 | Total reward = 46.32
2022-01-26 14:18:16.385 | DEBUG    | __main__:trials:26 - Trial = 22666/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.386 | DEBUG    | __main__:trials:29 - Trial = 22666/30000 | Total reward = 26.95
2022-01-26 14:18:16.390 | DEBUG    | __main__:trials:24 - Trial = 22667/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.392 | DEBUG    | __main__:trials:29 - Trial = 22667/30000 | Total reward = 40.17
2022-01-26 14:18:16.396 | DEBUG    | __main__:trials:24 - Trial = 22668/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.397 | DEBUG    | __main__:trials:29 - Trial = 22668/30000 | Total reward = 40.30
2022-01-26 14:18:16.400 | DEBUG    | __main__:trials:24 - Trial = 22669/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.402 | DEBUG    | __main__:trials:29 - Trial = 22669/30000 | Total reward = 42.35
2022-01-26 14:18:16.405 | DEBUG    | __main__:trials:24 - Trial = 22670/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.406 | DEBUG    | __main__:trials:29 - Trial = 22670/30000 | Total reward = 42.93
2022-01-26 14:18:16.409 | DEBUG    | __main__:trials:24 - Trial = 22671/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.411 | DEBUG    | __main__:trials:29 - Trial = 22671/30000 | Total reward = 39.89
2022-01-26 14:18:16.414 | DEBUG    | __main__:trials:26 - Trial = 22672/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.415 | DEBUG    | __main__:trials:29 - Trial = 22672/30000 | Total reward = 34.84
2022-01-26 14:18:16.418 | DEBUG    | __main__:trials:24 - Trial = 22673/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.420 | DEBUG    | __main__:trials:29 - Trial = 22673/30000 | Total reward = 50.25
2022-01-26 14:18:16.423 | DEBUG    | __main__:trials:24 - Trial = 22674/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.425 | DEBUG    | __main__:trials:29 - Trial = 22674/30000 | Total reward = 38.79
2022-01-26 14:18:16.428 | DEBUG    | __main__:trials:24 - Trial = 22675/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.430 | DEBUG    | __main__:trials:29 - Trial = 22675/30000 | Total reward = 43.00
2022-01-26 14:18:16.433 | DEBUG    | __main__:trials:24 - Trial = 22676/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.434 | DEBUG    | __main__:trials:29 - Trial = 22676/30000 | Total reward = 42.53
2022-01-26 14:18:16.438 | DEBUG    | __main__:trials:24 - Trial = 22677/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.440 | DEBUG    | __main__:trials:29 - Trial = 22677/30000 | Total reward = 36.87
2022-01-26 14:18:16.443 | DEBUG    | __main__:trials:24 - Trial = 22678/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.444 | DEBUG    | __main__:trials:29 - Trial = 22678/30000 | Total reward = 45.91
2022-01-26 14:18:16.447 | DEBUG    | __main__:trials:24 - Trial = 22679/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.449 | DEBUG    | __main__:trials:29 - Trial = 22679/30000 | Total reward = 33.09
2022-01-26 14:18:16.452 | DEBUG    | __main__:trials:24 - Trial = 22680/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.452 | DEBUG    | __main__:trials:29 - Trial = 22680/30000 | Total reward = 46.60
2022-01-26 14:18:16.456 | DEBUG    | __main__:trials:24 - Trial = 22681/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.458 | DEBUG    | __main__:trials:29 - Trial = 22681/30000 | Total reward = 41.18
2022-01-26 14:18:16.461 | DEBUG    | __main__:trials:24 - Trial = 22682/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.461 | DEBUG    | __main__:trials:29 - Trial = 22682/30000 | Total reward = 39.09
2022-01-26 14:18:16.465 | DEBUG    | __main__:trials:24 - Trial = 22683/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.466 | DEBUG    | __main__:trials:29 - Trial = 22683/30000 | Total reward = 46.84
2022-01-26 14:18:16.470 | DEBUG    | __main__:trials:24 - Trial = 22684/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.471 | DEBUG    | __main__:trials:29 - Trial = 22684/30000 | Total reward = 46.73
2022-01-26 14:18:16.475 | DEBUG    | __main__:trials:26 - Trial = 22685/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.476 | DEBUG    | __main__:trials:29 - Trial = 22685/30000 | Total reward = 20.13
2022-01-26 14:18:16.480 | DEBUG    | __main__:trials:24 - Trial = 22686/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.481 | DEBUG    | __main__:trials:29 - Trial = 22686/30000 | Total reward = 46.92
2022-01-26 14:18:16.485 | DEBUG    | __main__:trials:24 - Trial = 22687/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.485 | DEBUG    | __main__:trials:29 - Trial = 22687/30000 | Total reward = 61.65
2022-01-26 14:18:16.489 | DEBUG    | __main__:trials:24 - Trial = 22688/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.490 | DEBUG    | __main__:trials:29 - Trial = 22688/30000 | Total reward = 40.08
2022-01-26 14:18:16.494 | DEBUG    | __main__:trials:24 - Trial = 22689/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.494 | DEBUG    | __main__:trials:29 - Trial = 22689/30000 | Total reward = 42.24
2022-01-26 14:18:16.498 | DEBUG    | __main__:trials:24 - Trial = 22690/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.499 | DEBUG    | __main__:trials:29 - Trial = 22690/30000 | Total reward = 42.23
2022-01-26 14:18:16.502 | DEBUG    | __main__:trials:24 - Trial = 22691/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.504 | DEBUG    | __main__:trials:29 - Trial = 22691/30000 | Total reward = 32.45
2022-01-26 14:18:16.507 | DEBUG    | __main__:trials:24 - Trial = 22692/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.509 | DEBUG    | __main__:trials:29 - Trial = 22692/30000 | Total reward = 32.71
2022-01-26 14:18:16.512 | DEBUG    | __main__:trials:24 - Trial = 22693/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.513 | DEBUG    | __main__:trials:29 - Trial = 22693/30000 | Total reward = 38.57
2022-01-26 14:18:16.516 | DEBUG    | __main__:trials:24 - Trial = 22694/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.518 | DEBUG    | __main__:trials:29 - Trial = 22694/30000 | Total reward = 38.66
2022-01-26 14:18:16.521 | DEBUG    | __main__:trials:24 - Trial = 22695/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.523 | DEBUG    | __main__:trials:29 - Trial = 22695/30000 | Total reward = 38.16
2022-01-26 14:18:16.527 | DEBUG    | __main__:trials:24 - Trial = 22696/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.527 | DEBUG    | __main__:trials:29 - Trial = 22696/30000 | Total reward = 47.51
2022-01-26 14:18:16.531 | DEBUG    | __main__:trials:24 - Trial = 22697/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.532 | DEBUG    | __main__:trials:29 - Trial = 22697/30000 | Total reward = 45.85
2022-01-26 14:18:16.535 | DEBUG    | __main__:trials:24 - Trial = 22698/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.537 | DEBUG    | __main__:trials:29 - Trial = 22698/30000 | Total reward = 40.94
2022-01-26 14:18:16.540 | DEBUG    | __main__:trials:26 - Trial = 22699/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.542 | DEBUG    | __main__:trials:29 - Trial = 22699/30000 | Total reward = 34.06
2022-01-26 14:18:16.545 | DEBUG    | __main__:trials:24 - Trial = 22700/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.547 | DEBUG    | __main__:trials:29 - Trial = 22700/30000 | Total reward = 48.51
2022-01-26 14:18:16.549 | DEBUG    | __main__:trials:24 - Trial = 22701/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.550 | DEBUG    | __main__:trials:29 - Trial = 22701/30000 | Total reward = 35.01
2022-01-26 14:18:16.554 | DEBUG    | __main__:trials:24 - Trial = 22702/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.555 | DEBUG    | __main__:trials:29 - Trial = 22702/30000 | Total reward = 39.09
2022-01-26 14:18:16.559 | DEBUG    | __main__:trials:24 - Trial = 22703/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.561 | DEBUG    | __main__:trials:29 - Trial = 22703/30000 | Total reward = 47.61
2022-01-26 14:18:16.564 | DEBUG    | __main__:trials:24 - Trial = 22704/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.567 | DEBUG    | __main__:trials:29 - Trial = 22704/30000 | Total reward = 49.25
2022-01-26 14:18:16.570 | DEBUG    | __main__:trials:24 - Trial = 22705/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.572 | DEBUG    | __main__:trials:29 - Trial = 22705/30000 | Total reward = 44.21
2022-01-26 14:18:16.575 | DEBUG    | __main__:trials:24 - Trial = 22706/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.577 | DEBUG    | __main__:trials:29 - Trial = 22706/30000 | Total reward = 36.66
2022-01-26 14:18:16.579 | DEBUG    | __main__:trials:24 - Trial = 22707/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.581 | DEBUG    | __main__:trials:29 - Trial = 22707/30000 | Total reward = 38.48
2022-01-26 14:18:16.584 | DEBUG    | __main__:trials:24 - Trial = 22708/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.585 | DEBUG    | __main__:trials:29 - Trial = 22708/30000 | Total reward = 39.91
2022-01-26 14:18:16.588 | DEBUG    | __main__:trials:24 - Trial = 22709/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.590 | DEBUG    | __main__:trials:29 - Trial = 22709/30000 | Total reward = 41.90
2022-01-26 14:18:16.594 | DEBUG    | __main__:trials:24 - Trial = 22710/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.594 | DEBUG    | __main__:trials:29 - Trial = 22710/30000 | Total reward = 31.07
2022-01-26 14:18:16.599 | DEBUG    | __main__:trials:24 - Trial = 22711/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.600 | DEBUG    | __main__:trials:29 - Trial = 22711/30000 | Total reward = 53.08
2022-01-26 14:18:16.603 | DEBUG    | __main__:trials:26 - Trial = 22712/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.604 | DEBUG    | __main__:trials:29 - Trial = 22712/30000 | Total reward = 11.99
2022-01-26 14:18:16.607 | DEBUG    | __main__:trials:24 - Trial = 22713/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.609 | DEBUG    | __main__:trials:29 - Trial = 22713/30000 | Total reward = 37.34
2022-01-26 14:18:16.612 | DEBUG    | __main__:trials:24 - Trial = 22714/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.614 | DEBUG    | __main__:trials:29 - Trial = 22714/30000 | Total reward = 40.73
2022-01-26 14:18:16.617 | DEBUG    | __main__:trials:24 - Trial = 22715/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.618 | DEBUG    | __main__:trials:29 - Trial = 22715/30000 | Total reward = 57.59
2022-01-26 14:18:16.621 | DEBUG    | __main__:trials:24 - Trial = 22716/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.622 | DEBUG    | __main__:trials:29 - Trial = 22716/30000 | Total reward = 30.70
2022-01-26 14:18:16.625 | DEBUG    | __main__:trials:24 - Trial = 22717/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.627 | DEBUG    | __main__:trials:29 - Trial = 22717/30000 | Total reward = 47.29
2022-01-26 14:18:16.630 | DEBUG    | __main__:trials:24 - Trial = 22718/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.631 | DEBUG    | __main__:trials:29 - Trial = 22718/30000 | Total reward = 35.39
2022-01-26 14:18:16.635 | DEBUG    | __main__:trials:24 - Trial = 22719/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.635 | DEBUG    | __main__:trials:29 - Trial = 22719/30000 | Total reward = 45.35
2022-01-26 14:18:16.639 | DEBUG    | __main__:trials:24 - Trial = 22720/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.641 | DEBUG    | __main__:trials:29 - Trial = 22720/30000 | Total reward = 41.33
2022-01-26 14:18:16.644 | DEBUG    | __main__:trials:24 - Trial = 22721/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.645 | DEBUG    | __main__:trials:29 - Trial = 22721/30000 | Total reward = 50.52
2022-01-26 14:18:16.649 | DEBUG    | __main__:trials:24 - Trial = 22722/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.649 | DEBUG    | __main__:trials:29 - Trial = 22722/30000 | Total reward = 40.36
2022-01-26 14:18:16.653 | DEBUG    | __main__:trials:24 - Trial = 22723/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.653 | DEBUG    | __main__:trials:29 - Trial = 22723/30000 | Total reward = 37.39
2022-01-26 14:18:16.658 | DEBUG    | __main__:trials:24 - Trial = 22724/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.659 | DEBUG    | __main__:trials:29 - Trial = 22724/30000 | Total reward = 42.76
2022-01-26 14:18:16.662 | DEBUG    | __main__:trials:24 - Trial = 22725/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.664 | DEBUG    | __main__:trials:29 - Trial = 22725/30000 | Total reward = 45.96
2022-01-26 14:18:16.667 | DEBUG    | __main__:trials:24 - Trial = 22726/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.668 | DEBUG    | __main__:trials:29 - Trial = 22726/30000 | Total reward = 42.25
2022-01-26 14:18:16.671 | DEBUG    | __main__:trials:24 - Trial = 22727/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.673 | DEBUG    | __main__:trials:29 - Trial = 22727/30000 | Total reward = 43.45
2022-01-26 14:18:16.676 | DEBUG    | __main__:trials:24 - Trial = 22728/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.677 | DEBUG    | __main__:trials:29 - Trial = 22728/30000 | Total reward = 35.70
2022-01-26 14:18:16.680 | DEBUG    | __main__:trials:24 - Trial = 22729/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.681 | DEBUG    | __main__:trials:29 - Trial = 22729/30000 | Total reward = 37.95
2022-01-26 14:18:16.685 | DEBUG    | __main__:trials:24 - Trial = 22730/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.686 | DEBUG    | __main__:trials:29 - Trial = 22730/30000 | Total reward = 39.31
2022-01-26 14:18:16.689 | DEBUG    | __main__:trials:24 - Trial = 22731/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.690 | DEBUG    | __main__:trials:29 - Trial = 22731/30000 | Total reward = 42.73
2022-01-26 14:18:16.694 | DEBUG    | __main__:trials:24 - Trial = 22732/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.696 | DEBUG    | __main__:trials:29 - Trial = 22732/30000 | Total reward = 39.78
2022-01-26 14:18:16.699 | DEBUG    | __main__:trials:24 - Trial = 22733/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.701 | DEBUG    | __main__:trials:29 - Trial = 22733/30000 | Total reward = 35.39
2022-01-26 14:18:16.704 | DEBUG    | __main__:trials:24 - Trial = 22734/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.706 | DEBUG    | __main__:trials:29 - Trial = 22734/30000 | Total reward = 46.57
2022-01-26 14:18:16.709 | DEBUG    | __main__:trials:24 - Trial = 22735/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.709 | DEBUG    | __main__:trials:29 - Trial = 22735/30000 | Total reward = 41.62
2022-01-26 14:18:16.713 | DEBUG    | __main__:trials:24 - Trial = 22736/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.714 | DEBUG    | __main__:trials:29 - Trial = 22736/30000 | Total reward = 34.40
2022-01-26 14:18:16.718 | DEBUG    | __main__:trials:24 - Trial = 22737/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.719 | DEBUG    | __main__:trials:29 - Trial = 22737/30000 | Total reward = 35.70
2022-01-26 14:18:16.722 | DEBUG    | __main__:trials:24 - Trial = 22738/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.724 | DEBUG    | __main__:trials:29 - Trial = 22738/30000 | Total reward = 45.63
2022-01-26 14:18:16.728 | DEBUG    | __main__:trials:24 - Trial = 22739/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.729 | DEBUG    | __main__:trials:29 - Trial = 22739/30000 | Total reward = 39.98
2022-01-26 14:18:16.733 | DEBUG    | __main__:trials:24 - Trial = 22740/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.735 | DEBUG    | __main__:trials:29 - Trial = 22740/30000 | Total reward = 25.00
2022-01-26 14:18:16.738 | DEBUG    | __main__:trials:26 - Trial = 22741/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.740 | DEBUG    | __main__:trials:29 - Trial = 22741/30000 | Total reward = 29.05
2022-01-26 14:18:16.743 | DEBUG    | __main__:trials:24 - Trial = 22742/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.745 | DEBUG    | __main__:trials:29 - Trial = 22742/30000 | Total reward = 61.25
2022-01-26 14:18:16.748 | DEBUG    | __main__:trials:24 - Trial = 22743/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.750 | DEBUG    | __main__:trials:29 - Trial = 22743/30000 | Total reward = 37.69
2022-01-26 14:18:16.754 | DEBUG    | __main__:trials:26 - Trial = 22744/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.755 | DEBUG    | __main__:trials:29 - Trial = 22744/30000 | Total reward = 25.65
2022-01-26 14:18:16.759 | DEBUG    | __main__:trials:24 - Trial = 22745/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.761 | DEBUG    | __main__:trials:29 - Trial = 22745/30000 | Total reward = 37.14
2022-01-26 14:18:16.764 | DEBUG    | __main__:trials:24 - Trial = 22746/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.766 | DEBUG    | __main__:trials:29 - Trial = 22746/30000 | Total reward = 50.74
2022-01-26 14:18:16.770 | DEBUG    | __main__:trials:24 - Trial = 22747/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.771 | DEBUG    | __main__:trials:29 - Trial = 22747/30000 | Total reward = 60.23
2022-01-26 14:18:16.775 | DEBUG    | __main__:trials:24 - Trial = 22748/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.777 | DEBUG    | __main__:trials:29 - Trial = 22748/30000 | Total reward = 63.42
2022-01-26 14:18:16.781 | DEBUG    | __main__:trials:24 - Trial = 22749/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.782 | DEBUG    | __main__:trials:29 - Trial = 22749/30000 | Total reward = 40.86
2022-01-26 14:18:16.785 | DEBUG    | __main__:trials:24 - Trial = 22750/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.786 | DEBUG    | __main__:trials:29 - Trial = 22750/30000 | Total reward = 63.59
2022-01-26 14:18:16.791 | DEBUG    | __main__:trials:24 - Trial = 22751/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.792 | DEBUG    | __main__:trials:29 - Trial = 22751/30000 | Total reward = 40.75
2022-01-26 14:18:16.796 | DEBUG    | __main__:trials:24 - Trial = 22752/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.798 | DEBUG    | __main__:trials:29 - Trial = 22752/30000 | Total reward = 34.63
2022-01-26 14:18:16.801 | DEBUG    | __main__:trials:26 - Trial = 22753/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.803 | DEBUG    | __main__:trials:29 - Trial = 22753/30000 | Total reward = 30.68
2022-01-26 14:18:16.807 | DEBUG    | __main__:trials:24 - Trial = 22754/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.808 | DEBUG    | __main__:trials:29 - Trial = 22754/30000 | Total reward = 38.03
2022-01-26 14:18:16.812 | DEBUG    | __main__:trials:24 - Trial = 22755/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.813 | DEBUG    | __main__:trials:29 - Trial = 22755/30000 | Total reward = 48.23
2022-01-26 14:18:16.816 | DEBUG    | __main__:trials:24 - Trial = 22756/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.818 | DEBUG    | __main__:trials:29 - Trial = 22756/30000 | Total reward = 37.86
2022-01-26 14:18:16.822 | DEBUG    | __main__:trials:24 - Trial = 22757/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.823 | DEBUG    | __main__:trials:29 - Trial = 22757/30000 | Total reward = 50.58
2022-01-26 14:18:16.826 | DEBUG    | __main__:trials:24 - Trial = 22758/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.828 | DEBUG    | __main__:trials:29 - Trial = 22758/30000 | Total reward = 50.50
2022-01-26 14:18:16.832 | DEBUG    | __main__:trials:24 - Trial = 22759/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.833 | DEBUG    | __main__:trials:29 - Trial = 22759/30000 | Total reward = 34.77
2022-01-26 14:18:16.837 | DEBUG    | __main__:trials:24 - Trial = 22760/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.839 | DEBUG    | __main__:trials:29 - Trial = 22760/30000 | Total reward = 56.86
2022-01-26 14:18:16.842 | DEBUG    | __main__:trials:24 - Trial = 22761/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.844 | DEBUG    | __main__:trials:29 - Trial = 22761/30000 | Total reward = 47.64
2022-01-26 14:18:16.848 | DEBUG    | __main__:trials:24 - Trial = 22762/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.849 | DEBUG    | __main__:trials:29 - Trial = 22762/30000 | Total reward = 50.04
2022-01-26 14:18:16.852 | DEBUG    | __main__:trials:24 - Trial = 22763/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.854 | DEBUG    | __main__:trials:29 - Trial = 22763/30000 | Total reward = 48.97
2022-01-26 14:18:16.858 | DEBUG    | __main__:trials:24 - Trial = 22764/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.859 | DEBUG    | __main__:trials:29 - Trial = 22764/30000 | Total reward = 37.65
2022-01-26 14:18:16.861 | DEBUG    | __main__:trials:24 - Trial = 22765/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.862 | DEBUG    | __main__:trials:29 - Trial = 22765/30000 | Total reward = 50.58
2022-01-26 14:18:16.866 | DEBUG    | __main__:trials:24 - Trial = 22766/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.868 | DEBUG    | __main__:trials:29 - Trial = 22766/30000 | Total reward = 46.20
2022-01-26 14:18:16.871 | DEBUG    | __main__:trials:24 - Trial = 22767/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.872 | DEBUG    | __main__:trials:29 - Trial = 22767/30000 | Total reward = 34.82
2022-01-26 14:18:16.876 | DEBUG    | __main__:trials:24 - Trial = 22768/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.878 | DEBUG    | __main__:trials:29 - Trial = 22768/30000 | Total reward = 39.16
2022-01-26 14:18:16.882 | DEBUG    | __main__:trials:24 - Trial = 22769/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.884 | DEBUG    | __main__:trials:29 - Trial = 22769/30000 | Total reward = 38.78
2022-01-26 14:18:16.887 | DEBUG    | __main__:trials:24 - Trial = 22770/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.889 | DEBUG    | __main__:trials:29 - Trial = 22770/30000 | Total reward = 43.88
2022-01-26 14:18:16.892 | DEBUG    | __main__:trials:24 - Trial = 22771/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.894 | DEBUG    | __main__:trials:29 - Trial = 22771/30000 | Total reward = 56.65
2022-01-26 14:18:16.897 | DEBUG    | __main__:trials:24 - Trial = 22772/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.898 | DEBUG    | __main__:trials:29 - Trial = 22772/30000 | Total reward = 38.02
2022-01-26 14:18:16.902 | DEBUG    | __main__:trials:24 - Trial = 22773/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.903 | DEBUG    | __main__:trials:29 - Trial = 22773/30000 | Total reward = 63.73
2022-01-26 14:18:16.907 | DEBUG    | __main__:trials:24 - Trial = 22774/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.907 | DEBUG    | __main__:trials:29 - Trial = 22774/30000 | Total reward = 52.13
2022-01-26 14:18:16.912 | DEBUG    | __main__:trials:26 - Trial = 22775/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:16.914 | DEBUG    | __main__:trials:29 - Trial = 22775/30000 | Total reward = 38.83
2022-01-26 14:18:16.917 | DEBUG    | __main__:trials:24 - Trial = 22776/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.919 | DEBUG    | __main__:trials:29 - Trial = 22776/30000 | Total reward = 36.26
2022-01-26 14:18:16.923 | DEBUG    | __main__:trials:24 - Trial = 22777/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.924 | DEBUG    | __main__:trials:29 - Trial = 22777/30000 | Total reward = 40.35
2022-01-26 14:18:16.928 | DEBUG    | __main__:trials:24 - Trial = 22778/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.930 | DEBUG    | __main__:trials:29 - Trial = 22778/30000 | Total reward = 41.30
2022-01-26 14:18:16.933 | DEBUG    | __main__:trials:24 - Trial = 22779/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.934 | DEBUG    | __main__:trials:29 - Trial = 22779/30000 | Total reward = 38.43
2022-01-26 14:18:16.939 | DEBUG    | __main__:trials:24 - Trial = 22780/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.939 | DEBUG    | __main__:trials:29 - Trial = 22780/30000 | Total reward = 34.01
2022-01-26 14:18:16.943 | DEBUG    | __main__:trials:24 - Trial = 22781/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.945 | DEBUG    | __main__:trials:29 - Trial = 22781/30000 | Total reward = 43.11
2022-01-26 14:18:16.948 | DEBUG    | __main__:trials:24 - Trial = 22782/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.949 | DEBUG    | __main__:trials:29 - Trial = 22782/30000 | Total reward = 44.71
2022-01-26 14:18:16.954 | DEBUG    | __main__:trials:24 - Trial = 22783/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.955 | DEBUG    | __main__:trials:29 - Trial = 22783/30000 | Total reward = 41.56
2022-01-26 14:18:16.959 | DEBUG    | __main__:trials:24 - Trial = 22784/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.960 | DEBUG    | __main__:trials:29 - Trial = 22784/30000 | Total reward = 41.39
2022-01-26 14:18:16.963 | DEBUG    | __main__:trials:24 - Trial = 22785/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.965 | DEBUG    | __main__:trials:29 - Trial = 22785/30000 | Total reward = 47.64
2022-01-26 14:18:16.969 | DEBUG    | __main__:trials:24 - Trial = 22786/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.970 | DEBUG    | __main__:trials:29 - Trial = 22786/30000 | Total reward = 41.46
2022-01-26 14:18:16.974 | DEBUG    | __main__:trials:24 - Trial = 22787/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.976 | DEBUG    | __main__:trials:29 - Trial = 22787/30000 | Total reward = 40.16
2022-01-26 14:18:16.979 | DEBUG    | __main__:trials:24 - Trial = 22788/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.981 | DEBUG    | __main__:trials:29 - Trial = 22788/30000 | Total reward = 44.68
2022-01-26 14:18:16.984 | DEBUG    | __main__:trials:24 - Trial = 22789/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.985 | DEBUG    | __main__:trials:29 - Trial = 22789/30000 | Total reward = 43.96
2022-01-26 14:18:16.988 | DEBUG    | __main__:trials:24 - Trial = 22790/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.990 | DEBUG    | __main__:trials:29 - Trial = 22790/30000 | Total reward = 37.46
2022-01-26 14:18:16.993 | DEBUG    | __main__:trials:24 - Trial = 22791/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.995 | DEBUG    | __main__:trials:29 - Trial = 22791/30000 | Total reward = 48.27
2022-01-26 14:18:16.998 | DEBUG    | __main__:trials:24 - Trial = 22792/30000 | Max number of steps (20) reached
2022-01-26 14:18:16.998 | DEBUG    | __main__:trials:29 - Trial = 22792/30000 | Total reward = 41.74
2022-01-26 14:18:17.002 | DEBUG    | __main__:trials:24 - Trial = 22793/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.004 | DEBUG    | __main__:trials:29 - Trial = 22793/30000 | Total reward = 39.79
2022-01-26 14:18:17.007 | DEBUG    | __main__:trials:24 - Trial = 22794/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.008 | DEBUG    | __main__:trials:29 - Trial = 22794/30000 | Total reward = 41.88
2022-01-26 14:18:17.012 | DEBUG    | __main__:trials:24 - Trial = 22795/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.013 | DEBUG    | __main__:trials:29 - Trial = 22795/30000 | Total reward = 39.28
2022-01-26 14:18:17.017 | DEBUG    | __main__:trials:24 - Trial = 22796/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.019 | DEBUG    | __main__:trials:29 - Trial = 22796/30000 | Total reward = 49.04
2022-01-26 14:18:17.022 | DEBUG    | __main__:trials:24 - Trial = 22797/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.024 | DEBUG    | __main__:trials:29 - Trial = 22797/30000 | Total reward = 49.56
2022-01-26 14:18:17.027 | DEBUG    | __main__:trials:24 - Trial = 22798/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.028 | DEBUG    | __main__:trials:29 - Trial = 22798/30000 | Total reward = 42.93
2022-01-26 14:18:17.032 | DEBUG    | __main__:trials:24 - Trial = 22799/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.033 | DEBUG    | __main__:trials:29 - Trial = 22799/30000 | Total reward = 52.73
2022-01-26 14:18:17.037 | DEBUG    | __main__:trials:24 - Trial = 22800/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.038 | DEBUG    | __main__:trials:29 - Trial = 22800/30000 | Total reward = 46.76
2022-01-26 14:18:17.041 | DEBUG    | __main__:trials:24 - Trial = 22801/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.043 | DEBUG    | __main__:trials:29 - Trial = 22801/30000 | Total reward = 58.64
2022-01-26 14:18:17.046 | DEBUG    | __main__:trials:24 - Trial = 22802/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.048 | DEBUG    | __main__:trials:29 - Trial = 22802/30000 | Total reward = 35.31
2022-01-26 14:18:17.051 | DEBUG    | __main__:trials:24 - Trial = 22803/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.053 | DEBUG    | __main__:trials:29 - Trial = 22803/30000 | Total reward = 36.62
2022-01-26 14:18:17.056 | DEBUG    | __main__:trials:24 - Trial = 22804/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.058 | DEBUG    | __main__:trials:29 - Trial = 22804/30000 | Total reward = 46.69
2022-01-26 14:18:17.062 | DEBUG    | __main__:trials:24 - Trial = 22805/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.063 | DEBUG    | __main__:trials:29 - Trial = 22805/30000 | Total reward = 51.06
2022-01-26 14:18:17.067 | DEBUG    | __main__:trials:24 - Trial = 22806/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.069 | DEBUG    | __main__:trials:29 - Trial = 22806/30000 | Total reward = 44.69
2022-01-26 14:18:17.072 | DEBUG    | __main__:trials:24 - Trial = 22807/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.074 | DEBUG    | __main__:trials:29 - Trial = 22807/30000 | Total reward = 45.79
2022-01-26 14:18:17.078 | DEBUG    | __main__:trials:24 - Trial = 22808/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.078 | DEBUG    | __main__:trials:29 - Trial = 22808/30000 | Total reward = 52.20
2022-01-26 14:18:17.083 | DEBUG    | __main__:trials:24 - Trial = 22809/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.083 | DEBUG    | __main__:trials:29 - Trial = 22809/30000 | Total reward = 38.62
2022-01-26 14:18:17.087 | DEBUG    | __main__:trials:24 - Trial = 22810/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.089 | DEBUG    | __main__:trials:29 - Trial = 22810/30000 | Total reward = 38.64
2022-01-26 14:18:17.092 | DEBUG    | __main__:trials:24 - Trial = 22811/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.093 | DEBUG    | __main__:trials:29 - Trial = 22811/30000 | Total reward = 62.74
2022-01-26 14:18:17.096 | DEBUG    | __main__:trials:24 - Trial = 22812/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.098 | DEBUG    | __main__:trials:29 - Trial = 22812/30000 | Total reward = 51.94
2022-01-26 14:18:17.101 | DEBUG    | __main__:trials:24 - Trial = 22813/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.103 | DEBUG    | __main__:trials:29 - Trial = 22813/30000 | Total reward = 41.36
2022-01-26 14:18:17.107 | DEBUG    | __main__:trials:24 - Trial = 22814/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.109 | DEBUG    | __main__:trials:29 - Trial = 22814/30000 | Total reward = 38.32
2022-01-26 14:18:17.112 | DEBUG    | __main__:trials:26 - Trial = 22815/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.113 | DEBUG    | __main__:trials:29 - Trial = 22815/30000 | Total reward = 27.38
2022-01-26 14:18:17.117 | DEBUG    | __main__:trials:24 - Trial = 22816/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.118 | DEBUG    | __main__:trials:29 - Trial = 22816/30000 | Total reward = 46.98
2022-01-26 14:18:17.122 | DEBUG    | __main__:trials:24 - Trial = 22817/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.123 | DEBUG    | __main__:trials:29 - Trial = 22817/30000 | Total reward = 54.42
2022-01-26 14:18:17.127 | DEBUG    | __main__:trials:24 - Trial = 22818/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.128 | DEBUG    | __main__:trials:29 - Trial = 22818/30000 | Total reward = 45.11
2022-01-26 14:18:17.132 | DEBUG    | __main__:trials:24 - Trial = 22819/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.133 | DEBUG    | __main__:trials:29 - Trial = 22819/30000 | Total reward = 48.37
2022-01-26 14:18:17.137 | DEBUG    | __main__:trials:24 - Trial = 22820/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.139 | DEBUG    | __main__:trials:29 - Trial = 22820/30000 | Total reward = 46.98
2022-01-26 14:18:17.143 | DEBUG    | __main__:trials:24 - Trial = 22821/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.143 | DEBUG    | __main__:trials:29 - Trial = 22821/30000 | Total reward = 48.57
2022-01-26 14:18:17.148 | DEBUG    | __main__:trials:24 - Trial = 22822/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.149 | DEBUG    | __main__:trials:29 - Trial = 22822/30000 | Total reward = 56.66
2022-01-26 14:18:17.153 | DEBUG    | __main__:trials:26 - Trial = 22823/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.154 | DEBUG    | __main__:trials:29 - Trial = 22823/30000 | Total reward = 33.21
2022-01-26 14:18:17.157 | DEBUG    | __main__:trials:24 - Trial = 22824/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.159 | DEBUG    | __main__:trials:29 - Trial = 22824/30000 | Total reward = 38.20
2022-01-26 14:18:17.163 | DEBUG    | __main__:trials:26 - Trial = 22825/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.164 | DEBUG    | __main__:trials:29 - Trial = 22825/30000 | Total reward = 40.22
2022-01-26 14:18:17.168 | DEBUG    | __main__:trials:24 - Trial = 22826/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.169 | DEBUG    | __main__:trials:29 - Trial = 22826/30000 | Total reward = 43.83
2022-01-26 14:18:17.173 | DEBUG    | __main__:trials:24 - Trial = 22827/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.175 | DEBUG    | __main__:trials:29 - Trial = 22827/30000 | Total reward = 44.66
2022-01-26 14:18:17.179 | DEBUG    | __main__:trials:24 - Trial = 22828/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.180 | DEBUG    | __main__:trials:29 - Trial = 22828/30000 | Total reward = 46.56
2022-01-26 14:18:17.184 | DEBUG    | __main__:trials:24 - Trial = 22829/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.185 | DEBUG    | __main__:trials:29 - Trial = 22829/30000 | Total reward = 36.81
2022-01-26 14:18:17.189 | DEBUG    | __main__:trials:24 - Trial = 22830/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.190 | DEBUG    | __main__:trials:29 - Trial = 22830/30000 | Total reward = 38.63
2022-01-26 14:18:17.192 | DEBUG    | __main__:trials:26 - Trial = 22831/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.193 | DEBUG    | __main__:trials:29 - Trial = 22831/30000 | Total reward = 15.88
2022-01-26 14:18:17.196 | DEBUG    | __main__:trials:24 - Trial = 22832/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.197 | DEBUG    | __main__:trials:29 - Trial = 22832/30000 | Total reward = 44.54
2022-01-26 14:18:17.201 | DEBUG    | __main__:trials:24 - Trial = 22833/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.202 | DEBUG    | __main__:trials:29 - Trial = 22833/30000 | Total reward = 53.51
2022-01-26 14:18:17.205 | DEBUG    | __main__:trials:24 - Trial = 22834/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.206 | DEBUG    | __main__:trials:29 - Trial = 22834/30000 | Total reward = 50.40
2022-01-26 14:18:17.209 | DEBUG    | __main__:trials:24 - Trial = 22835/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.210 | DEBUG    | __main__:trials:29 - Trial = 22835/30000 | Total reward = 52.76
2022-01-26 14:18:17.213 | DEBUG    | __main__:trials:24 - Trial = 22836/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.215 | DEBUG    | __main__:trials:29 - Trial = 22836/30000 | Total reward = 53.08
2022-01-26 14:18:17.219 | DEBUG    | __main__:trials:24 - Trial = 22837/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.220 | DEBUG    | __main__:trials:29 - Trial = 22837/30000 | Total reward = 53.51
2022-01-26 14:18:17.224 | DEBUG    | __main__:trials:24 - Trial = 22838/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.225 | DEBUG    | __main__:trials:29 - Trial = 22838/30000 | Total reward = 47.35
2022-01-26 14:18:17.228 | DEBUG    | __main__:trials:24 - Trial = 22839/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.230 | DEBUG    | __main__:trials:29 - Trial = 22839/30000 | Total reward = 39.48
2022-01-26 14:18:17.234 | DEBUG    | __main__:trials:24 - Trial = 22840/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.235 | DEBUG    | __main__:trials:29 - Trial = 22840/30000 | Total reward = 47.99
2022-01-26 14:18:17.238 | DEBUG    | __main__:trials:24 - Trial = 22841/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.240 | DEBUG    | __main__:trials:29 - Trial = 22841/30000 | Total reward = 39.31
2022-01-26 14:18:17.243 | DEBUG    | __main__:trials:24 - Trial = 22842/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.245 | DEBUG    | __main__:trials:29 - Trial = 22842/30000 | Total reward = 46.44
2022-01-26 14:18:17.248 | DEBUG    | __main__:trials:24 - Trial = 22843/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.250 | DEBUG    | __main__:trials:29 - Trial = 22843/30000 | Total reward = 40.15
2022-01-26 14:18:17.253 | DEBUG    | __main__:trials:24 - Trial = 22844/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.254 | DEBUG    | __main__:trials:29 - Trial = 22844/30000 | Total reward = 34.97
2022-01-26 14:18:17.258 | DEBUG    | __main__:trials:24 - Trial = 22845/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.259 | DEBUG    | __main__:trials:29 - Trial = 22845/30000 | Total reward = 45.32
2022-01-26 14:18:17.263 | DEBUG    | __main__:trials:24 - Trial = 22846/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.264 | DEBUG    | __main__:trials:29 - Trial = 22846/30000 | Total reward = 51.43
2022-01-26 14:18:17.268 | DEBUG    | __main__:trials:24 - Trial = 22847/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.269 | DEBUG    | __main__:trials:29 - Trial = 22847/30000 | Total reward = 36.39
2022-01-26 14:18:17.273 | DEBUG    | __main__:trials:24 - Trial = 22848/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.275 | DEBUG    | __main__:trials:29 - Trial = 22848/30000 | Total reward = 41.81
2022-01-26 14:18:17.278 | DEBUG    | __main__:trials:24 - Trial = 22849/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.279 | DEBUG    | __main__:trials:29 - Trial = 22849/30000 | Total reward = 41.50
2022-01-26 14:18:17.282 | DEBUG    | __main__:trials:24 - Trial = 22850/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.284 | DEBUG    | __main__:trials:29 - Trial = 22850/30000 | Total reward = 39.18
2022-01-26 14:18:17.287 | DEBUG    | __main__:trials:24 - Trial = 22851/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.289 | DEBUG    | __main__:trials:29 - Trial = 22851/30000 | Total reward = 35.15
2022-01-26 14:18:17.292 | DEBUG    | __main__:trials:24 - Trial = 22852/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.294 | DEBUG    | __main__:trials:29 - Trial = 22852/30000 | Total reward = 35.79
2022-01-26 14:18:17.298 | DEBUG    | __main__:trials:24 - Trial = 22853/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.298 | DEBUG    | __main__:trials:29 - Trial = 22853/30000 | Total reward = 43.26
2022-01-26 14:18:17.302 | DEBUG    | __main__:trials:24 - Trial = 22854/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.304 | DEBUG    | __main__:trials:29 - Trial = 22854/30000 | Total reward = 50.58
2022-01-26 14:18:17.308 | DEBUG    | __main__:trials:26 - Trial = 22855/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.309 | DEBUG    | __main__:trials:29 - Trial = 22855/30000 | Total reward = 27.11
2022-01-26 14:18:17.313 | DEBUG    | __main__:trials:24 - Trial = 22856/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.314 | DEBUG    | __main__:trials:29 - Trial = 22856/30000 | Total reward = 44.49
2022-01-26 14:18:17.318 | DEBUG    | __main__:trials:26 - Trial = 22857/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.320 | DEBUG    | __main__:trials:29 - Trial = 22857/30000 | Total reward = 30.11
2022-01-26 14:18:17.323 | DEBUG    | __main__:trials:24 - Trial = 22858/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.325 | DEBUG    | __main__:trials:29 - Trial = 22858/30000 | Total reward = 51.47
2022-01-26 14:18:17.328 | DEBUG    | __main__:trials:24 - Trial = 22859/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.330 | DEBUG    | __main__:trials:29 - Trial = 22859/30000 | Total reward = 39.87
2022-01-26 14:18:17.334 | DEBUG    | __main__:trials:24 - Trial = 22860/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.334 | DEBUG    | __main__:trials:29 - Trial = 22860/30000 | Total reward = 49.01
2022-01-26 14:18:17.339 | DEBUG    | __main__:trials:24 - Trial = 22861/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.340 | DEBUG    | __main__:trials:29 - Trial = 22861/30000 | Total reward = 58.45
2022-01-26 14:18:17.344 | DEBUG    | __main__:trials:24 - Trial = 22862/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.345 | DEBUG    | __main__:trials:29 - Trial = 22862/30000 | Total reward = 36.97
2022-01-26 14:18:17.349 | DEBUG    | __main__:trials:24 - Trial = 22863/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.351 | DEBUG    | __main__:trials:29 - Trial = 22863/30000 | Total reward = 44.09
2022-01-26 14:18:17.354 | DEBUG    | __main__:trials:24 - Trial = 22864/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.355 | DEBUG    | __main__:trials:29 - Trial = 22864/30000 | Total reward = 41.59
2022-01-26 14:18:17.359 | DEBUG    | __main__:trials:24 - Trial = 22865/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.360 | DEBUG    | __main__:trials:29 - Trial = 22865/30000 | Total reward = 45.75
2022-01-26 14:18:17.364 | DEBUG    | __main__:trials:24 - Trial = 22866/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.366 | DEBUG    | __main__:trials:29 - Trial = 22866/30000 | Total reward = 30.08
2022-01-26 14:18:17.369 | DEBUG    | __main__:trials:24 - Trial = 22867/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.370 | DEBUG    | __main__:trials:29 - Trial = 22867/30000 | Total reward = 33.33
2022-01-26 14:18:17.375 | DEBUG    | __main__:trials:24 - Trial = 22868/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.376 | DEBUG    | __main__:trials:29 - Trial = 22868/30000 | Total reward = 43.76
2022-01-26 14:18:17.380 | DEBUG    | __main__:trials:24 - Trial = 22869/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.381 | DEBUG    | __main__:trials:29 - Trial = 22869/30000 | Total reward = 47.30
2022-01-26 14:18:17.386 | DEBUG    | __main__:trials:24 - Trial = 22870/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.386 | DEBUG    | __main__:trials:29 - Trial = 22870/30000 | Total reward = 49.03
2022-01-26 14:18:17.391 | DEBUG    | __main__:trials:24 - Trial = 22871/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.393 | DEBUG    | __main__:trials:29 - Trial = 22871/30000 | Total reward = 41.57
2022-01-26 14:18:17.396 | DEBUG    | __main__:trials:24 - Trial = 22872/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.397 | DEBUG    | __main__:trials:29 - Trial = 22872/30000 | Total reward = 49.94
2022-01-26 14:18:17.401 | DEBUG    | __main__:trials:24 - Trial = 22873/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.402 | DEBUG    | __main__:trials:29 - Trial = 22873/30000 | Total reward = 43.40
2022-01-26 14:18:17.406 | DEBUG    | __main__:trials:24 - Trial = 22874/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.407 | DEBUG    | __main__:trials:29 - Trial = 22874/30000 | Total reward = 41.34
2022-01-26 14:18:17.411 | DEBUG    | __main__:trials:24 - Trial = 22875/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.412 | DEBUG    | __main__:trials:29 - Trial = 22875/30000 | Total reward = 35.32
2022-01-26 14:18:17.416 | DEBUG    | __main__:trials:24 - Trial = 22876/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.418 | DEBUG    | __main__:trials:29 - Trial = 22876/30000 | Total reward = 41.97
2022-01-26 14:18:17.422 | DEBUG    | __main__:trials:24 - Trial = 22877/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.422 | DEBUG    | __main__:trials:29 - Trial = 22877/30000 | Total reward = 40.00
2022-01-26 14:18:17.427 | DEBUG    | __main__:trials:24 - Trial = 22878/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.428 | DEBUG    | __main__:trials:29 - Trial = 22878/30000 | Total reward = 30.41
2022-01-26 14:18:17.432 | DEBUG    | __main__:trials:24 - Trial = 22879/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.433 | DEBUG    | __main__:trials:29 - Trial = 22879/30000 | Total reward = 43.25
2022-01-26 14:18:17.438 | DEBUG    | __main__:trials:24 - Trial = 22880/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.439 | DEBUG    | __main__:trials:29 - Trial = 22880/30000 | Total reward = 48.64
2022-01-26 14:18:17.442 | DEBUG    | __main__:trials:24 - Trial = 22881/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.444 | DEBUG    | __main__:trials:29 - Trial = 22881/30000 | Total reward = 47.84
2022-01-26 14:18:17.448 | DEBUG    | __main__:trials:24 - Trial = 22882/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.449 | DEBUG    | __main__:trials:29 - Trial = 22882/30000 | Total reward = 34.76
2022-01-26 14:18:17.453 | DEBUG    | __main__:trials:24 - Trial = 22883/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.454 | DEBUG    | __main__:trials:29 - Trial = 22883/30000 | Total reward = 46.88
2022-01-26 14:18:17.457 | DEBUG    | __main__:trials:24 - Trial = 22884/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.459 | DEBUG    | __main__:trials:29 - Trial = 22884/30000 | Total reward = 48.64
2022-01-26 14:18:17.462 | DEBUG    | __main__:trials:24 - Trial = 22885/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.462 | DEBUG    | __main__:trials:29 - Trial = 22885/30000 | Total reward = 48.08
2022-01-26 14:18:17.466 | DEBUG    | __main__:trials:24 - Trial = 22886/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.466 | DEBUG    | __main__:trials:29 - Trial = 22886/30000 | Total reward = 41.97
2022-01-26 14:18:17.470 | DEBUG    | __main__:trials:24 - Trial = 22887/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.471 | DEBUG    | __main__:trials:29 - Trial = 22887/30000 | Total reward = 45.14
2022-01-26 14:18:17.474 | DEBUG    | __main__:trials:24 - Trial = 22888/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.476 | DEBUG    | __main__:trials:29 - Trial = 22888/30000 | Total reward = 54.64
2022-01-26 14:18:17.480 | DEBUG    | __main__:trials:24 - Trial = 22889/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.481 | DEBUG    | __main__:trials:29 - Trial = 22889/30000 | Total reward = 45.53
2022-01-26 14:18:17.485 | DEBUG    | __main__:trials:24 - Trial = 22890/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.486 | DEBUG    | __main__:trials:29 - Trial = 22890/30000 | Total reward = 33.22
2022-01-26 14:18:17.490 | DEBUG    | __main__:trials:24 - Trial = 22891/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.492 | DEBUG    | __main__:trials:29 - Trial = 22891/30000 | Total reward = 34.27
2022-01-26 14:18:17.495 | DEBUG    | __main__:trials:24 - Trial = 22892/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.497 | DEBUG    | __main__:trials:29 - Trial = 22892/30000 | Total reward = 48.07
2022-01-26 14:18:17.500 | DEBUG    | __main__:trials:24 - Trial = 22893/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.502 | DEBUG    | __main__:trials:29 - Trial = 22893/30000 | Total reward = 40.96
2022-01-26 14:18:17.505 | DEBUG    | __main__:trials:24 - Trial = 22894/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.507 | DEBUG    | __main__:trials:29 - Trial = 22894/30000 | Total reward = 50.45
2022-01-26 14:18:17.511 | DEBUG    | __main__:trials:24 - Trial = 22895/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.512 | DEBUG    | __main__:trials:29 - Trial = 22895/30000 | Total reward = 57.64
2022-01-26 14:18:17.516 | DEBUG    | __main__:trials:24 - Trial = 22896/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.518 | DEBUG    | __main__:trials:29 - Trial = 22896/30000 | Total reward = 45.32
2022-01-26 14:18:17.521 | DEBUG    | __main__:trials:24 - Trial = 22897/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.522 | DEBUG    | __main__:trials:29 - Trial = 22897/30000 | Total reward = 45.21
2022-01-26 14:18:17.526 | DEBUG    | __main__:trials:24 - Trial = 22898/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.528 | DEBUG    | __main__:trials:29 - Trial = 22898/30000 | Total reward = 46.64
2022-01-26 14:18:17.531 | DEBUG    | __main__:trials:24 - Trial = 22899/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.533 | DEBUG    | __main__:trials:29 - Trial = 22899/30000 | Total reward = 46.38
2022-01-26 14:18:17.536 | DEBUG    | __main__:trials:24 - Trial = 22900/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.537 | DEBUG    | __main__:trials:29 - Trial = 22900/30000 | Total reward = 45.94
2022-01-26 14:18:17.542 | DEBUG    | __main__:trials:24 - Trial = 22901/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.542 | DEBUG    | __main__:trials:29 - Trial = 22901/30000 | Total reward = 62.16
2022-01-26 14:18:17.546 | DEBUG    | __main__:trials:24 - Trial = 22902/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.548 | DEBUG    | __main__:trials:29 - Trial = 22902/30000 | Total reward = 44.69
2022-01-26 14:18:17.551 | DEBUG    | __main__:trials:24 - Trial = 22903/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.553 | DEBUG    | __main__:trials:29 - Trial = 22903/30000 | Total reward = 48.63
2022-01-26 14:18:17.555 | DEBUG    | __main__:trials:26 - Trial = 22904/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.557 | DEBUG    | __main__:trials:29 - Trial = 22904/30000 | Total reward = 19.80
2022-01-26 14:18:17.561 | DEBUG    | __main__:trials:24 - Trial = 22905/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.562 | DEBUG    | __main__:trials:29 - Trial = 22905/30000 | Total reward = 33.36
2022-01-26 14:18:17.565 | DEBUG    | __main__:trials:24 - Trial = 22906/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.566 | DEBUG    | __main__:trials:29 - Trial = 22906/30000 | Total reward = 27.38
2022-01-26 14:18:17.571 | DEBUG    | __main__:trials:24 - Trial = 22907/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.572 | DEBUG    | __main__:trials:29 - Trial = 22907/30000 | Total reward = 47.19
2022-01-26 14:18:17.576 | DEBUG    | __main__:trials:24 - Trial = 22908/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.577 | DEBUG    | __main__:trials:29 - Trial = 22908/30000 | Total reward = 27.52
2022-01-26 14:18:17.582 | DEBUG    | __main__:trials:24 - Trial = 22909/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.582 | DEBUG    | __main__:trials:29 - Trial = 22909/30000 | Total reward = 46.92
2022-01-26 14:18:17.586 | DEBUG    | __main__:trials:24 - Trial = 22910/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.588 | DEBUG    | __main__:trials:29 - Trial = 22910/30000 | Total reward = 41.80
2022-01-26 14:18:17.592 | DEBUG    | __main__:trials:24 - Trial = 22911/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.593 | DEBUG    | __main__:trials:29 - Trial = 22911/30000 | Total reward = 55.52
2022-01-26 14:18:17.597 | DEBUG    | __main__:trials:24 - Trial = 22912/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.599 | DEBUG    | __main__:trials:29 - Trial = 22912/30000 | Total reward = 47.10
2022-01-26 14:18:17.602 | DEBUG    | __main__:trials:24 - Trial = 22913/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.603 | DEBUG    | __main__:trials:29 - Trial = 22913/30000 | Total reward = 37.05
2022-01-26 14:18:17.606 | DEBUG    | __main__:trials:24 - Trial = 22914/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.608 | DEBUG    | __main__:trials:29 - Trial = 22914/30000 | Total reward = 43.96
2022-01-26 14:18:17.612 | DEBUG    | __main__:trials:24 - Trial = 22915/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.613 | DEBUG    | __main__:trials:29 - Trial = 22915/30000 | Total reward = 52.91
2022-01-26 14:18:17.617 | DEBUG    | __main__:trials:24 - Trial = 22916/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.619 | DEBUG    | __main__:trials:29 - Trial = 22916/30000 | Total reward = 30.34
2022-01-26 14:18:17.623 | DEBUG    | __main__:trials:24 - Trial = 22917/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.624 | DEBUG    | __main__:trials:29 - Trial = 22917/30000 | Total reward = 41.26
2022-01-26 14:18:17.627 | DEBUG    | __main__:trials:24 - Trial = 22918/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.629 | DEBUG    | __main__:trials:29 - Trial = 22918/30000 | Total reward = 45.76
2022-01-26 14:18:17.633 | DEBUG    | __main__:trials:24 - Trial = 22919/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.634 | DEBUG    | __main__:trials:29 - Trial = 22919/30000 | Total reward = 61.46
2022-01-26 14:18:17.638 | DEBUG    | __main__:trials:24 - Trial = 22920/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.639 | DEBUG    | __main__:trials:29 - Trial = 22920/30000 | Total reward = 48.50
2022-01-26 14:18:17.642 | DEBUG    | __main__:trials:26 - Trial = 22921/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.644 | DEBUG    | __main__:trials:29 - Trial = 22921/30000 | Total reward = 13.17
2022-01-26 14:18:17.648 | DEBUG    | __main__:trials:24 - Trial = 22922/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.649 | DEBUG    | __main__:trials:29 - Trial = 22922/30000 | Total reward = 35.63
2022-01-26 14:18:17.653 | DEBUG    | __main__:trials:26 - Trial = 22923/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.654 | DEBUG    | __main__:trials:29 - Trial = 22923/30000 | Total reward = 26.72
2022-01-26 14:18:17.658 | DEBUG    | __main__:trials:24 - Trial = 22924/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.659 | DEBUG    | __main__:trials:29 - Trial = 22924/30000 | Total reward = 52.23
2022-01-26 14:18:17.663 | DEBUG    | __main__:trials:24 - Trial = 22925/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.664 | DEBUG    | __main__:trials:29 - Trial = 22925/30000 | Total reward = 40.94
2022-01-26 14:18:17.668 | DEBUG    | __main__:trials:24 - Trial = 22926/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.670 | DEBUG    | __main__:trials:29 - Trial = 22926/30000 | Total reward = 35.77
2022-01-26 14:18:17.673 | DEBUG    | __main__:trials:24 - Trial = 22927/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.675 | DEBUG    | __main__:trials:29 - Trial = 22927/30000 | Total reward = 55.06
2022-01-26 14:18:17.679 | DEBUG    | __main__:trials:24 - Trial = 22928/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.680 | DEBUG    | __main__:trials:29 - Trial = 22928/30000 | Total reward = 39.93
2022-01-26 14:18:17.684 | DEBUG    | __main__:trials:26 - Trial = 22929/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.685 | DEBUG    | __main__:trials:29 - Trial = 22929/30000 | Total reward = 36.49
2022-01-26 14:18:17.690 | DEBUG    | __main__:trials:24 - Trial = 22930/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.691 | DEBUG    | __main__:trials:29 - Trial = 22930/30000 | Total reward = 37.49
2022-01-26 14:18:17.695 | DEBUG    | __main__:trials:24 - Trial = 22931/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.696 | DEBUG    | __main__:trials:29 - Trial = 22931/30000 | Total reward = 44.70
2022-01-26 14:18:17.700 | DEBUG    | __main__:trials:24 - Trial = 22932/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.701 | DEBUG    | __main__:trials:29 - Trial = 22932/30000 | Total reward = 39.25
2022-01-26 14:18:17.705 | DEBUG    | __main__:trials:24 - Trial = 22933/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.706 | DEBUG    | __main__:trials:29 - Trial = 22933/30000 | Total reward = 38.13
2022-01-26 14:18:17.710 | DEBUG    | __main__:trials:24 - Trial = 22934/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.711 | DEBUG    | __main__:trials:29 - Trial = 22934/30000 | Total reward = 37.81
2022-01-26 14:18:17.716 | DEBUG    | __main__:trials:24 - Trial = 22935/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.717 | DEBUG    | __main__:trials:29 - Trial = 22935/30000 | Total reward = 51.91
2022-01-26 14:18:17.720 | DEBUG    | __main__:trials:24 - Trial = 22936/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.722 | DEBUG    | __main__:trials:29 - Trial = 22936/30000 | Total reward = 41.94
2022-01-26 14:18:17.726 | DEBUG    | __main__:trials:24 - Trial = 22937/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.727 | DEBUG    | __main__:trials:29 - Trial = 22937/30000 | Total reward = 50.16
2022-01-26 14:18:17.731 | DEBUG    | __main__:trials:24 - Trial = 22938/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.733 | DEBUG    | __main__:trials:29 - Trial = 22938/30000 | Total reward = 56.09
2022-01-26 14:18:17.736 | DEBUG    | __main__:trials:24 - Trial = 22939/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.737 | DEBUG    | __main__:trials:29 - Trial = 22939/30000 | Total reward = 34.91
2022-01-26 14:18:17.741 | DEBUG    | __main__:trials:24 - Trial = 22940/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.741 | DEBUG    | __main__:trials:29 - Trial = 22940/30000 | Total reward = 51.36
2022-01-26 14:18:17.745 | DEBUG    | __main__:trials:24 - Trial = 22941/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.746 | DEBUG    | __main__:trials:29 - Trial = 22941/30000 | Total reward = 49.99
2022-01-26 14:18:17.750 | DEBUG    | __main__:trials:24 - Trial = 22942/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.752 | DEBUG    | __main__:trials:29 - Trial = 22942/30000 | Total reward = 37.04
2022-01-26 14:18:17.755 | DEBUG    | __main__:trials:24 - Trial = 22943/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.757 | DEBUG    | __main__:trials:29 - Trial = 22943/30000 | Total reward = 35.42
2022-01-26 14:18:17.760 | DEBUG    | __main__:trials:24 - Trial = 22944/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.762 | DEBUG    | __main__:trials:29 - Trial = 22944/30000 | Total reward = 49.76
2022-01-26 14:18:17.766 | DEBUG    | __main__:trials:24 - Trial = 22945/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.767 | DEBUG    | __main__:trials:29 - Trial = 22945/30000 | Total reward = 50.68
2022-01-26 14:18:17.771 | DEBUG    | __main__:trials:24 - Trial = 22946/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.771 | DEBUG    | __main__:trials:29 - Trial = 22946/30000 | Total reward = 52.22
2022-01-26 14:18:17.775 | DEBUG    | __main__:trials:24 - Trial = 22947/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.776 | DEBUG    | __main__:trials:29 - Trial = 22947/30000 | Total reward = 39.86
2022-01-26 14:18:17.780 | DEBUG    | __main__:trials:24 - Trial = 22948/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.782 | DEBUG    | __main__:trials:29 - Trial = 22948/30000 | Total reward = 29.02
2022-01-26 14:18:17.785 | DEBUG    | __main__:trials:24 - Trial = 22949/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.786 | DEBUG    | __main__:trials:29 - Trial = 22949/30000 | Total reward = 47.05
2022-01-26 14:18:17.790 | DEBUG    | __main__:trials:24 - Trial = 22950/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.791 | DEBUG    | __main__:trials:29 - Trial = 22950/30000 | Total reward = 46.64
2022-01-26 14:18:17.794 | DEBUG    | __main__:trials:24 - Trial = 22951/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.795 | DEBUG    | __main__:trials:29 - Trial = 22951/30000 | Total reward = 39.80
2022-01-26 14:18:17.798 | DEBUG    | __main__:trials:24 - Trial = 22952/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.800 | DEBUG    | __main__:trials:29 - Trial = 22952/30000 | Total reward = 26.59
2022-01-26 14:18:17.803 | DEBUG    | __main__:trials:24 - Trial = 22953/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.804 | DEBUG    | __main__:trials:29 - Trial = 22953/30000 | Total reward = 44.37
2022-01-26 14:18:17.807 | DEBUG    | __main__:trials:24 - Trial = 22954/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.809 | DEBUG    | __main__:trials:29 - Trial = 22954/30000 | Total reward = 31.99
2022-01-26 14:18:17.812 | DEBUG    | __main__:trials:24 - Trial = 22955/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.812 | DEBUG    | __main__:trials:29 - Trial = 22955/30000 | Total reward = 44.38
2022-01-26 14:18:17.816 | DEBUG    | __main__:trials:24 - Trial = 22956/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.818 | DEBUG    | __main__:trials:29 - Trial = 22956/30000 | Total reward = 44.83
2022-01-26 14:18:17.821 | DEBUG    | __main__:trials:24 - Trial = 22957/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.821 | DEBUG    | __main__:trials:29 - Trial = 22957/30000 | Total reward = 44.21
2022-01-26 14:18:17.825 | DEBUG    | __main__:trials:24 - Trial = 22958/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.826 | DEBUG    | __main__:trials:29 - Trial = 22958/30000 | Total reward = 48.80
2022-01-26 14:18:17.829 | DEBUG    | __main__:trials:24 - Trial = 22959/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.831 | DEBUG    | __main__:trials:29 - Trial = 22959/30000 | Total reward = 49.83
2022-01-26 14:18:17.834 | DEBUG    | __main__:trials:24 - Trial = 22960/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.834 | DEBUG    | __main__:trials:29 - Trial = 22960/30000 | Total reward = 55.41
2022-01-26 14:18:17.838 | DEBUG    | __main__:trials:24 - Trial = 22961/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.839 | DEBUG    | __main__:trials:29 - Trial = 22961/30000 | Total reward = 37.45
2022-01-26 14:18:17.842 | DEBUG    | __main__:trials:24 - Trial = 22962/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.843 | DEBUG    | __main__:trials:29 - Trial = 22962/30000 | Total reward = 49.69
2022-01-26 14:18:17.846 | DEBUG    | __main__:trials:24 - Trial = 22963/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.848 | DEBUG    | __main__:trials:29 - Trial = 22963/30000 | Total reward = 37.12
2022-01-26 14:18:17.851 | DEBUG    | __main__:trials:24 - Trial = 22964/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.852 | DEBUG    | __main__:trials:29 - Trial = 22964/30000 | Total reward = 52.30
2022-01-26 14:18:17.855 | DEBUG    | __main__:trials:24 - Trial = 22965/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.856 | DEBUG    | __main__:trials:29 - Trial = 22965/30000 | Total reward = 38.28
2022-01-26 14:18:17.860 | DEBUG    | __main__:trials:24 - Trial = 22966/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.861 | DEBUG    | __main__:trials:29 - Trial = 22966/30000 | Total reward = 35.04
2022-01-26 14:18:17.864 | DEBUG    | __main__:trials:24 - Trial = 22967/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.866 | DEBUG    | __main__:trials:29 - Trial = 22967/30000 | Total reward = 62.12
2022-01-26 14:18:17.869 | DEBUG    | __main__:trials:26 - Trial = 22968/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:17.871 | DEBUG    | __main__:trials:29 - Trial = 22968/30000 | Total reward = 15.64
2022-01-26 14:18:17.873 | DEBUG    | __main__:trials:24 - Trial = 22969/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.875 | DEBUG    | __main__:trials:29 - Trial = 22969/30000 | Total reward = 52.53
2022-01-26 14:18:17.877 | DEBUG    | __main__:trials:24 - Trial = 22970/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.878 | DEBUG    | __main__:trials:29 - Trial = 22970/30000 | Total reward = 39.31
2022-01-26 14:18:17.881 | DEBUG    | __main__:trials:24 - Trial = 22971/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.882 | DEBUG    | __main__:trials:29 - Trial = 22971/30000 | Total reward = 27.43
2022-01-26 14:18:17.885 | DEBUG    | __main__:trials:24 - Trial = 22972/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.887 | DEBUG    | __main__:trials:29 - Trial = 22972/30000 | Total reward = 52.05
2022-01-26 14:18:17.890 | DEBUG    | __main__:trials:24 - Trial = 22973/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.891 | DEBUG    | __main__:trials:29 - Trial = 22973/30000 | Total reward = 55.95
2022-01-26 14:18:17.895 | DEBUG    | __main__:trials:24 - Trial = 22974/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.895 | DEBUG    | __main__:trials:29 - Trial = 22974/30000 | Total reward = 45.90
2022-01-26 14:18:17.898 | DEBUG    | __main__:trials:24 - Trial = 22975/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.899 | DEBUG    | __main__:trials:29 - Trial = 22975/30000 | Total reward = 50.78
2022-01-26 14:18:17.902 | DEBUG    | __main__:trials:24 - Trial = 22976/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.904 | DEBUG    | __main__:trials:29 - Trial = 22976/30000 | Total reward = 32.46
2022-01-26 14:18:17.908 | DEBUG    | __main__:trials:24 - Trial = 22977/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.910 | DEBUG    | __main__:trials:29 - Trial = 22977/30000 | Total reward = 36.57
2022-01-26 14:18:17.913 | DEBUG    | __main__:trials:24 - Trial = 22978/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.914 | DEBUG    | __main__:trials:29 - Trial = 22978/30000 | Total reward = 58.96
2022-01-26 14:18:17.917 | DEBUG    | __main__:trials:24 - Trial = 22979/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.918 | DEBUG    | __main__:trials:29 - Trial = 22979/30000 | Total reward = 26.92
2022-01-26 14:18:17.921 | DEBUG    | __main__:trials:24 - Trial = 22980/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.922 | DEBUG    | __main__:trials:29 - Trial = 22980/30000 | Total reward = 36.55
2022-01-26 14:18:17.926 | DEBUG    | __main__:trials:24 - Trial = 22981/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.928 | DEBUG    | __main__:trials:29 - Trial = 22981/30000 | Total reward = 35.71
2022-01-26 14:18:17.931 | DEBUG    | __main__:trials:24 - Trial = 22982/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.933 | DEBUG    | __main__:trials:29 - Trial = 22982/30000 | Total reward = 49.68
2022-01-26 14:18:17.935 | DEBUG    | __main__:trials:24 - Trial = 22983/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.937 | DEBUG    | __main__:trials:29 - Trial = 22983/30000 | Total reward = 50.71
2022-01-26 14:18:17.941 | DEBUG    | __main__:trials:24 - Trial = 22984/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.943 | DEBUG    | __main__:trials:29 - Trial = 22984/30000 | Total reward = 50.09
2022-01-26 14:18:17.947 | DEBUG    | __main__:trials:24 - Trial = 22985/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.949 | DEBUG    | __main__:trials:29 - Trial = 22985/30000 | Total reward = 51.15
2022-01-26 14:18:17.952 | DEBUG    | __main__:trials:24 - Trial = 22986/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.953 | DEBUG    | __main__:trials:29 - Trial = 22986/30000 | Total reward = 37.68
2022-01-26 14:18:17.957 | DEBUG    | __main__:trials:24 - Trial = 22987/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.959 | DEBUG    | __main__:trials:29 - Trial = 22987/30000 | Total reward = 58.36
2022-01-26 14:18:17.963 | DEBUG    | __main__:trials:24 - Trial = 22988/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.964 | DEBUG    | __main__:trials:29 - Trial = 22988/30000 | Total reward = 50.06
2022-01-26 14:18:17.968 | DEBUG    | __main__:trials:24 - Trial = 22989/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.969 | DEBUG    | __main__:trials:29 - Trial = 22989/30000 | Total reward = 31.54
2022-01-26 14:18:17.972 | DEBUG    | __main__:trials:24 - Trial = 22990/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.974 | DEBUG    | __main__:trials:29 - Trial = 22990/30000 | Total reward = 40.18
2022-01-26 14:18:17.977 | DEBUG    | __main__:trials:24 - Trial = 22991/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.979 | DEBUG    | __main__:trials:29 - Trial = 22991/30000 | Total reward = 44.10
2022-01-26 14:18:17.982 | DEBUG    | __main__:trials:24 - Trial = 22992/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.983 | DEBUG    | __main__:trials:29 - Trial = 22992/30000 | Total reward = 42.65
2022-01-26 14:18:17.987 | DEBUG    | __main__:trials:24 - Trial = 22993/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.988 | DEBUG    | __main__:trials:29 - Trial = 22993/30000 | Total reward = 47.17
2022-01-26 14:18:17.991 | DEBUG    | __main__:trials:24 - Trial = 22994/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.992 | DEBUG    | __main__:trials:29 - Trial = 22994/30000 | Total reward = 54.20
2022-01-26 14:18:17.996 | DEBUG    | __main__:trials:24 - Trial = 22995/30000 | Max number of steps (20) reached
2022-01-26 14:18:17.997 | DEBUG    | __main__:trials:29 - Trial = 22995/30000 | Total reward = 63.76
2022-01-26 14:18:18.000 | DEBUG    | __main__:trials:24 - Trial = 22996/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.001 | DEBUG    | __main__:trials:29 - Trial = 22996/30000 | Total reward = 47.80
2022-01-26 14:18:18.005 | DEBUG    | __main__:trials:24 - Trial = 22997/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.005 | DEBUG    | __main__:trials:29 - Trial = 22997/30000 | Total reward = 38.14
2022-01-26 14:18:18.009 | DEBUG    | __main__:trials:24 - Trial = 22998/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.009 | DEBUG    | __main__:trials:29 - Trial = 22998/30000 | Total reward = 37.44
2022-01-26 14:18:18.014 | DEBUG    | __main__:trials:24 - Trial = 22999/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.016 | DEBUG    | __main__:trials:29 - Trial = 22999/30000 | Total reward = 36.27
2022-01-26 14:18:18.020 | DEBUG    | __main__:trials:24 - Trial = 23000/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.021 | DEBUG    | __main__:trials:29 - Trial = 23000/30000 | Total reward = 51.47
2022-01-26 14:18:18.025 | DEBUG    | __main__:trials:24 - Trial = 23001/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.027 | DEBUG    | __main__:trials:29 - Trial = 23001/30000 | Total reward = 46.95
2022-01-26 14:18:18.030 | DEBUG    | __main__:trials:24 - Trial = 23002/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.031 | DEBUG    | __main__:trials:29 - Trial = 23002/30000 | Total reward = 46.71
2022-01-26 14:18:18.036 | DEBUG    | __main__:trials:24 - Trial = 23003/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.037 | DEBUG    | __main__:trials:29 - Trial = 23003/30000 | Total reward = 44.92
2022-01-26 14:18:18.041 | DEBUG    | __main__:trials:24 - Trial = 23004/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.043 | DEBUG    | __main__:trials:29 - Trial = 23004/30000 | Total reward = 56.29
2022-01-26 14:18:18.046 | DEBUG    | __main__:trials:24 - Trial = 23005/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.047 | DEBUG    | __main__:trials:29 - Trial = 23005/30000 | Total reward = 46.56
2022-01-26 14:18:18.051 | DEBUG    | __main__:trials:24 - Trial = 23006/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.052 | DEBUG    | __main__:trials:29 - Trial = 23006/30000 | Total reward = 42.04
2022-01-26 14:18:18.056 | DEBUG    | __main__:trials:24 - Trial = 23007/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.058 | DEBUG    | __main__:trials:29 - Trial = 23007/30000 | Total reward = 48.05
2022-01-26 14:18:18.062 | DEBUG    | __main__:trials:24 - Trial = 23008/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.063 | DEBUG    | __main__:trials:29 - Trial = 23008/30000 | Total reward = 40.02
2022-01-26 14:18:18.067 | DEBUG    | __main__:trials:24 - Trial = 23009/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.068 | DEBUG    | __main__:trials:29 - Trial = 23009/30000 | Total reward = 39.08
2022-01-26 14:18:18.072 | DEBUG    | __main__:trials:24 - Trial = 23010/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.073 | DEBUG    | __main__:trials:29 - Trial = 23010/30000 | Total reward = 32.25
2022-01-26 14:18:18.077 | DEBUG    | __main__:trials:24 - Trial = 23011/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.078 | DEBUG    | __main__:trials:29 - Trial = 23011/30000 | Total reward = 38.68
2022-01-26 14:18:18.081 | DEBUG    | __main__:trials:24 - Trial = 23012/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.082 | DEBUG    | __main__:trials:29 - Trial = 23012/30000 | Total reward = 40.05
2022-01-26 14:18:18.085 | DEBUG    | __main__:trials:24 - Trial = 23013/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.087 | DEBUG    | __main__:trials:29 - Trial = 23013/30000 | Total reward = 29.28
2022-01-26 14:18:18.090 | DEBUG    | __main__:trials:24 - Trial = 23014/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.091 | DEBUG    | __main__:trials:29 - Trial = 23014/30000 | Total reward = 39.73
2022-01-26 14:18:18.095 | DEBUG    | __main__:trials:24 - Trial = 23015/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.096 | DEBUG    | __main__:trials:29 - Trial = 23015/30000 | Total reward = 36.24
2022-01-26 14:18:18.100 | DEBUG    | __main__:trials:24 - Trial = 23016/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.101 | DEBUG    | __main__:trials:29 - Trial = 23016/30000 | Total reward = 33.42
2022-01-26 14:18:18.104 | DEBUG    | __main__:trials:24 - Trial = 23017/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.106 | DEBUG    | __main__:trials:29 - Trial = 23017/30000 | Total reward = 43.05
2022-01-26 14:18:18.109 | DEBUG    | __main__:trials:24 - Trial = 23018/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.109 | DEBUG    | __main__:trials:29 - Trial = 23018/30000 | Total reward = 40.57
2022-01-26 14:18:18.113 | DEBUG    | __main__:trials:24 - Trial = 23019/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.114 | DEBUG    | __main__:trials:29 - Trial = 23019/30000 | Total reward = 46.29
2022-01-26 14:18:18.117 | DEBUG    | __main__:trials:24 - Trial = 23020/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.119 | DEBUG    | __main__:trials:29 - Trial = 23020/30000 | Total reward = 35.84
2022-01-26 14:18:18.123 | DEBUG    | __main__:trials:24 - Trial = 23021/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.124 | DEBUG    | __main__:trials:29 - Trial = 23021/30000 | Total reward = 42.77
2022-01-26 14:18:18.128 | DEBUG    | __main__:trials:26 - Trial = 23022/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.130 | DEBUG    | __main__:trials:29 - Trial = 23022/30000 | Total reward = 26.56
2022-01-26 14:18:18.134 | DEBUG    | __main__:trials:24 - Trial = 23023/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.134 | DEBUG    | __main__:trials:29 - Trial = 23023/30000 | Total reward = 48.26
2022-01-26 14:18:18.139 | DEBUG    | __main__:trials:24 - Trial = 23024/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.140 | DEBUG    | __main__:trials:29 - Trial = 23024/30000 | Total reward = 39.07
2022-01-26 14:18:18.144 | DEBUG    | __main__:trials:24 - Trial = 23025/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.146 | DEBUG    | __main__:trials:29 - Trial = 23025/30000 | Total reward = 43.96
2022-01-26 14:18:18.150 | DEBUG    | __main__:trials:24 - Trial = 23026/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.151 | DEBUG    | __main__:trials:29 - Trial = 23026/30000 | Total reward = 44.53
2022-01-26 14:18:18.155 | DEBUG    | __main__:trials:24 - Trial = 23027/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.155 | DEBUG    | __main__:trials:29 - Trial = 23027/30000 | Total reward = 45.67
2022-01-26 14:18:18.160 | DEBUG    | __main__:trials:24 - Trial = 23028/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.161 | DEBUG    | __main__:trials:29 - Trial = 23028/30000 | Total reward = 53.00
2022-01-26 14:18:18.164 | DEBUG    | __main__:trials:24 - Trial = 23029/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.166 | DEBUG    | __main__:trials:29 - Trial = 23029/30000 | Total reward = 34.06
2022-01-26 14:18:18.170 | DEBUG    | __main__:trials:24 - Trial = 23030/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.171 | DEBUG    | __main__:trials:29 - Trial = 23030/30000 | Total reward = 54.15
2022-01-26 14:18:18.175 | DEBUG    | __main__:trials:24 - Trial = 23031/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.177 | DEBUG    | __main__:trials:29 - Trial = 23031/30000 | Total reward = 37.00
2022-01-26 14:18:18.181 | DEBUG    | __main__:trials:24 - Trial = 23032/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.182 | DEBUG    | __main__:trials:29 - Trial = 23032/30000 | Total reward = 35.33
2022-01-26 14:18:18.186 | DEBUG    | __main__:trials:24 - Trial = 23033/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.188 | DEBUG    | __main__:trials:29 - Trial = 23033/30000 | Total reward = 61.74
2022-01-26 14:18:18.191 | DEBUG    | __main__:trials:24 - Trial = 23034/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.192 | DEBUG    | __main__:trials:29 - Trial = 23034/30000 | Total reward = 46.85
2022-01-26 14:18:18.196 | DEBUG    | __main__:trials:24 - Trial = 23035/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.197 | DEBUG    | __main__:trials:29 - Trial = 23035/30000 | Total reward = 39.15
2022-01-26 14:18:18.200 | DEBUG    | __main__:trials:24 - Trial = 23036/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.202 | DEBUG    | __main__:trials:29 - Trial = 23036/30000 | Total reward = 42.77
2022-01-26 14:18:18.205 | DEBUG    | __main__:trials:26 - Trial = 23037/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.206 | DEBUG    | __main__:trials:29 - Trial = 23037/30000 | Total reward = 40.61
2022-01-26 14:18:18.209 | DEBUG    | __main__:trials:26 - Trial = 23038/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.211 | DEBUG    | __main__:trials:29 - Trial = 23038/30000 | Total reward = 27.01
2022-01-26 14:18:18.214 | DEBUG    | __main__:trials:24 - Trial = 23039/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.216 | DEBUG    | __main__:trials:29 - Trial = 23039/30000 | Total reward = 49.47
2022-01-26 14:18:18.219 | DEBUG    | __main__:trials:24 - Trial = 23040/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.219 | DEBUG    | __main__:trials:29 - Trial = 23040/30000 | Total reward = 44.98
2022-01-26 14:18:18.223 | DEBUG    | __main__:trials:24 - Trial = 23041/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.225 | DEBUG    | __main__:trials:29 - Trial = 23041/30000 | Total reward = 44.06
2022-01-26 14:18:18.228 | DEBUG    | __main__:trials:24 - Trial = 23042/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.230 | DEBUG    | __main__:trials:29 - Trial = 23042/30000 | Total reward = 41.33
2022-01-26 14:18:18.233 | DEBUG    | __main__:trials:24 - Trial = 23043/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.234 | DEBUG    | __main__:trials:29 - Trial = 23043/30000 | Total reward = 38.46
2022-01-26 14:18:18.237 | DEBUG    | __main__:trials:24 - Trial = 23044/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.238 | DEBUG    | __main__:trials:29 - Trial = 23044/30000 | Total reward = 38.26
2022-01-26 14:18:18.242 | DEBUG    | __main__:trials:24 - Trial = 23045/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.243 | DEBUG    | __main__:trials:29 - Trial = 23045/30000 | Total reward = 49.99
2022-01-26 14:18:18.246 | DEBUG    | __main__:trials:24 - Trial = 23046/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.247 | DEBUG    | __main__:trials:29 - Trial = 23046/30000 | Total reward = 55.75
2022-01-26 14:18:18.250 | DEBUG    | __main__:trials:24 - Trial = 23047/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.252 | DEBUG    | __main__:trials:29 - Trial = 23047/30000 | Total reward = 41.37
2022-01-26 14:18:18.255 | DEBUG    | __main__:trials:24 - Trial = 23048/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.257 | DEBUG    | __main__:trials:29 - Trial = 23048/30000 | Total reward = 39.90
2022-01-26 14:18:18.260 | DEBUG    | __main__:trials:24 - Trial = 23049/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.260 | DEBUG    | __main__:trials:29 - Trial = 23049/30000 | Total reward = 42.81
2022-01-26 14:18:18.264 | DEBUG    | __main__:trials:26 - Trial = 23050/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.264 | DEBUG    | __main__:trials:29 - Trial = 23050/30000 | Total reward = 32.38
2022-01-26 14:18:18.268 | DEBUG    | __main__:trials:24 - Trial = 23051/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.269 | DEBUG    | __main__:trials:29 - Trial = 23051/30000 | Total reward = 40.13
2022-01-26 14:18:18.273 | DEBUG    | __main__:trials:24 - Trial = 23052/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.274 | DEBUG    | __main__:trials:29 - Trial = 23052/30000 | Total reward = 47.65
2022-01-26 14:18:18.277 | DEBUG    | __main__:trials:24 - Trial = 23053/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.278 | DEBUG    | __main__:trials:29 - Trial = 23053/30000 | Total reward = 39.97
2022-01-26 14:18:18.281 | DEBUG    | __main__:trials:24 - Trial = 23054/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.282 | DEBUG    | __main__:trials:29 - Trial = 23054/30000 | Total reward = 35.15
2022-01-26 14:18:18.284 | DEBUG    | __main__:trials:26 - Trial = 23055/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.285 | DEBUG    | __main__:trials:29 - Trial = 23055/30000 | Total reward = 17.27
2022-01-26 14:18:18.289 | DEBUG    | __main__:trials:24 - Trial = 23056/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.290 | DEBUG    | __main__:trials:29 - Trial = 23056/30000 | Total reward = 23.64
2022-01-26 14:18:18.293 | DEBUG    | __main__:trials:24 - Trial = 23057/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.294 | DEBUG    | __main__:trials:29 - Trial = 23057/30000 | Total reward = 49.20
2022-01-26 14:18:18.297 | DEBUG    | __main__:trials:24 - Trial = 23058/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.298 | DEBUG    | __main__:trials:29 - Trial = 23058/30000 | Total reward = 37.38
2022-01-26 14:18:18.302 | DEBUG    | __main__:trials:24 - Trial = 23059/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.303 | DEBUG    | __main__:trials:29 - Trial = 23059/30000 | Total reward = 38.62
2022-01-26 14:18:18.306 | DEBUG    | __main__:trials:24 - Trial = 23060/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.307 | DEBUG    | __main__:trials:29 - Trial = 23060/30000 | Total reward = 50.38
2022-01-26 14:18:18.311 | DEBUG    | __main__:trials:24 - Trial = 23061/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.311 | DEBUG    | __main__:trials:29 - Trial = 23061/30000 | Total reward = 53.14
2022-01-26 14:18:18.315 | DEBUG    | __main__:trials:24 - Trial = 23062/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.317 | DEBUG    | __main__:trials:29 - Trial = 23062/30000 | Total reward = 48.98
2022-01-26 14:18:18.320 | DEBUG    | __main__:trials:24 - Trial = 23063/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.321 | DEBUG    | __main__:trials:29 - Trial = 23063/30000 | Total reward = 45.81
2022-01-26 14:18:18.324 | DEBUG    | __main__:trials:24 - Trial = 23064/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.326 | DEBUG    | __main__:trials:29 - Trial = 23064/30000 | Total reward = 42.77
2022-01-26 14:18:18.329 | DEBUG    | __main__:trials:24 - Trial = 23065/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.329 | DEBUG    | __main__:trials:29 - Trial = 23065/30000 | Total reward = 48.95
2022-01-26 14:18:18.332 | DEBUG    | __main__:trials:24 - Trial = 23066/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.333 | DEBUG    | __main__:trials:29 - Trial = 23066/30000 | Total reward = 35.55
2022-01-26 14:18:18.337 | DEBUG    | __main__:trials:24 - Trial = 23067/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.338 | DEBUG    | __main__:trials:29 - Trial = 23067/30000 | Total reward = 44.96
2022-01-26 14:18:18.341 | DEBUG    | __main__:trials:24 - Trial = 23068/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.343 | DEBUG    | __main__:trials:29 - Trial = 23068/30000 | Total reward = 36.00
2022-01-26 14:18:18.346 | DEBUG    | __main__:trials:24 - Trial = 23069/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.348 | DEBUG    | __main__:trials:29 - Trial = 23069/30000 | Total reward = 65.73
2022-01-26 14:18:18.350 | DEBUG    | __main__:trials:26 - Trial = 23070/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.351 | DEBUG    | __main__:trials:29 - Trial = 23070/30000 | Total reward = 19.13
2022-01-26 14:18:18.355 | DEBUG    | __main__:trials:24 - Trial = 23071/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.355 | DEBUG    | __main__:trials:29 - Trial = 23071/30000 | Total reward = 47.25
2022-01-26 14:18:18.359 | DEBUG    | __main__:trials:24 - Trial = 23072/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.360 | DEBUG    | __main__:trials:29 - Trial = 23072/30000 | Total reward = 50.09
2022-01-26 14:18:18.363 | DEBUG    | __main__:trials:24 - Trial = 23073/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.366 | DEBUG    | __main__:trials:29 - Trial = 23073/30000 | Total reward = 52.26
2022-01-26 14:18:18.369 | DEBUG    | __main__:trials:24 - Trial = 23074/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.369 | DEBUG    | __main__:trials:29 - Trial = 23074/30000 | Total reward = 42.66
2022-01-26 14:18:18.373 | DEBUG    | __main__:trials:24 - Trial = 23075/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.374 | DEBUG    | __main__:trials:29 - Trial = 23075/30000 | Total reward = 48.20
2022-01-26 14:18:18.377 | DEBUG    | __main__:trials:24 - Trial = 23076/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.378 | DEBUG    | __main__:trials:29 - Trial = 23076/30000 | Total reward = 49.03
2022-01-26 14:18:18.381 | DEBUG    | __main__:trials:24 - Trial = 23077/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.383 | DEBUG    | __main__:trials:29 - Trial = 23077/30000 | Total reward = 48.15
2022-01-26 14:18:18.387 | DEBUG    | __main__:trials:24 - Trial = 23078/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.388 | DEBUG    | __main__:trials:29 - Trial = 23078/30000 | Total reward = 51.32
2022-01-26 14:18:18.392 | DEBUG    | __main__:trials:24 - Trial = 23079/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.393 | DEBUG    | __main__:trials:29 - Trial = 23079/30000 | Total reward = 26.82
2022-01-26 14:18:18.396 | DEBUG    | __main__:trials:24 - Trial = 23080/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.398 | DEBUG    | __main__:trials:29 - Trial = 23080/30000 | Total reward = 23.58
2022-01-26 14:18:18.401 | DEBUG    | __main__:trials:24 - Trial = 23081/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.402 | DEBUG    | __main__:trials:29 - Trial = 23081/30000 | Total reward = 29.69
2022-01-26 14:18:18.405 | DEBUG    | __main__:trials:24 - Trial = 23082/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.406 | DEBUG    | __main__:trials:29 - Trial = 23082/30000 | Total reward = 39.90
2022-01-26 14:18:18.409 | DEBUG    | __main__:trials:24 - Trial = 23083/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.411 | DEBUG    | __main__:trials:29 - Trial = 23083/30000 | Total reward = 65.27
2022-01-26 14:18:18.414 | DEBUG    | __main__:trials:24 - Trial = 23084/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.416 | DEBUG    | __main__:trials:29 - Trial = 23084/30000 | Total reward = 25.12
2022-01-26 14:18:18.419 | DEBUG    | __main__:trials:24 - Trial = 23085/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.419 | DEBUG    | __main__:trials:29 - Trial = 23085/30000 | Total reward = 45.20
2022-01-26 14:18:18.423 | DEBUG    | __main__:trials:24 - Trial = 23086/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.424 | DEBUG    | __main__:trials:29 - Trial = 23086/30000 | Total reward = 43.28
2022-01-26 14:18:18.427 | DEBUG    | __main__:trials:24 - Trial = 23087/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.428 | DEBUG    | __main__:trials:29 - Trial = 23087/30000 | Total reward = 50.84
2022-01-26 14:18:18.431 | DEBUG    | __main__:trials:24 - Trial = 23088/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.433 | DEBUG    | __main__:trials:29 - Trial = 23088/30000 | Total reward = 50.96
2022-01-26 14:18:18.436 | DEBUG    | __main__:trials:24 - Trial = 23089/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.436 | DEBUG    | __main__:trials:29 - Trial = 23089/30000 | Total reward = 29.56
2022-01-26 14:18:18.440 | DEBUG    | __main__:trials:24 - Trial = 23090/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.441 | DEBUG    | __main__:trials:29 - Trial = 23090/30000 | Total reward = 49.80
2022-01-26 14:18:18.444 | DEBUG    | __main__:trials:24 - Trial = 23091/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.445 | DEBUG    | __main__:trials:29 - Trial = 23091/30000 | Total reward = 32.11
2022-01-26 14:18:18.448 | DEBUG    | __main__:trials:24 - Trial = 23092/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.449 | DEBUG    | __main__:trials:29 - Trial = 23092/30000 | Total reward = 50.91
2022-01-26 14:18:18.453 | DEBUG    | __main__:trials:24 - Trial = 23093/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.453 | DEBUG    | __main__:trials:29 - Trial = 23093/30000 | Total reward = 51.31
2022-01-26 14:18:18.457 | DEBUG    | __main__:trials:24 - Trial = 23094/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.458 | DEBUG    | __main__:trials:29 - Trial = 23094/30000 | Total reward = 50.17
2022-01-26 14:18:18.461 | DEBUG    | __main__:trials:24 - Trial = 23095/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.462 | DEBUG    | __main__:trials:29 - Trial = 23095/30000 | Total reward = 50.84
2022-01-26 14:18:18.466 | DEBUG    | __main__:trials:24 - Trial = 23096/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.467 | DEBUG    | __main__:trials:29 - Trial = 23096/30000 | Total reward = 54.30
2022-01-26 14:18:18.471 | DEBUG    | __main__:trials:24 - Trial = 23097/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.471 | DEBUG    | __main__:trials:29 - Trial = 23097/30000 | Total reward = 48.74
2022-01-26 14:18:18.475 | DEBUG    | __main__:trials:24 - Trial = 23098/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.477 | DEBUG    | __main__:trials:29 - Trial = 23098/30000 | Total reward = 40.01
2022-01-26 14:18:18.480 | DEBUG    | __main__:trials:24 - Trial = 23099/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.481 | DEBUG    | __main__:trials:29 - Trial = 23099/30000 | Total reward = 54.85
2022-01-26 14:18:18.484 | DEBUG    | __main__:trials:24 - Trial = 23100/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.485 | DEBUG    | __main__:trials:29 - Trial = 23100/30000 | Total reward = 43.44
2022-01-26 14:18:18.488 | DEBUG    | __main__:trials:24 - Trial = 23101/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.490 | DEBUG    | __main__:trials:29 - Trial = 23101/30000 | Total reward = 34.60
2022-01-26 14:18:18.493 | DEBUG    | __main__:trials:24 - Trial = 23102/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.494 | DEBUG    | __main__:trials:29 - Trial = 23102/30000 | Total reward = 50.84
2022-01-26 14:18:18.497 | DEBUG    | __main__:trials:24 - Trial = 23103/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.498 | DEBUG    | __main__:trials:29 - Trial = 23103/30000 | Total reward = 49.63
2022-01-26 14:18:18.501 | DEBUG    | __main__:trials:24 - Trial = 23104/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.502 | DEBUG    | __main__:trials:29 - Trial = 23104/30000 | Total reward = 51.55
2022-01-26 14:18:18.505 | DEBUG    | __main__:trials:24 - Trial = 23105/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.506 | DEBUG    | __main__:trials:29 - Trial = 23105/30000 | Total reward = 32.94
2022-01-26 14:18:18.509 | DEBUG    | __main__:trials:24 - Trial = 23106/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.510 | DEBUG    | __main__:trials:29 - Trial = 23106/30000 | Total reward = 41.06
2022-01-26 14:18:18.513 | DEBUG    | __main__:trials:24 - Trial = 23107/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.514 | DEBUG    | __main__:trials:29 - Trial = 23107/30000 | Total reward = 49.94
2022-01-26 14:18:18.517 | DEBUG    | __main__:trials:24 - Trial = 23108/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.518 | DEBUG    | __main__:trials:29 - Trial = 23108/30000 | Total reward = 34.89
2022-01-26 14:18:18.522 | DEBUG    | __main__:trials:24 - Trial = 23109/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.523 | DEBUG    | __main__:trials:29 - Trial = 23109/30000 | Total reward = 57.53
2022-01-26 14:18:18.527 | DEBUG    | __main__:trials:24 - Trial = 23110/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.529 | DEBUG    | __main__:trials:29 - Trial = 23110/30000 | Total reward = 55.60
2022-01-26 14:18:18.532 | DEBUG    | __main__:trials:24 - Trial = 23111/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.533 | DEBUG    | __main__:trials:29 - Trial = 23111/30000 | Total reward = 62.72
2022-01-26 14:18:18.537 | DEBUG    | __main__:trials:26 - Trial = 23112/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.539 | DEBUG    | __main__:trials:29 - Trial = 23112/30000 | Total reward = 21.45
2022-01-26 14:18:18.542 | DEBUG    | __main__:trials:24 - Trial = 23113/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.543 | DEBUG    | __main__:trials:29 - Trial = 23113/30000 | Total reward = 51.36
2022-01-26 14:18:18.547 | DEBUG    | __main__:trials:24 - Trial = 23114/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.548 | DEBUG    | __main__:trials:29 - Trial = 23114/30000 | Total reward = 27.04
2022-01-26 14:18:18.552 | DEBUG    | __main__:trials:24 - Trial = 23115/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.554 | DEBUG    | __main__:trials:29 - Trial = 23115/30000 | Total reward = 54.90
2022-01-26 14:18:18.557 | DEBUG    | __main__:trials:24 - Trial = 23116/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.559 | DEBUG    | __main__:trials:29 - Trial = 23116/30000 | Total reward = 55.60
2022-01-26 14:18:18.562 | DEBUG    | __main__:trials:24 - Trial = 23117/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.564 | DEBUG    | __main__:trials:29 - Trial = 23117/30000 | Total reward = 49.17
2022-01-26 14:18:18.567 | DEBUG    | __main__:trials:24 - Trial = 23118/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.569 | DEBUG    | __main__:trials:29 - Trial = 23118/30000 | Total reward = 55.28
2022-01-26 14:18:18.573 | DEBUG    | __main__:trials:24 - Trial = 23119/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.573 | DEBUG    | __main__:trials:29 - Trial = 23119/30000 | Total reward = 35.39
2022-01-26 14:18:18.577 | DEBUG    | __main__:trials:24 - Trial = 23120/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.579 | DEBUG    | __main__:trials:29 - Trial = 23120/30000 | Total reward = 21.59
2022-01-26 14:18:18.582 | DEBUG    | __main__:trials:24 - Trial = 23121/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.584 | DEBUG    | __main__:trials:29 - Trial = 23121/30000 | Total reward = 37.38
2022-01-26 14:18:18.589 | DEBUG    | __main__:trials:24 - Trial = 23122/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.590 | DEBUG    | __main__:trials:29 - Trial = 23122/30000 | Total reward = 36.69
2022-01-26 14:18:18.594 | DEBUG    | __main__:trials:24 - Trial = 23123/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.595 | DEBUG    | __main__:trials:29 - Trial = 23123/30000 | Total reward = 54.23
2022-01-26 14:18:18.599 | DEBUG    | __main__:trials:24 - Trial = 23124/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.601 | DEBUG    | __main__:trials:29 - Trial = 23124/30000 | Total reward = 60.48
2022-01-26 14:18:18.604 | DEBUG    | __main__:trials:24 - Trial = 23125/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.606 | DEBUG    | __main__:trials:29 - Trial = 23125/30000 | Total reward = 51.48
2022-01-26 14:18:18.610 | DEBUG    | __main__:trials:24 - Trial = 23126/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.610 | DEBUG    | __main__:trials:29 - Trial = 23126/30000 | Total reward = 53.07
2022-01-26 14:18:18.614 | DEBUG    | __main__:trials:24 - Trial = 23127/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.616 | DEBUG    | __main__:trials:29 - Trial = 23127/30000 | Total reward = 41.62
2022-01-26 14:18:18.620 | DEBUG    | __main__:trials:24 - Trial = 23128/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.621 | DEBUG    | __main__:trials:29 - Trial = 23128/30000 | Total reward = 51.36
2022-01-26 14:18:18.624 | DEBUG    | __main__:trials:24 - Trial = 23129/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.626 | DEBUG    | __main__:trials:29 - Trial = 23129/30000 | Total reward = 50.61
2022-01-26 14:18:18.630 | DEBUG    | __main__:trials:24 - Trial = 23130/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.630 | DEBUG    | __main__:trials:29 - Trial = 23130/30000 | Total reward = 48.22
2022-01-26 14:18:18.635 | DEBUG    | __main__:trials:24 - Trial = 23131/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.637 | DEBUG    | __main__:trials:29 - Trial = 23131/30000 | Total reward = 50.55
2022-01-26 14:18:18.640 | DEBUG    | __main__:trials:24 - Trial = 23132/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.641 | DEBUG    | __main__:trials:29 - Trial = 23132/30000 | Total reward = 50.81
2022-01-26 14:18:18.646 | DEBUG    | __main__:trials:24 - Trial = 23133/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.647 | DEBUG    | __main__:trials:29 - Trial = 23133/30000 | Total reward = 31.82
2022-01-26 14:18:18.650 | DEBUG    | __main__:trials:24 - Trial = 23134/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.651 | DEBUG    | __main__:trials:29 - Trial = 23134/30000 | Total reward = 38.79
2022-01-26 14:18:18.654 | DEBUG    | __main__:trials:24 - Trial = 23135/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.656 | DEBUG    | __main__:trials:29 - Trial = 23135/30000 | Total reward = 49.94
2022-01-26 14:18:18.660 | DEBUG    | __main__:trials:24 - Trial = 23136/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.661 | DEBUG    | __main__:trials:29 - Trial = 23136/30000 | Total reward = 49.85
2022-01-26 14:18:18.664 | DEBUG    | __main__:trials:24 - Trial = 23137/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.666 | DEBUG    | __main__:trials:29 - Trial = 23137/30000 | Total reward = 47.57
2022-01-26 14:18:18.670 | DEBUG    | __main__:trials:24 - Trial = 23138/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.671 | DEBUG    | __main__:trials:29 - Trial = 23138/30000 | Total reward = 48.24
2022-01-26 14:18:18.675 | DEBUG    | __main__:trials:24 - Trial = 23139/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.676 | DEBUG    | __main__:trials:29 - Trial = 23139/30000 | Total reward = 45.27
2022-01-26 14:18:18.680 | DEBUG    | __main__:trials:24 - Trial = 23140/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.681 | DEBUG    | __main__:trials:29 - Trial = 23140/30000 | Total reward = 50.22
2022-01-26 14:18:18.686 | DEBUG    | __main__:trials:24 - Trial = 23141/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.687 | DEBUG    | __main__:trials:29 - Trial = 23141/30000 | Total reward = 59.42
2022-01-26 14:18:18.691 | DEBUG    | __main__:trials:24 - Trial = 23142/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.692 | DEBUG    | __main__:trials:29 - Trial = 23142/30000 | Total reward = 40.83
2022-01-26 14:18:18.696 | DEBUG    | __main__:trials:24 - Trial = 23143/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.698 | DEBUG    | __main__:trials:29 - Trial = 23143/30000 | Total reward = 41.44
2022-01-26 14:18:18.702 | DEBUG    | __main__:trials:24 - Trial = 23144/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.702 | DEBUG    | __main__:trials:29 - Trial = 23144/30000 | Total reward = 49.90
2022-01-26 14:18:18.706 | DEBUG    | __main__:trials:24 - Trial = 23145/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.708 | DEBUG    | __main__:trials:29 - Trial = 23145/30000 | Total reward = 51.19
2022-01-26 14:18:18.712 | DEBUG    | __main__:trials:24 - Trial = 23146/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.713 | DEBUG    | __main__:trials:29 - Trial = 23146/30000 | Total reward = 50.96
2022-01-26 14:18:18.717 | DEBUG    | __main__:trials:24 - Trial = 23147/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.718 | DEBUG    | __main__:trials:29 - Trial = 23147/30000 | Total reward = 45.51
2022-01-26 14:18:18.722 | DEBUG    | __main__:trials:24 - Trial = 23148/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.724 | DEBUG    | __main__:trials:29 - Trial = 23148/30000 | Total reward = 57.38
2022-01-26 14:18:18.727 | DEBUG    | __main__:trials:24 - Trial = 23149/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.729 | DEBUG    | __main__:trials:29 - Trial = 23149/30000 | Total reward = 54.68
2022-01-26 14:18:18.732 | DEBUG    | __main__:trials:24 - Trial = 23150/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.734 | DEBUG    | __main__:trials:29 - Trial = 23150/30000 | Total reward = 55.60
2022-01-26 14:18:18.738 | DEBUG    | __main__:trials:24 - Trial = 23151/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.739 | DEBUG    | __main__:trials:29 - Trial = 23151/30000 | Total reward = 54.87
2022-01-26 14:18:18.743 | DEBUG    | __main__:trials:24 - Trial = 23152/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.743 | DEBUG    | __main__:trials:29 - Trial = 23152/30000 | Total reward = 43.28
2022-01-26 14:18:18.747 | DEBUG    | __main__:trials:24 - Trial = 23153/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.749 | DEBUG    | __main__:trials:29 - Trial = 23153/30000 | Total reward = 41.76
2022-01-26 14:18:18.752 | DEBUG    | __main__:trials:24 - Trial = 23154/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.753 | DEBUG    | __main__:trials:29 - Trial = 23154/30000 | Total reward = 51.37
2022-01-26 14:18:18.757 | DEBUG    | __main__:trials:24 - Trial = 23155/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.758 | DEBUG    | __main__:trials:29 - Trial = 23155/30000 | Total reward = 32.67
2022-01-26 14:18:18.762 | DEBUG    | __main__:trials:24 - Trial = 23156/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.764 | DEBUG    | __main__:trials:29 - Trial = 23156/30000 | Total reward = 40.28
2022-01-26 14:18:18.767 | DEBUG    | __main__:trials:24 - Trial = 23157/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.768 | DEBUG    | __main__:trials:29 - Trial = 23157/30000 | Total reward = 53.22
2022-01-26 14:18:18.772 | DEBUG    | __main__:trials:24 - Trial = 23158/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.773 | DEBUG    | __main__:trials:29 - Trial = 23158/30000 | Total reward = 63.50
2022-01-26 14:18:18.777 | DEBUG    | __main__:trials:24 - Trial = 23159/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.778 | DEBUG    | __main__:trials:29 - Trial = 23159/30000 | Total reward = 38.77
2022-01-26 14:18:18.782 | DEBUG    | __main__:trials:24 - Trial = 23160/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.784 | DEBUG    | __main__:trials:29 - Trial = 23160/30000 | Total reward = 44.23
2022-01-26 14:18:18.787 | DEBUG    | __main__:trials:24 - Trial = 23161/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.788 | DEBUG    | __main__:trials:29 - Trial = 23161/30000 | Total reward = 53.12
2022-01-26 14:18:18.793 | DEBUG    | __main__:trials:24 - Trial = 23162/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.794 | DEBUG    | __main__:trials:29 - Trial = 23162/30000 | Total reward = 40.84
2022-01-26 14:18:18.797 | DEBUG    | __main__:trials:24 - Trial = 23163/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.798 | DEBUG    | __main__:trials:29 - Trial = 23163/30000 | Total reward = 48.71
2022-01-26 14:18:18.801 | DEBUG    | __main__:trials:24 - Trial = 23164/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.802 | DEBUG    | __main__:trials:29 - Trial = 23164/30000 | Total reward = 44.07
2022-01-26 14:18:18.805 | DEBUG    | __main__:trials:24 - Trial = 23165/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.807 | DEBUG    | __main__:trials:29 - Trial = 23165/30000 | Total reward = 29.36
2022-01-26 14:18:18.810 | DEBUG    | __main__:trials:24 - Trial = 23166/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.813 | DEBUG    | __main__:trials:29 - Trial = 23166/30000 | Total reward = 36.64
2022-01-26 14:18:18.816 | DEBUG    | __main__:trials:24 - Trial = 23167/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.816 | DEBUG    | __main__:trials:29 - Trial = 23167/30000 | Total reward = 54.77
2022-01-26 14:18:18.820 | DEBUG    | __main__:trials:24 - Trial = 23168/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.820 | DEBUG    | __main__:trials:29 - Trial = 23168/30000 | Total reward = 48.69
2022-01-26 14:18:18.824 | DEBUG    | __main__:trials:24 - Trial = 23169/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.825 | DEBUG    | __main__:trials:29 - Trial = 23169/30000 | Total reward = 44.21
2022-01-26 14:18:18.830 | DEBUG    | __main__:trials:24 - Trial = 23170/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.831 | DEBUG    | __main__:trials:29 - Trial = 23170/30000 | Total reward = 62.21
2022-01-26 14:18:18.836 | DEBUG    | __main__:trials:24 - Trial = 23171/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.837 | DEBUG    | __main__:trials:29 - Trial = 23171/30000 | Total reward = 41.94
2022-01-26 14:18:18.841 | DEBUG    | __main__:trials:24 - Trial = 23172/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.842 | DEBUG    | __main__:trials:29 - Trial = 23172/30000 | Total reward = 51.94
2022-01-26 14:18:18.845 | DEBUG    | __main__:trials:24 - Trial = 23173/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.847 | DEBUG    | __main__:trials:29 - Trial = 23173/30000 | Total reward = 40.55
2022-01-26 14:18:18.851 | DEBUG    | __main__:trials:24 - Trial = 23174/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.852 | DEBUG    | __main__:trials:29 - Trial = 23174/30000 | Total reward = 63.41
2022-01-26 14:18:18.856 | DEBUG    | __main__:trials:24 - Trial = 23175/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.858 | DEBUG    | __main__:trials:29 - Trial = 23175/30000 | Total reward = 33.45
2022-01-26 14:18:18.861 | DEBUG    | __main__:trials:24 - Trial = 23176/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.863 | DEBUG    | __main__:trials:29 - Trial = 23176/30000 | Total reward = 47.56
2022-01-26 14:18:18.867 | DEBUG    | __main__:trials:24 - Trial = 23177/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.867 | DEBUG    | __main__:trials:29 - Trial = 23177/30000 | Total reward = 39.42
2022-01-26 14:18:18.872 | DEBUG    | __main__:trials:24 - Trial = 23178/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.873 | DEBUG    | __main__:trials:29 - Trial = 23178/30000 | Total reward = 42.07
2022-01-26 14:18:18.877 | DEBUG    | __main__:trials:24 - Trial = 23179/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.878 | DEBUG    | __main__:trials:29 - Trial = 23179/30000 | Total reward = 55.02
2022-01-26 14:18:18.882 | DEBUG    | __main__:trials:24 - Trial = 23180/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.884 | DEBUG    | __main__:trials:29 - Trial = 23180/30000 | Total reward = 62.57
2022-01-26 14:18:18.888 | DEBUG    | __main__:trials:24 - Trial = 23181/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.888 | DEBUG    | __main__:trials:29 - Trial = 23181/30000 | Total reward = 55.60
2022-01-26 14:18:18.893 | DEBUG    | __main__:trials:24 - Trial = 23182/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.895 | DEBUG    | __main__:trials:29 - Trial = 23182/30000 | Total reward = 47.33
2022-01-26 14:18:18.899 | DEBUG    | __main__:trials:24 - Trial = 23183/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.900 | DEBUG    | __main__:trials:29 - Trial = 23183/30000 | Total reward = 44.63
2022-01-26 14:18:18.904 | DEBUG    | __main__:trials:24 - Trial = 23184/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.905 | DEBUG    | __main__:trials:29 - Trial = 23184/30000 | Total reward = 55.78
2022-01-26 14:18:18.908 | DEBUG    | __main__:trials:24 - Trial = 23185/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.909 | DEBUG    | __main__:trials:29 - Trial = 23185/30000 | Total reward = 44.45
2022-01-26 14:18:18.913 | DEBUG    | __main__:trials:24 - Trial = 23186/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.914 | DEBUG    | __main__:trials:29 - Trial = 23186/30000 | Total reward = 54.61
2022-01-26 14:18:18.917 | DEBUG    | __main__:trials:24 - Trial = 23187/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.918 | DEBUG    | __main__:trials:29 - Trial = 23187/30000 | Total reward = 35.46
2022-01-26 14:18:18.920 | DEBUG    | __main__:trials:26 - Trial = 23188/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.921 | DEBUG    | __main__:trials:29 - Trial = 23188/30000 | Total reward = 18.66
2022-01-26 14:18:18.926 | DEBUG    | __main__:trials:24 - Trial = 23189/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.927 | DEBUG    | __main__:trials:29 - Trial = 23189/30000 | Total reward = 49.07
2022-01-26 14:18:18.931 | DEBUG    | __main__:trials:24 - Trial = 23190/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.932 | DEBUG    | __main__:trials:29 - Trial = 23190/30000 | Total reward = 55.15
2022-01-26 14:18:18.936 | DEBUG    | __main__:trials:24 - Trial = 23191/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.936 | DEBUG    | __main__:trials:29 - Trial = 23191/30000 | Total reward = 45.28
2022-01-26 14:18:18.941 | DEBUG    | __main__:trials:24 - Trial = 23192/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.943 | DEBUG    | __main__:trials:29 - Trial = 23192/30000 | Total reward = 56.22
2022-01-26 14:18:18.946 | DEBUG    | __main__:trials:26 - Trial = 23193/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.947 | DEBUG    | __main__:trials:29 - Trial = 23193/30000 | Total reward = 27.50
2022-01-26 14:18:18.950 | DEBUG    | __main__:trials:24 - Trial = 23194/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.952 | DEBUG    | __main__:trials:29 - Trial = 23194/30000 | Total reward = 41.62
2022-01-26 14:18:18.955 | DEBUG    | __main__:trials:24 - Trial = 23195/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.956 | DEBUG    | __main__:trials:29 - Trial = 23195/30000 | Total reward = 47.99
2022-01-26 14:18:18.959 | DEBUG    | __main__:trials:24 - Trial = 23196/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.961 | DEBUG    | __main__:trials:29 - Trial = 23196/30000 | Total reward = 55.51
2022-01-26 14:18:18.964 | DEBUG    | __main__:trials:24 - Trial = 23197/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.966 | DEBUG    | __main__:trials:29 - Trial = 23197/30000 | Total reward = 36.15
2022-01-26 14:18:18.970 | DEBUG    | __main__:trials:26 - Trial = 23198/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:18.970 | DEBUG    | __main__:trials:29 - Trial = 23198/30000 | Total reward = 26.80
2022-01-26 14:18:18.975 | DEBUG    | __main__:trials:24 - Trial = 23199/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.976 | DEBUG    | __main__:trials:29 - Trial = 23199/30000 | Total reward = 37.81
2022-01-26 14:18:18.979 | DEBUG    | __main__:trials:24 - Trial = 23200/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.981 | DEBUG    | __main__:trials:29 - Trial = 23200/30000 | Total reward = 45.87
2022-01-26 14:18:18.985 | DEBUG    | __main__:trials:24 - Trial = 23201/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.986 | DEBUG    | __main__:trials:29 - Trial = 23201/30000 | Total reward = 39.75
2022-01-26 14:18:18.990 | DEBUG    | __main__:trials:24 - Trial = 23202/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.992 | DEBUG    | __main__:trials:29 - Trial = 23202/30000 | Total reward = 41.87
2022-01-26 14:18:18.995 | DEBUG    | __main__:trials:24 - Trial = 23203/30000 | Max number of steps (20) reached
2022-01-26 14:18:18.997 | DEBUG    | __main__:trials:29 - Trial = 23203/30000 | Total reward = 51.74
2022-01-26 14:18:19.001 | DEBUG    | __main__:trials:24 - Trial = 23204/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.002 | DEBUG    | __main__:trials:29 - Trial = 23204/30000 | Total reward = 45.89
2022-01-26 14:18:19.006 | DEBUG    | __main__:trials:24 - Trial = 23205/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.007 | DEBUG    | __main__:trials:29 - Trial = 23205/30000 | Total reward = 43.18
2022-01-26 14:18:19.011 | DEBUG    | __main__:trials:24 - Trial = 23206/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.012 | DEBUG    | __main__:trials:29 - Trial = 23206/30000 | Total reward = 32.49
2022-01-26 14:18:19.016 | DEBUG    | __main__:trials:24 - Trial = 23207/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.017 | DEBUG    | __main__:trials:29 - Trial = 23207/30000 | Total reward = 58.69
2022-01-26 14:18:19.021 | DEBUG    | __main__:trials:24 - Trial = 23208/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.022 | DEBUG    | __main__:trials:29 - Trial = 23208/30000 | Total reward = 38.03
2022-01-26 14:18:19.026 | DEBUG    | __main__:trials:24 - Trial = 23209/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.027 | DEBUG    | __main__:trials:29 - Trial = 23209/30000 | Total reward = 58.94
2022-01-26 14:18:19.031 | DEBUG    | __main__:trials:24 - Trial = 23210/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.032 | DEBUG    | __main__:trials:29 - Trial = 23210/30000 | Total reward = 46.50
2022-01-26 14:18:19.036 | DEBUG    | __main__:trials:24 - Trial = 23211/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.037 | DEBUG    | __main__:trials:29 - Trial = 23211/30000 | Total reward = 45.56
2022-01-26 14:18:19.042 | DEBUG    | __main__:trials:24 - Trial = 23212/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.043 | DEBUG    | __main__:trials:29 - Trial = 23212/30000 | Total reward = 36.47
2022-01-26 14:18:19.047 | DEBUG    | __main__:trials:24 - Trial = 23213/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.048 | DEBUG    | __main__:trials:29 - Trial = 23213/30000 | Total reward = 40.76
2022-01-26 14:18:19.052 | DEBUG    | __main__:trials:24 - Trial = 23214/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.053 | DEBUG    | __main__:trials:29 - Trial = 23214/30000 | Total reward = 45.72
2022-01-26 14:18:19.057 | DEBUG    | __main__:trials:24 - Trial = 23215/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.058 | DEBUG    | __main__:trials:29 - Trial = 23215/30000 | Total reward = 38.15
2022-01-26 14:18:19.062 | DEBUG    | __main__:trials:24 - Trial = 23216/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.064 | DEBUG    | __main__:trials:29 - Trial = 23216/30000 | Total reward = 46.55
2022-01-26 14:18:19.067 | DEBUG    | __main__:trials:24 - Trial = 23217/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.068 | DEBUG    | __main__:trials:29 - Trial = 23217/30000 | Total reward = 50.84
2022-01-26 14:18:19.072 | DEBUG    | __main__:trials:24 - Trial = 23218/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.073 | DEBUG    | __main__:trials:29 - Trial = 23218/30000 | Total reward = 50.93
2022-01-26 14:18:19.076 | DEBUG    | __main__:trials:24 - Trial = 23219/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.078 | DEBUG    | __main__:trials:29 - Trial = 23219/30000 | Total reward = 36.14
2022-01-26 14:18:19.081 | DEBUG    | __main__:trials:24 - Trial = 23220/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.083 | DEBUG    | __main__:trials:29 - Trial = 23220/30000 | Total reward = 53.09
2022-01-26 14:18:19.086 | DEBUG    | __main__:trials:24 - Trial = 23221/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.088 | DEBUG    | __main__:trials:29 - Trial = 23221/30000 | Total reward = 40.35
2022-01-26 14:18:19.091 | DEBUG    | __main__:trials:24 - Trial = 23222/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.093 | DEBUG    | __main__:trials:29 - Trial = 23222/30000 | Total reward = 52.96
2022-01-26 14:18:19.096 | DEBUG    | __main__:trials:24 - Trial = 23223/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.098 | DEBUG    | __main__:trials:29 - Trial = 23223/30000 | Total reward = 49.23
2022-01-26 14:18:19.102 | DEBUG    | __main__:trials:24 - Trial = 23224/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.102 | DEBUG    | __main__:trials:29 - Trial = 23224/30000 | Total reward = 32.61
2022-01-26 14:18:19.106 | DEBUG    | __main__:trials:24 - Trial = 23225/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.108 | DEBUG    | __main__:trials:29 - Trial = 23225/30000 | Total reward = 41.58
2022-01-26 14:18:19.110 | DEBUG    | __main__:trials:26 - Trial = 23226/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.112 | DEBUG    | __main__:trials:29 - Trial = 23226/30000 | Total reward = 15.08
2022-01-26 14:18:19.114 | DEBUG    | __main__:trials:24 - Trial = 23227/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.116 | DEBUG    | __main__:trials:29 - Trial = 23227/30000 | Total reward = 42.83
2022-01-26 14:18:19.120 | DEBUG    | __main__:trials:24 - Trial = 23228/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.121 | DEBUG    | __main__:trials:29 - Trial = 23228/30000 | Total reward = 50.84
2022-01-26 14:18:19.125 | DEBUG    | __main__:trials:24 - Trial = 23229/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.127 | DEBUG    | __main__:trials:29 - Trial = 23229/30000 | Total reward = 30.76
2022-01-26 14:18:19.130 | DEBUG    | __main__:trials:24 - Trial = 23230/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.131 | DEBUG    | __main__:trials:29 - Trial = 23230/30000 | Total reward = 50.84
2022-01-26 14:18:19.134 | DEBUG    | __main__:trials:24 - Trial = 23231/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.136 | DEBUG    | __main__:trials:29 - Trial = 23231/30000 | Total reward = 58.84
2022-01-26 14:18:19.140 | DEBUG    | __main__:trials:24 - Trial = 23232/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.141 | DEBUG    | __main__:trials:29 - Trial = 23232/30000 | Total reward = 42.36
2022-01-26 14:18:19.145 | DEBUG    | __main__:trials:24 - Trial = 23233/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.146 | DEBUG    | __main__:trials:29 - Trial = 23233/30000 | Total reward = 49.88
2022-01-26 14:18:19.149 | DEBUG    | __main__:trials:24 - Trial = 23234/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.150 | DEBUG    | __main__:trials:29 - Trial = 23234/30000 | Total reward = 46.19
2022-01-26 14:18:19.154 | DEBUG    | __main__:trials:24 - Trial = 23235/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.156 | DEBUG    | __main__:trials:29 - Trial = 23235/30000 | Total reward = 50.14
2022-01-26 14:18:19.160 | DEBUG    | __main__:trials:24 - Trial = 23236/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.161 | DEBUG    | __main__:trials:29 - Trial = 23236/30000 | Total reward = 45.16
2022-01-26 14:18:19.165 | DEBUG    | __main__:trials:24 - Trial = 23237/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.167 | DEBUG    | __main__:trials:29 - Trial = 23237/30000 | Total reward = 45.05
2022-01-26 14:18:19.170 | DEBUG    | __main__:trials:24 - Trial = 23238/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.171 | DEBUG    | __main__:trials:29 - Trial = 23238/30000 | Total reward = 44.72
2022-01-26 14:18:19.174 | DEBUG    | __main__:trials:24 - Trial = 23239/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.175 | DEBUG    | __main__:trials:29 - Trial = 23239/30000 | Total reward = 53.14
2022-01-26 14:18:19.179 | DEBUG    | __main__:trials:24 - Trial = 23240/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.180 | DEBUG    | __main__:trials:29 - Trial = 23240/30000 | Total reward = 51.69
2022-01-26 14:18:19.184 | DEBUG    | __main__:trials:24 - Trial = 23241/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.185 | DEBUG    | __main__:trials:29 - Trial = 23241/30000 | Total reward = 53.80
2022-01-26 14:18:19.189 | DEBUG    | __main__:trials:24 - Trial = 23242/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.191 | DEBUG    | __main__:trials:29 - Trial = 23242/30000 | Total reward = 34.97
2022-01-26 14:18:19.194 | DEBUG    | __main__:trials:24 - Trial = 23243/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.196 | DEBUG    | __main__:trials:29 - Trial = 23243/30000 | Total reward = 42.28
2022-01-26 14:18:19.200 | DEBUG    | __main__:trials:24 - Trial = 23244/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.201 | DEBUG    | __main__:trials:29 - Trial = 23244/30000 | Total reward = 35.52
2022-01-26 14:18:19.204 | DEBUG    | __main__:trials:24 - Trial = 23245/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.206 | DEBUG    | __main__:trials:29 - Trial = 23245/30000 | Total reward = 38.18
2022-01-26 14:18:19.210 | DEBUG    | __main__:trials:24 - Trial = 23246/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.211 | DEBUG    | __main__:trials:29 - Trial = 23246/30000 | Total reward = 37.01
2022-01-26 14:18:19.215 | DEBUG    | __main__:trials:24 - Trial = 23247/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.215 | DEBUG    | __main__:trials:29 - Trial = 23247/30000 | Total reward = 44.20
2022-01-26 14:18:19.220 | DEBUG    | __main__:trials:24 - Trial = 23248/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.220 | DEBUG    | __main__:trials:29 - Trial = 23248/30000 | Total reward = 36.11
2022-01-26 14:18:19.225 | DEBUG    | __main__:trials:24 - Trial = 23249/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.226 | DEBUG    | __main__:trials:29 - Trial = 23249/30000 | Total reward = 40.38
2022-01-26 14:18:19.229 | DEBUG    | __main__:trials:24 - Trial = 23250/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.231 | DEBUG    | __main__:trials:29 - Trial = 23250/30000 | Total reward = 39.76
2022-01-26 14:18:19.234 | DEBUG    | __main__:trials:24 - Trial = 23251/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.236 | DEBUG    | __main__:trials:29 - Trial = 23251/30000 | Total reward = 42.78
2022-01-26 14:18:19.239 | DEBUG    | __main__:trials:24 - Trial = 23252/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.241 | DEBUG    | __main__:trials:29 - Trial = 23252/30000 | Total reward = 44.46
2022-01-26 14:18:19.244 | DEBUG    | __main__:trials:24 - Trial = 23253/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.245 | DEBUG    | __main__:trials:29 - Trial = 23253/30000 | Total reward = 48.89
2022-01-26 14:18:19.249 | DEBUG    | __main__:trials:24 - Trial = 23254/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.251 | DEBUG    | __main__:trials:29 - Trial = 23254/30000 | Total reward = 47.58
2022-01-26 14:18:19.254 | DEBUG    | __main__:trials:24 - Trial = 23255/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.256 | DEBUG    | __main__:trials:29 - Trial = 23255/30000 | Total reward = 42.72
2022-01-26 14:18:19.259 | DEBUG    | __main__:trials:24 - Trial = 23256/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.261 | DEBUG    | __main__:trials:29 - Trial = 23256/30000 | Total reward = 43.59
2022-01-26 14:18:19.264 | DEBUG    | __main__:trials:24 - Trial = 23257/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.265 | DEBUG    | __main__:trials:29 - Trial = 23257/30000 | Total reward = 42.55
2022-01-26 14:18:19.268 | DEBUG    | __main__:trials:24 - Trial = 23258/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.271 | DEBUG    | __main__:trials:29 - Trial = 23258/30000 | Total reward = 38.73
2022-01-26 14:18:19.275 | DEBUG    | __main__:trials:24 - Trial = 23259/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.275 | DEBUG    | __main__:trials:29 - Trial = 23259/30000 | Total reward = 32.49
2022-01-26 14:18:19.278 | DEBUG    | __main__:trials:26 - Trial = 23260/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.281 | DEBUG    | __main__:trials:29 - Trial = 23260/30000 | Total reward = 25.86
2022-01-26 14:18:19.284 | DEBUG    | __main__:trials:26 - Trial = 23261/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.285 | DEBUG    | __main__:trials:29 - Trial = 23261/30000 | Total reward = 18.00
2022-01-26 14:18:19.289 | DEBUG    | __main__:trials:24 - Trial = 23262/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.291 | DEBUG    | __main__:trials:29 - Trial = 23262/30000 | Total reward = 29.65
2022-01-26 14:18:19.294 | DEBUG    | __main__:trials:26 - Trial = 23263/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.296 | DEBUG    | __main__:trials:29 - Trial = 23263/30000 | Total reward = 18.83
2022-01-26 14:18:19.299 | DEBUG    | __main__:trials:24 - Trial = 23264/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.301 | DEBUG    | __main__:trials:29 - Trial = 23264/30000 | Total reward = 20.18
2022-01-26 14:18:19.304 | DEBUG    | __main__:trials:24 - Trial = 23265/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.306 | DEBUG    | __main__:trials:29 - Trial = 23265/30000 | Total reward = 32.48
2022-01-26 14:18:19.310 | DEBUG    | __main__:trials:24 - Trial = 23266/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.311 | DEBUG    | __main__:trials:29 - Trial = 23266/30000 | Total reward = 31.23
2022-01-26 14:18:19.314 | DEBUG    | __main__:trials:24 - Trial = 23267/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.316 | DEBUG    | __main__:trials:29 - Trial = 23267/30000 | Total reward = 21.12
2022-01-26 14:18:19.319 | DEBUG    | __main__:trials:26 - Trial = 23268/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.321 | DEBUG    | __main__:trials:29 - Trial = 23268/30000 | Total reward = 22.75
2022-01-26 14:18:19.324 | DEBUG    | __main__:trials:24 - Trial = 23269/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.326 | DEBUG    | __main__:trials:29 - Trial = 23269/30000 | Total reward = 36.30
2022-01-26 14:18:19.330 | DEBUG    | __main__:trials:24 - Trial = 23270/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.330 | DEBUG    | __main__:trials:29 - Trial = 23270/30000 | Total reward = 31.76
2022-01-26 14:18:19.335 | DEBUG    | __main__:trials:24 - Trial = 23271/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.336 | DEBUG    | __main__:trials:29 - Trial = 23271/30000 | Total reward = 31.06
2022-01-26 14:18:19.340 | DEBUG    | __main__:trials:24 - Trial = 23272/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.341 | DEBUG    | __main__:trials:29 - Trial = 23272/30000 | Total reward = 38.32
2022-01-26 14:18:19.344 | DEBUG    | __main__:trials:26 - Trial = 23273/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.346 | DEBUG    | __main__:trials:29 - Trial = 23273/30000 | Total reward = 21.98
2022-01-26 14:18:19.349 | DEBUG    | __main__:trials:24 - Trial = 23274/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.351 | DEBUG    | __main__:trials:29 - Trial = 23274/30000 | Total reward = 50.05
2022-01-26 14:18:19.355 | DEBUG    | __main__:trials:24 - Trial = 23275/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.356 | DEBUG    | __main__:trials:29 - Trial = 23275/30000 | Total reward = 38.03
2022-01-26 14:18:19.360 | DEBUG    | __main__:trials:24 - Trial = 23276/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.361 | DEBUG    | __main__:trials:29 - Trial = 23276/30000 | Total reward = 36.11
2022-01-26 14:18:19.365 | DEBUG    | __main__:trials:24 - Trial = 23277/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.366 | DEBUG    | __main__:trials:29 - Trial = 23277/30000 | Total reward = 36.56
2022-01-26 14:18:19.370 | DEBUG    | __main__:trials:24 - Trial = 23278/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.371 | DEBUG    | __main__:trials:29 - Trial = 23278/30000 | Total reward = 42.66
2022-01-26 14:18:19.375 | DEBUG    | __main__:trials:24 - Trial = 23279/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.376 | DEBUG    | __main__:trials:29 - Trial = 23279/30000 | Total reward = 39.88
2022-01-26 14:18:19.380 | DEBUG    | __main__:trials:24 - Trial = 23280/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.382 | DEBUG    | __main__:trials:29 - Trial = 23280/30000 | Total reward = 32.17
2022-01-26 14:18:19.385 | DEBUG    | __main__:trials:24 - Trial = 23281/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.387 | DEBUG    | __main__:trials:29 - Trial = 23281/30000 | Total reward = 40.84
2022-01-26 14:18:19.390 | DEBUG    | __main__:trials:24 - Trial = 23282/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.393 | DEBUG    | __main__:trials:29 - Trial = 23282/30000 | Total reward = 41.64
2022-01-26 14:18:19.397 | DEBUG    | __main__:trials:24 - Trial = 23283/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.397 | DEBUG    | __main__:trials:29 - Trial = 23283/30000 | Total reward = 31.16
2022-01-26 14:18:19.401 | DEBUG    | __main__:trials:24 - Trial = 23284/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.402 | DEBUG    | __main__:trials:29 - Trial = 23284/30000 | Total reward = 32.40
2022-01-26 14:18:19.406 | DEBUG    | __main__:trials:24 - Trial = 23285/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.408 | DEBUG    | __main__:trials:29 - Trial = 23285/30000 | Total reward = 46.40
2022-01-26 14:18:19.411 | DEBUG    | __main__:trials:24 - Trial = 23286/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.412 | DEBUG    | __main__:trials:29 - Trial = 23286/30000 | Total reward = 40.45
2022-01-26 14:18:19.416 | DEBUG    | __main__:trials:24 - Trial = 23287/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.418 | DEBUG    | __main__:trials:29 - Trial = 23287/30000 | Total reward = 49.33
2022-01-26 14:18:19.421 | DEBUG    | __main__:trials:24 - Trial = 23288/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.423 | DEBUG    | __main__:trials:29 - Trial = 23288/30000 | Total reward = 44.14
2022-01-26 14:18:19.426 | DEBUG    | __main__:trials:26 - Trial = 23289/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.427 | DEBUG    | __main__:trials:29 - Trial = 23289/30000 | Total reward = 19.16
2022-01-26 14:18:19.431 | DEBUG    | __main__:trials:24 - Trial = 23290/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.433 | DEBUG    | __main__:trials:29 - Trial = 23290/30000 | Total reward = 38.67
2022-01-26 14:18:19.436 | DEBUG    | __main__:trials:24 - Trial = 23291/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.438 | DEBUG    | __main__:trials:29 - Trial = 23291/30000 | Total reward = 39.45
2022-01-26 14:18:19.441 | DEBUG    | __main__:trials:24 - Trial = 23292/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.443 | DEBUG    | __main__:trials:29 - Trial = 23292/30000 | Total reward = 37.07
2022-01-26 14:18:19.447 | DEBUG    | __main__:trials:24 - Trial = 23293/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.448 | DEBUG    | __main__:trials:29 - Trial = 23293/30000 | Total reward = 50.75
2022-01-26 14:18:19.452 | DEBUG    | __main__:trials:24 - Trial = 23294/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.454 | DEBUG    | __main__:trials:29 - Trial = 23294/30000 | Total reward = 39.39
2022-01-26 14:18:19.457 | DEBUG    | __main__:trials:24 - Trial = 23295/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.459 | DEBUG    | __main__:trials:29 - Trial = 23295/30000 | Total reward = 50.28
2022-01-26 14:18:19.463 | DEBUG    | __main__:trials:26 - Trial = 23296/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.464 | DEBUG    | __main__:trials:29 - Trial = 23296/30000 | Total reward = 26.95
2022-01-26 14:18:19.468 | DEBUG    | __main__:trials:24 - Trial = 23297/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.470 | DEBUG    | __main__:trials:29 - Trial = 23297/30000 | Total reward = 37.71
2022-01-26 14:18:19.473 | DEBUG    | __main__:trials:24 - Trial = 23298/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.475 | DEBUG    | __main__:trials:29 - Trial = 23298/30000 | Total reward = 31.56
2022-01-26 14:18:19.478 | DEBUG    | __main__:trials:26 - Trial = 23299/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.480 | DEBUG    | __main__:trials:29 - Trial = 23299/30000 | Total reward = 31.11
2022-01-26 14:18:19.484 | DEBUG    | __main__:trials:24 - Trial = 23300/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.485 | DEBUG    | __main__:trials:29 - Trial = 23300/30000 | Total reward = 46.88
2022-01-26 14:18:19.489 | DEBUG    | __main__:trials:24 - Trial = 23301/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.491 | DEBUG    | __main__:trials:29 - Trial = 23301/30000 | Total reward = 38.66
2022-01-26 14:18:19.494 | DEBUG    | __main__:trials:24 - Trial = 23302/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.495 | DEBUG    | __main__:trials:29 - Trial = 23302/30000 | Total reward = 38.71
2022-01-26 14:18:19.499 | DEBUG    | __main__:trials:24 - Trial = 23303/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.501 | DEBUG    | __main__:trials:29 - Trial = 23303/30000 | Total reward = 39.83
2022-01-26 14:18:19.503 | DEBUG    | __main__:trials:26 - Trial = 23304/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.505 | DEBUG    | __main__:trials:29 - Trial = 23304/30000 | Total reward = 11.25
2022-01-26 14:18:19.508 | DEBUG    | __main__:trials:24 - Trial = 23305/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.510 | DEBUG    | __main__:trials:29 - Trial = 23305/30000 | Total reward = 28.43
2022-01-26 14:18:19.514 | DEBUG    | __main__:trials:24 - Trial = 23306/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.515 | DEBUG    | __main__:trials:29 - Trial = 23306/30000 | Total reward = 43.34
2022-01-26 14:18:19.519 | DEBUG    | __main__:trials:24 - Trial = 23307/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.521 | DEBUG    | __main__:trials:29 - Trial = 23307/30000 | Total reward = 41.22
2022-01-26 14:18:19.524 | DEBUG    | __main__:trials:24 - Trial = 23308/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.525 | DEBUG    | __main__:trials:29 - Trial = 23308/30000 | Total reward = 41.16
2022-01-26 14:18:19.529 | DEBUG    | __main__:trials:24 - Trial = 23309/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.530 | DEBUG    | __main__:trials:29 - Trial = 23309/30000 | Total reward = 38.45
2022-01-26 14:18:19.534 | DEBUG    | __main__:trials:26 - Trial = 23310/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.535 | DEBUG    | __main__:trials:29 - Trial = 23310/30000 | Total reward = 19.57
2022-01-26 14:18:19.538 | DEBUG    | __main__:trials:24 - Trial = 23311/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.540 | DEBUG    | __main__:trials:29 - Trial = 23311/30000 | Total reward = 47.91
2022-01-26 14:18:19.544 | DEBUG    | __main__:trials:24 - Trial = 23312/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.545 | DEBUG    | __main__:trials:29 - Trial = 23312/30000 | Total reward = 47.04
2022-01-26 14:18:19.549 | DEBUG    | __main__:trials:24 - Trial = 23313/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.550 | DEBUG    | __main__:trials:29 - Trial = 23313/30000 | Total reward = 41.39
2022-01-26 14:18:19.554 | DEBUG    | __main__:trials:24 - Trial = 23314/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.555 | DEBUG    | __main__:trials:29 - Trial = 23314/30000 | Total reward = 34.24
2022-01-26 14:18:19.559 | DEBUG    | __main__:trials:26 - Trial = 23315/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.560 | DEBUG    | __main__:trials:29 - Trial = 23315/30000 | Total reward = 21.17
2022-01-26 14:18:19.564 | DEBUG    | __main__:trials:24 - Trial = 23316/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.566 | DEBUG    | __main__:trials:29 - Trial = 23316/30000 | Total reward = 33.25
2022-01-26 14:18:19.569 | DEBUG    | __main__:trials:26 - Trial = 23317/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.569 | DEBUG    | __main__:trials:29 - Trial = 23317/30000 | Total reward = 18.13
2022-01-26 14:18:19.574 | DEBUG    | __main__:trials:24 - Trial = 23318/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.575 | DEBUG    | __main__:trials:29 - Trial = 23318/30000 | Total reward = 37.89
2022-01-26 14:18:19.579 | DEBUG    | __main__:trials:24 - Trial = 23319/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.581 | DEBUG    | __main__:trials:29 - Trial = 23319/30000 | Total reward = 46.07
2022-01-26 14:18:19.585 | DEBUG    | __main__:trials:24 - Trial = 23320/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.586 | DEBUG    | __main__:trials:29 - Trial = 23320/30000 | Total reward = 63.18
2022-01-26 14:18:19.589 | DEBUG    | __main__:trials:24 - Trial = 23321/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.590 | DEBUG    | __main__:trials:29 - Trial = 23321/30000 | Total reward = 48.10
2022-01-26 14:18:19.595 | DEBUG    | __main__:trials:24 - Trial = 23322/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.597 | DEBUG    | __main__:trials:29 - Trial = 23322/30000 | Total reward = 51.93
2022-01-26 14:18:19.600 | DEBUG    | __main__:trials:24 - Trial = 23323/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.601 | DEBUG    | __main__:trials:29 - Trial = 23323/30000 | Total reward = 41.20
2022-01-26 14:18:19.605 | DEBUG    | __main__:trials:24 - Trial = 23324/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.606 | DEBUG    | __main__:trials:29 - Trial = 23324/30000 | Total reward = 37.60
2022-01-26 14:18:19.609 | DEBUG    | __main__:trials:24 - Trial = 23325/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.611 | DEBUG    | __main__:trials:29 - Trial = 23325/30000 | Total reward = 43.32
2022-01-26 14:18:19.615 | DEBUG    | __main__:trials:24 - Trial = 23326/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.617 | DEBUG    | __main__:trials:29 - Trial = 23326/30000 | Total reward = 39.55
2022-01-26 14:18:19.620 | DEBUG    | __main__:trials:24 - Trial = 23327/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.622 | DEBUG    | __main__:trials:29 - Trial = 23327/30000 | Total reward = 40.95
2022-01-26 14:18:19.626 | DEBUG    | __main__:trials:24 - Trial = 23328/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.627 | DEBUG    | __main__:trials:29 - Trial = 23328/30000 | Total reward = 37.89
2022-01-26 14:18:19.631 | DEBUG    | __main__:trials:24 - Trial = 23329/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.632 | DEBUG    | __main__:trials:29 - Trial = 23329/30000 | Total reward = 45.64
2022-01-26 14:18:19.636 | DEBUG    | __main__:trials:24 - Trial = 23330/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.637 | DEBUG    | __main__:trials:29 - Trial = 23330/30000 | Total reward = 29.98
2022-01-26 14:18:19.641 | DEBUG    | __main__:trials:24 - Trial = 23331/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.642 | DEBUG    | __main__:trials:29 - Trial = 23331/30000 | Total reward = 55.20
2022-01-26 14:18:19.645 | DEBUG    | __main__:trials:24 - Trial = 23332/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.646 | DEBUG    | __main__:trials:29 - Trial = 23332/30000 | Total reward = 36.15
2022-01-26 14:18:19.649 | DEBUG    | __main__:trials:24 - Trial = 23333/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.651 | DEBUG    | __main__:trials:29 - Trial = 23333/30000 | Total reward = 39.10
2022-01-26 14:18:19.654 | DEBUG    | __main__:trials:26 - Trial = 23334/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.656 | DEBUG    | __main__:trials:29 - Trial = 23334/30000 | Total reward = 27.71
2022-01-26 14:18:19.659 | DEBUG    | __main__:trials:24 - Trial = 23335/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.661 | DEBUG    | __main__:trials:29 - Trial = 23335/30000 | Total reward = 39.37
2022-01-26 14:18:19.663 | DEBUG    | __main__:trials:26 - Trial = 23336/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.665 | DEBUG    | __main__:trials:29 - Trial = 23336/30000 | Total reward = 20.94
2022-01-26 14:18:19.668 | DEBUG    | __main__:trials:24 - Trial = 23337/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.670 | DEBUG    | __main__:trials:29 - Trial = 23337/30000 | Total reward = 47.59
2022-01-26 14:18:19.674 | DEBUG    | __main__:trials:24 - Trial = 23338/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.674 | DEBUG    | __main__:trials:29 - Trial = 23338/30000 | Total reward = 37.37
2022-01-26 14:18:19.678 | DEBUG    | __main__:trials:24 - Trial = 23339/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.680 | DEBUG    | __main__:trials:29 - Trial = 23339/30000 | Total reward = 47.67
2022-01-26 14:18:19.684 | DEBUG    | __main__:trials:24 - Trial = 23340/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.685 | DEBUG    | __main__:trials:29 - Trial = 23340/30000 | Total reward = 48.59
2022-01-26 14:18:19.689 | DEBUG    | __main__:trials:24 - Trial = 23341/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.691 | DEBUG    | __main__:trials:29 - Trial = 23341/30000 | Total reward = 39.36
2022-01-26 14:18:19.694 | DEBUG    | __main__:trials:24 - Trial = 23342/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.696 | DEBUG    | __main__:trials:29 - Trial = 23342/30000 | Total reward = 38.11
2022-01-26 14:18:19.700 | DEBUG    | __main__:trials:24 - Trial = 23343/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.701 | DEBUG    | __main__:trials:29 - Trial = 23343/30000 | Total reward = 36.32
2022-01-26 14:18:19.705 | DEBUG    | __main__:trials:24 - Trial = 23344/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.707 | DEBUG    | __main__:trials:29 - Trial = 23344/30000 | Total reward = 44.32
2022-01-26 14:18:19.710 | DEBUG    | __main__:trials:24 - Trial = 23345/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.712 | DEBUG    | __main__:trials:29 - Trial = 23345/30000 | Total reward = 50.01
2022-01-26 14:18:19.716 | DEBUG    | __main__:trials:24 - Trial = 23346/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.716 | DEBUG    | __main__:trials:29 - Trial = 23346/30000 | Total reward = 39.57
2022-01-26 14:18:19.720 | DEBUG    | __main__:trials:24 - Trial = 23347/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.722 | DEBUG    | __main__:trials:29 - Trial = 23347/30000 | Total reward = 37.13
2022-01-26 14:18:19.725 | DEBUG    | __main__:trials:24 - Trial = 23348/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.726 | DEBUG    | __main__:trials:29 - Trial = 23348/30000 | Total reward = 37.93
2022-01-26 14:18:19.729 | DEBUG    | __main__:trials:24 - Trial = 23349/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.731 | DEBUG    | __main__:trials:29 - Trial = 23349/30000 | Total reward = 37.23
2022-01-26 14:18:19.734 | DEBUG    | __main__:trials:24 - Trial = 23350/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.736 | DEBUG    | __main__:trials:29 - Trial = 23350/30000 | Total reward = 32.67
2022-01-26 14:18:19.740 | DEBUG    | __main__:trials:24 - Trial = 23351/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.742 | DEBUG    | __main__:trials:29 - Trial = 23351/30000 | Total reward = 39.32
2022-01-26 14:18:19.745 | DEBUG    | __main__:trials:24 - Trial = 23352/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.747 | DEBUG    | __main__:trials:29 - Trial = 23352/30000 | Total reward = 38.77
2022-01-26 14:18:19.750 | DEBUG    | __main__:trials:24 - Trial = 23353/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.752 | DEBUG    | __main__:trials:29 - Trial = 23353/30000 | Total reward = 50.52
2022-01-26 14:18:19.755 | DEBUG    | __main__:trials:26 - Trial = 23354/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.757 | DEBUG    | __main__:trials:29 - Trial = 23354/30000 | Total reward = 31.72
2022-01-26 14:18:19.761 | DEBUG    | __main__:trials:24 - Trial = 23355/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.762 | DEBUG    | __main__:trials:29 - Trial = 23355/30000 | Total reward = 32.54
2022-01-26 14:18:19.765 | DEBUG    | __main__:trials:24 - Trial = 23356/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.767 | DEBUG    | __main__:trials:29 - Trial = 23356/30000 | Total reward = 36.20
2022-01-26 14:18:19.771 | DEBUG    | __main__:trials:24 - Trial = 23357/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.772 | DEBUG    | __main__:trials:29 - Trial = 23357/30000 | Total reward = 38.75
2022-01-26 14:18:19.776 | DEBUG    | __main__:trials:24 - Trial = 23358/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.777 | DEBUG    | __main__:trials:29 - Trial = 23358/30000 | Total reward = 38.98
2022-01-26 14:18:19.781 | DEBUG    | __main__:trials:24 - Trial = 23359/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.782 | DEBUG    | __main__:trials:29 - Trial = 23359/30000 | Total reward = 46.18
2022-01-26 14:18:19.785 | DEBUG    | __main__:trials:24 - Trial = 23360/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.786 | DEBUG    | __main__:trials:29 - Trial = 23360/30000 | Total reward = 37.05
2022-01-26 14:18:19.789 | DEBUG    | __main__:trials:24 - Trial = 23361/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.791 | DEBUG    | __main__:trials:29 - Trial = 23361/30000 | Total reward = 33.91
2022-01-26 14:18:19.794 | DEBUG    | __main__:trials:24 - Trial = 23362/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.795 | DEBUG    | __main__:trials:29 - Trial = 23362/30000 | Total reward = 42.55
2022-01-26 14:18:19.799 | DEBUG    | __main__:trials:24 - Trial = 23363/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.802 | DEBUG    | __main__:trials:29 - Trial = 23363/30000 | Total reward = 32.82
2022-01-26 14:18:19.806 | DEBUG    | __main__:trials:24 - Trial = 23364/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.808 | DEBUG    | __main__:trials:29 - Trial = 23364/30000 | Total reward = 38.84
2022-01-26 14:18:19.811 | DEBUG    | __main__:trials:24 - Trial = 23365/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.813 | DEBUG    | __main__:trials:29 - Trial = 23365/30000 | Total reward = 31.69
2022-01-26 14:18:19.817 | DEBUG    | __main__:trials:24 - Trial = 23366/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.818 | DEBUG    | __main__:trials:29 - Trial = 23366/30000 | Total reward = 38.44
2022-01-26 14:18:19.822 | DEBUG    | __main__:trials:24 - Trial = 23367/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.823 | DEBUG    | __main__:trials:29 - Trial = 23367/30000 | Total reward = 39.45
2022-01-26 14:18:19.826 | DEBUG    | __main__:trials:24 - Trial = 23368/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.828 | DEBUG    | __main__:trials:29 - Trial = 23368/30000 | Total reward = 45.54
2022-01-26 14:18:19.831 | DEBUG    | __main__:trials:24 - Trial = 23369/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.833 | DEBUG    | __main__:trials:29 - Trial = 23369/30000 | Total reward = 52.70
2022-01-26 14:18:19.836 | DEBUG    | __main__:trials:24 - Trial = 23370/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.838 | DEBUG    | __main__:trials:29 - Trial = 23370/30000 | Total reward = 33.39
2022-01-26 14:18:19.842 | DEBUG    | __main__:trials:24 - Trial = 23371/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.843 | DEBUG    | __main__:trials:29 - Trial = 23371/30000 | Total reward = 32.28
2022-01-26 14:18:19.847 | DEBUG    | __main__:trials:24 - Trial = 23372/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.848 | DEBUG    | __main__:trials:29 - Trial = 23372/30000 | Total reward = 38.17
2022-01-26 14:18:19.852 | DEBUG    | __main__:trials:24 - Trial = 23373/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.854 | DEBUG    | __main__:trials:29 - Trial = 23373/30000 | Total reward = 35.37
2022-01-26 14:18:19.857 | DEBUG    | __main__:trials:24 - Trial = 23374/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.859 | DEBUG    | __main__:trials:29 - Trial = 23374/30000 | Total reward = 45.43
2022-01-26 14:18:19.862 | DEBUG    | __main__:trials:26 - Trial = 23375/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.864 | DEBUG    | __main__:trials:29 - Trial = 23375/30000 | Total reward = 29.73
2022-01-26 14:18:19.868 | DEBUG    | __main__:trials:24 - Trial = 23376/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.869 | DEBUG    | __main__:trials:29 - Trial = 23376/30000 | Total reward = 50.39
2022-01-26 14:18:19.873 | DEBUG    | __main__:trials:24 - Trial = 23377/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.875 | DEBUG    | __main__:trials:29 - Trial = 23377/30000 | Total reward = 39.35
2022-01-26 14:18:19.878 | DEBUG    | __main__:trials:26 - Trial = 23378/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.879 | DEBUG    | __main__:trials:29 - Trial = 23378/30000 | Total reward = 20.52
2022-01-26 14:18:19.883 | DEBUG    | __main__:trials:24 - Trial = 23379/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.884 | DEBUG    | __main__:trials:29 - Trial = 23379/30000 | Total reward = 36.12
2022-01-26 14:18:19.888 | DEBUG    | __main__:trials:24 - Trial = 23380/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.890 | DEBUG    | __main__:trials:29 - Trial = 23380/30000 | Total reward = 30.99
2022-01-26 14:18:19.893 | DEBUG    | __main__:trials:26 - Trial = 23381/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.894 | DEBUG    | __main__:trials:29 - Trial = 23381/30000 | Total reward = 31.25
2022-01-26 14:18:19.898 | DEBUG    | __main__:trials:24 - Trial = 23382/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.900 | DEBUG    | __main__:trials:29 - Trial = 23382/30000 | Total reward = 36.57
2022-01-26 14:18:19.903 | DEBUG    | __main__:trials:24 - Trial = 23383/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.904 | DEBUG    | __main__:trials:29 - Trial = 23383/30000 | Total reward = 51.22
2022-01-26 14:18:19.908 | DEBUG    | __main__:trials:24 - Trial = 23384/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.910 | DEBUG    | __main__:trials:29 - Trial = 23384/30000 | Total reward = 39.94
2022-01-26 14:18:19.913 | DEBUG    | __main__:trials:24 - Trial = 23385/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.915 | DEBUG    | __main__:trials:29 - Trial = 23385/30000 | Total reward = 36.99
2022-01-26 14:18:19.919 | DEBUG    | __main__:trials:26 - Trial = 23386/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.921 | DEBUG    | __main__:trials:29 - Trial = 23386/30000 | Total reward = 30.98
2022-01-26 14:18:19.924 | DEBUG    | __main__:trials:24 - Trial = 23387/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.925 | DEBUG    | __main__:trials:29 - Trial = 23387/30000 | Total reward = 43.86
2022-01-26 14:18:19.929 | DEBUG    | __main__:trials:26 - Trial = 23388/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.930 | DEBUG    | __main__:trials:29 - Trial = 23388/30000 | Total reward = 23.51
2022-01-26 14:18:19.934 | DEBUG    | __main__:trials:26 - Trial = 23389/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.935 | DEBUG    | __main__:trials:29 - Trial = 23389/30000 | Total reward = 27.92
2022-01-26 14:18:19.939 | DEBUG    | __main__:trials:26 - Trial = 23390/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:19.939 | DEBUG    | __main__:trials:29 - Trial = 23390/30000 | Total reward = 29.24
2022-01-26 14:18:19.943 | DEBUG    | __main__:trials:24 - Trial = 23391/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.945 | DEBUG    | __main__:trials:29 - Trial = 23391/30000 | Total reward = 34.72
2022-01-26 14:18:19.948 | DEBUG    | __main__:trials:24 - Trial = 23392/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.950 | DEBUG    | __main__:trials:29 - Trial = 23392/30000 | Total reward = 49.77
2022-01-26 14:18:19.953 | DEBUG    | __main__:trials:24 - Trial = 23393/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.955 | DEBUG    | __main__:trials:29 - Trial = 23393/30000 | Total reward = 29.06
2022-01-26 14:18:19.959 | DEBUG    | __main__:trials:24 - Trial = 23394/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.959 | DEBUG    | __main__:trials:29 - Trial = 23394/30000 | Total reward = 45.55
2022-01-26 14:18:19.964 | DEBUG    | __main__:trials:24 - Trial = 23395/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.965 | DEBUG    | __main__:trials:29 - Trial = 23395/30000 | Total reward = 47.77
2022-01-26 14:18:19.969 | DEBUG    | __main__:trials:24 - Trial = 23396/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.971 | DEBUG    | __main__:trials:29 - Trial = 23396/30000 | Total reward = 44.31
2022-01-26 14:18:19.974 | DEBUG    | __main__:trials:24 - Trial = 23397/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.975 | DEBUG    | __main__:trials:29 - Trial = 23397/30000 | Total reward = 37.20
2022-01-26 14:18:19.979 | DEBUG    | __main__:trials:24 - Trial = 23398/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.980 | DEBUG    | __main__:trials:29 - Trial = 23398/30000 | Total reward = 44.68
2022-01-26 14:18:19.985 | DEBUG    | __main__:trials:24 - Trial = 23399/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.986 | DEBUG    | __main__:trials:29 - Trial = 23399/30000 | Total reward = 39.06
2022-01-26 14:18:19.991 | DEBUG    | __main__:trials:24 - Trial = 23400/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.992 | DEBUG    | __main__:trials:29 - Trial = 23400/30000 | Total reward = 39.05
2022-01-26 14:18:19.995 | DEBUG    | __main__:trials:24 - Trial = 23401/30000 | Max number of steps (20) reached
2022-01-26 14:18:19.997 | DEBUG    | __main__:trials:29 - Trial = 23401/30000 | Total reward = 48.71
2022-01-26 14:18:20.000 | DEBUG    | __main__:trials:26 - Trial = 23402/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.001 | DEBUG    | __main__:trials:29 - Trial = 23402/30000 | Total reward = 26.69
2022-01-26 14:18:20.005 | DEBUG    | __main__:trials:26 - Trial = 23403/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.006 | DEBUG    | __main__:trials:29 - Trial = 23403/30000 | Total reward = 19.36
2022-01-26 14:18:20.010 | DEBUG    | __main__:trials:24 - Trial = 23404/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.010 | DEBUG    | __main__:trials:29 - Trial = 23404/30000 | Total reward = 40.41
2022-01-26 14:18:20.014 | DEBUG    | __main__:trials:24 - Trial = 23405/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.016 | DEBUG    | __main__:trials:29 - Trial = 23405/30000 | Total reward = 31.53
2022-01-26 14:18:20.019 | DEBUG    | __main__:trials:24 - Trial = 23406/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.021 | DEBUG    | __main__:trials:29 - Trial = 23406/30000 | Total reward = 27.74
2022-01-26 14:18:20.025 | DEBUG    | __main__:trials:24 - Trial = 23407/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.026 | DEBUG    | __main__:trials:29 - Trial = 23407/30000 | Total reward = 45.74
2022-01-26 14:18:20.030 | DEBUG    | __main__:trials:26 - Trial = 23408/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.031 | DEBUG    | __main__:trials:29 - Trial = 23408/30000 | Total reward = 15.49
2022-01-26 14:18:20.035 | DEBUG    | __main__:trials:26 - Trial = 23409/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.037 | DEBUG    | __main__:trials:29 - Trial = 23409/30000 | Total reward = 27.08
2022-01-26 14:18:20.040 | DEBUG    | __main__:trials:24 - Trial = 23410/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.041 | DEBUG    | __main__:trials:29 - Trial = 23410/30000 | Total reward = 31.38
2022-01-26 14:18:20.046 | DEBUG    | __main__:trials:24 - Trial = 23411/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.046 | DEBUG    | __main__:trials:29 - Trial = 23411/30000 | Total reward = 41.13
2022-01-26 14:18:20.051 | DEBUG    | __main__:trials:24 - Trial = 23412/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.052 | DEBUG    | __main__:trials:29 - Trial = 23412/30000 | Total reward = 28.24
2022-01-26 14:18:20.056 | DEBUG    | __main__:trials:24 - Trial = 23413/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.057 | DEBUG    | __main__:trials:29 - Trial = 23413/30000 | Total reward = 48.79
2022-01-26 14:18:20.061 | DEBUG    | __main__:trials:24 - Trial = 23414/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.063 | DEBUG    | __main__:trials:29 - Trial = 23414/30000 | Total reward = 40.05
2022-01-26 14:18:20.065 | DEBUG    | __main__:trials:26 - Trial = 23415/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.067 | DEBUG    | __main__:trials:29 - Trial = 23415/30000 | Total reward = 13.76
2022-01-26 14:18:20.071 | DEBUG    | __main__:trials:24 - Trial = 23416/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.072 | DEBUG    | __main__:trials:29 - Trial = 23416/30000 | Total reward = 23.06
2022-01-26 14:18:20.076 | DEBUG    | __main__:trials:24 - Trial = 23417/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.077 | DEBUG    | __main__:trials:29 - Trial = 23417/30000 | Total reward = 41.67
2022-01-26 14:18:20.081 | DEBUG    | __main__:trials:24 - Trial = 23418/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.083 | DEBUG    | __main__:trials:29 - Trial = 23418/30000 | Total reward = 42.14
2022-01-26 14:18:20.086 | DEBUG    | __main__:trials:24 - Trial = 23419/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.088 | DEBUG    | __main__:trials:29 - Trial = 23419/30000 | Total reward = 34.15
2022-01-26 14:18:20.091 | DEBUG    | __main__:trials:24 - Trial = 23420/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.092 | DEBUG    | __main__:trials:29 - Trial = 23420/30000 | Total reward = 38.80
2022-01-26 14:18:20.096 | DEBUG    | __main__:trials:24 - Trial = 23421/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.097 | DEBUG    | __main__:trials:29 - Trial = 23421/30000 | Total reward = 34.04
2022-01-26 14:18:20.101 | DEBUG    | __main__:trials:24 - Trial = 23422/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.103 | DEBUG    | __main__:trials:29 - Trial = 23422/30000 | Total reward = 33.86
2022-01-26 14:18:20.106 | DEBUG    | __main__:trials:24 - Trial = 23423/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.108 | DEBUG    | __main__:trials:29 - Trial = 23423/30000 | Total reward = 33.28
2022-01-26 14:18:20.112 | DEBUG    | __main__:trials:24 - Trial = 23424/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.114 | DEBUG    | __main__:trials:29 - Trial = 23424/30000 | Total reward = 37.90
2022-01-26 14:18:20.118 | DEBUG    | __main__:trials:26 - Trial = 23425/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.119 | DEBUG    | __main__:trials:29 - Trial = 23425/30000 | Total reward = 20.74
2022-01-26 14:18:20.122 | DEBUG    | __main__:trials:24 - Trial = 23426/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.124 | DEBUG    | __main__:trials:29 - Trial = 23426/30000 | Total reward = 48.24
2022-01-26 14:18:20.128 | DEBUG    | __main__:trials:24 - Trial = 23427/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.130 | DEBUG    | __main__:trials:29 - Trial = 23427/30000 | Total reward = 49.44
2022-01-26 14:18:20.134 | DEBUG    | __main__:trials:24 - Trial = 23428/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.135 | DEBUG    | __main__:trials:29 - Trial = 23428/30000 | Total reward = 30.18
2022-01-26 14:18:20.139 | DEBUG    | __main__:trials:24 - Trial = 23429/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.141 | DEBUG    | __main__:trials:29 - Trial = 23429/30000 | Total reward = -1.60
2022-01-26 14:18:20.145 | DEBUG    | __main__:trials:24 - Trial = 23430/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.146 | DEBUG    | __main__:trials:29 - Trial = 23430/30000 | Total reward = 35.09
2022-01-26 14:18:20.150 | DEBUG    | __main__:trials:24 - Trial = 23431/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.151 | DEBUG    | __main__:trials:29 - Trial = 23431/30000 | Total reward = 41.08
2022-01-26 14:18:20.154 | DEBUG    | __main__:trials:24 - Trial = 23432/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.155 | DEBUG    | __main__:trials:29 - Trial = 23432/30000 | Total reward = 34.84
2022-01-26 14:18:20.158 | DEBUG    | __main__:trials:24 - Trial = 23433/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.159 | DEBUG    | __main__:trials:29 - Trial = 23433/30000 | Total reward = 42.24
2022-01-26 14:18:20.162 | DEBUG    | __main__:trials:24 - Trial = 23434/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.163 | DEBUG    | __main__:trials:29 - Trial = 23434/30000 | Total reward = 33.79
2022-01-26 14:18:20.166 | DEBUG    | __main__:trials:24 - Trial = 23435/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.167 | DEBUG    | __main__:trials:29 - Trial = 23435/30000 | Total reward = 34.62
2022-01-26 14:18:20.170 | DEBUG    | __main__:trials:24 - Trial = 23436/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.171 | DEBUG    | __main__:trials:29 - Trial = 23436/30000 | Total reward = 26.47
2022-01-26 14:18:20.174 | DEBUG    | __main__:trials:24 - Trial = 23437/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.175 | DEBUG    | __main__:trials:29 - Trial = 23437/30000 | Total reward = 43.00
2022-01-26 14:18:20.178 | DEBUG    | __main__:trials:24 - Trial = 23438/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.179 | DEBUG    | __main__:trials:29 - Trial = 23438/30000 | Total reward = 31.95
2022-01-26 14:18:20.182 | DEBUG    | __main__:trials:24 - Trial = 23439/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.183 | DEBUG    | __main__:trials:29 - Trial = 23439/30000 | Total reward = 47.05
2022-01-26 14:18:20.186 | DEBUG    | __main__:trials:24 - Trial = 23440/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.187 | DEBUG    | __main__:trials:29 - Trial = 23440/30000 | Total reward = 31.78
2022-01-26 14:18:20.190 | DEBUG    | __main__:trials:24 - Trial = 23441/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.191 | DEBUG    | __main__:trials:29 - Trial = 23441/30000 | Total reward = 20.37
2022-01-26 14:18:20.194 | DEBUG    | __main__:trials:24 - Trial = 23442/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.194 | DEBUG    | __main__:trials:29 - Trial = 23442/30000 | Total reward = 40.01
2022-01-26 14:18:20.197 | DEBUG    | __main__:trials:24 - Trial = 23443/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.199 | DEBUG    | __main__:trials:29 - Trial = 23443/30000 | Total reward = 44.99
2022-01-26 14:18:20.202 | DEBUG    | __main__:trials:24 - Trial = 23444/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.203 | DEBUG    | __main__:trials:29 - Trial = 23444/30000 | Total reward = 50.83
2022-01-26 14:18:20.206 | DEBUG    | __main__:trials:24 - Trial = 23445/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.207 | DEBUG    | __main__:trials:29 - Trial = 23445/30000 | Total reward = 14.66
2022-01-26 14:18:20.210 | DEBUG    | __main__:trials:24 - Trial = 23446/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.211 | DEBUG    | __main__:trials:29 - Trial = 23446/30000 | Total reward = 34.85
2022-01-26 14:18:20.214 | DEBUG    | __main__:trials:26 - Trial = 23447/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.215 | DEBUG    | __main__:trials:29 - Trial = 23447/30000 | Total reward = 27.75
2022-01-26 14:18:20.217 | DEBUG    | __main__:trials:24 - Trial = 23448/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.218 | DEBUG    | __main__:trials:29 - Trial = 23448/30000 | Total reward = 51.27
2022-01-26 14:18:20.221 | DEBUG    | __main__:trials:24 - Trial = 23449/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.223 | DEBUG    | __main__:trials:29 - Trial = 23449/30000 | Total reward = 33.56
2022-01-26 14:18:20.226 | DEBUG    | __main__:trials:24 - Trial = 23450/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.228 | DEBUG    | __main__:trials:29 - Trial = 23450/30000 | Total reward = 42.66
2022-01-26 14:18:20.231 | DEBUG    | __main__:trials:24 - Trial = 23451/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.232 | DEBUG    | __main__:trials:29 - Trial = 23451/30000 | Total reward = 35.89
2022-01-26 14:18:20.235 | DEBUG    | __main__:trials:24 - Trial = 23452/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.235 | DEBUG    | __main__:trials:29 - Trial = 23452/30000 | Total reward = 50.82
2022-01-26 14:18:20.239 | DEBUG    | __main__:trials:24 - Trial = 23453/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.240 | DEBUG    | __main__:trials:29 - Trial = 23453/30000 | Total reward = 32.17
2022-01-26 14:18:20.242 | DEBUG    | __main__:trials:26 - Trial = 23454/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.243 | DEBUG    | __main__:trials:29 - Trial = 23454/30000 | Total reward = 19.69
2022-01-26 14:18:20.246 | DEBUG    | __main__:trials:24 - Trial = 23455/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.247 | DEBUG    | __main__:trials:29 - Trial = 23455/30000 | Total reward = 47.60
2022-01-26 14:18:20.250 | DEBUG    | __main__:trials:24 - Trial = 23456/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.251 | DEBUG    | __main__:trials:29 - Trial = 23456/30000 | Total reward = 45.76
2022-01-26 14:18:20.254 | DEBUG    | __main__:trials:24 - Trial = 23457/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.255 | DEBUG    | __main__:trials:29 - Trial = 23457/30000 | Total reward = 30.25
2022-01-26 14:18:20.258 | DEBUG    | __main__:trials:24 - Trial = 23458/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.259 | DEBUG    | __main__:trials:29 - Trial = 23458/30000 | Total reward = 32.74
2022-01-26 14:18:20.262 | DEBUG    | __main__:trials:24 - Trial = 23459/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.263 | DEBUG    | __main__:trials:29 - Trial = 23459/30000 | Total reward = 45.76
2022-01-26 14:18:20.266 | DEBUG    | __main__:trials:24 - Trial = 23460/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.266 | DEBUG    | __main__:trials:29 - Trial = 23460/30000 | Total reward = 27.33
2022-01-26 14:18:20.269 | DEBUG    | __main__:trials:24 - Trial = 23461/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.270 | DEBUG    | __main__:trials:29 - Trial = 23461/30000 | Total reward = 41.07
2022-01-26 14:18:20.273 | DEBUG    | __main__:trials:24 - Trial = 23462/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.275 | DEBUG    | __main__:trials:29 - Trial = 23462/30000 | Total reward = 35.95
2022-01-26 14:18:20.279 | DEBUG    | __main__:trials:24 - Trial = 23463/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.280 | DEBUG    | __main__:trials:29 - Trial = 23463/30000 | Total reward = 49.93
2022-01-26 14:18:20.284 | DEBUG    | __main__:trials:24 - Trial = 23464/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.284 | DEBUG    | __main__:trials:29 - Trial = 23464/30000 | Total reward = 25.62
2022-01-26 14:18:20.289 | DEBUG    | __main__:trials:24 - Trial = 23465/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.290 | DEBUG    | __main__:trials:29 - Trial = 23465/30000 | Total reward = 46.18
2022-01-26 14:18:20.294 | DEBUG    | __main__:trials:24 - Trial = 23466/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.296 | DEBUG    | __main__:trials:29 - Trial = 23466/30000 | Total reward = 47.84
2022-01-26 14:18:20.299 | DEBUG    | __main__:trials:24 - Trial = 23467/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.301 | DEBUG    | __main__:trials:29 - Trial = 23467/30000 | Total reward = 34.75
2022-01-26 14:18:20.303 | DEBUG    | __main__:trials:26 - Trial = 23468/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.305 | DEBUG    | __main__:trials:29 - Trial = 23468/30000 | Total reward = 27.07
2022-01-26 14:18:20.308 | DEBUG    | __main__:trials:26 - Trial = 23469/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.310 | DEBUG    | __main__:trials:29 - Trial = 23469/30000 | Total reward = 35.10
2022-01-26 14:18:20.314 | DEBUG    | __main__:trials:24 - Trial = 23470/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.314 | DEBUG    | __main__:trials:29 - Trial = 23470/30000 | Total reward = 42.76
2022-01-26 14:18:20.318 | DEBUG    | __main__:trials:24 - Trial = 23471/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.320 | DEBUG    | __main__:trials:29 - Trial = 23471/30000 | Total reward = 42.04
2022-01-26 14:18:20.323 | DEBUG    | __main__:trials:24 - Trial = 23472/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.324 | DEBUG    | __main__:trials:29 - Trial = 23472/30000 | Total reward = 36.15
2022-01-26 14:18:20.328 | DEBUG    | __main__:trials:26 - Trial = 23473/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.329 | DEBUG    | __main__:trials:29 - Trial = 23473/30000 | Total reward = 21.48
2022-01-26 14:18:20.332 | DEBUG    | __main__:trials:26 - Trial = 23474/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.334 | DEBUG    | __main__:trials:29 - Trial = 23474/30000 | Total reward = 13.69
2022-01-26 14:18:20.337 | DEBUG    | __main__:trials:24 - Trial = 23475/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.339 | DEBUG    | __main__:trials:29 - Trial = 23475/30000 | Total reward = 36.10
2022-01-26 14:18:20.342 | DEBUG    | __main__:trials:24 - Trial = 23476/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.344 | DEBUG    | __main__:trials:29 - Trial = 23476/30000 | Total reward = 23.54
2022-01-26 14:18:20.347 | DEBUG    | __main__:trials:26 - Trial = 23477/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.348 | DEBUG    | __main__:trials:29 - Trial = 23477/30000 | Total reward = 22.31
2022-01-26 14:18:20.352 | DEBUG    | __main__:trials:26 - Trial = 23478/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.354 | DEBUG    | __main__:trials:29 - Trial = 23478/30000 | Total reward = 24.51
2022-01-26 14:18:20.357 | DEBUG    | __main__:trials:24 - Trial = 23479/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.359 | DEBUG    | __main__:trials:29 - Trial = 23479/30000 | Total reward = 26.52
2022-01-26 14:18:20.362 | DEBUG    | __main__:trials:26 - Trial = 23480/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.363 | DEBUG    | __main__:trials:29 - Trial = 23480/30000 | Total reward = 24.88
2022-01-26 14:18:20.367 | DEBUG    | __main__:trials:24 - Trial = 23481/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.368 | DEBUG    | __main__:trials:29 - Trial = 23481/30000 | Total reward = 41.91
2022-01-26 14:18:20.372 | DEBUG    | __main__:trials:24 - Trial = 23482/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.374 | DEBUG    | __main__:trials:29 - Trial = 23482/30000 | Total reward = 28.01
2022-01-26 14:18:20.378 | DEBUG    | __main__:trials:24 - Trial = 23483/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.379 | DEBUG    | __main__:trials:29 - Trial = 23483/30000 | Total reward = 52.00
2022-01-26 14:18:20.383 | DEBUG    | __main__:trials:24 - Trial = 23484/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.384 | DEBUG    | __main__:trials:29 - Trial = 23484/30000 | Total reward = 34.31
2022-01-26 14:18:20.388 | DEBUG    | __main__:trials:24 - Trial = 23485/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.389 | DEBUG    | __main__:trials:29 - Trial = 23485/30000 | Total reward = 49.73
2022-01-26 14:18:20.392 | DEBUG    | __main__:trials:24 - Trial = 23486/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.394 | DEBUG    | __main__:trials:29 - Trial = 23486/30000 | Total reward = 22.53
2022-01-26 14:18:20.397 | DEBUG    | __main__:trials:24 - Trial = 23487/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.398 | DEBUG    | __main__:trials:29 - Trial = 23487/30000 | Total reward = 42.19
2022-01-26 14:18:20.401 | DEBUG    | __main__:trials:26 - Trial = 23488/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.401 | DEBUG    | __main__:trials:29 - Trial = 23488/30000 | Total reward = 22.11
2022-01-26 14:18:20.405 | DEBUG    | __main__:trials:26 - Trial = 23489/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.407 | DEBUG    | __main__:trials:29 - Trial = 23489/30000 | Total reward = 17.52
2022-01-26 14:18:20.410 | DEBUG    | __main__:trials:24 - Trial = 23490/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.411 | DEBUG    | __main__:trials:29 - Trial = 23490/30000 | Total reward = 51.64
2022-01-26 14:18:20.415 | DEBUG    | __main__:trials:24 - Trial = 23491/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.417 | DEBUG    | __main__:trials:29 - Trial = 23491/30000 | Total reward = 51.89
2022-01-26 14:18:20.420 | DEBUG    | __main__:trials:24 - Trial = 23492/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.422 | DEBUG    | __main__:trials:29 - Trial = 23492/30000 | Total reward = 35.90
2022-01-26 14:18:20.426 | DEBUG    | __main__:trials:26 - Trial = 23493/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.427 | DEBUG    | __main__:trials:29 - Trial = 23493/30000 | Total reward = 28.08
2022-01-26 14:18:20.431 | DEBUG    | __main__:trials:24 - Trial = 23494/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.432 | DEBUG    | __main__:trials:29 - Trial = 23494/30000 | Total reward = 39.00
2022-01-26 14:18:20.436 | DEBUG    | __main__:trials:24 - Trial = 23495/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.436 | DEBUG    | __main__:trials:29 - Trial = 23495/30000 | Total reward = 39.94
2022-01-26 14:18:20.440 | DEBUG    | __main__:trials:24 - Trial = 23496/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.442 | DEBUG    | __main__:trials:29 - Trial = 23496/30000 | Total reward = 41.83
2022-01-26 14:18:20.446 | DEBUG    | __main__:trials:24 - Trial = 23497/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.446 | DEBUG    | __main__:trials:29 - Trial = 23497/30000 | Total reward = 41.23
2022-01-26 14:18:20.450 | DEBUG    | __main__:trials:24 - Trial = 23498/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.452 | DEBUG    | __main__:trials:29 - Trial = 23498/30000 | Total reward = 29.48
2022-01-26 14:18:20.455 | DEBUG    | __main__:trials:24 - Trial = 23499/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.457 | DEBUG    | __main__:trials:29 - Trial = 23499/30000 | Total reward = 47.08
2022-01-26 14:18:20.460 | DEBUG    | __main__:trials:24 - Trial = 23500/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.462 | DEBUG    | __main__:trials:29 - Trial = 23500/30000 | Total reward = 40.55
2022-01-26 14:18:20.466 | DEBUG    | __main__:trials:24 - Trial = 23501/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.467 | DEBUG    | __main__:trials:29 - Trial = 23501/30000 | Total reward = 35.66
2022-01-26 14:18:20.471 | DEBUG    | __main__:trials:24 - Trial = 23502/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.473 | DEBUG    | __main__:trials:29 - Trial = 23502/30000 | Total reward = 31.15
2022-01-26 14:18:20.476 | DEBUG    | __main__:trials:24 - Trial = 23503/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.477 | DEBUG    | __main__:trials:29 - Trial = 23503/30000 | Total reward = 36.50
2022-01-26 14:18:20.482 | DEBUG    | __main__:trials:24 - Trial = 23504/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.482 | DEBUG    | __main__:trials:29 - Trial = 23504/30000 | Total reward = 40.73
2022-01-26 14:18:20.487 | DEBUG    | __main__:trials:24 - Trial = 23505/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.488 | DEBUG    | __main__:trials:29 - Trial = 23505/30000 | Total reward = 34.46
2022-01-26 14:18:20.492 | DEBUG    | __main__:trials:24 - Trial = 23506/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.493 | DEBUG    | __main__:trials:29 - Trial = 23506/30000 | Total reward = 45.11
2022-01-26 14:18:20.496 | DEBUG    | __main__:trials:24 - Trial = 23507/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.498 | DEBUG    | __main__:trials:29 - Trial = 23507/30000 | Total reward = 30.50
2022-01-26 14:18:20.502 | DEBUG    | __main__:trials:24 - Trial = 23508/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.503 | DEBUG    | __main__:trials:29 - Trial = 23508/30000 | Total reward = 42.30
2022-01-26 14:18:20.507 | DEBUG    | __main__:trials:24 - Trial = 23509/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.508 | DEBUG    | __main__:trials:29 - Trial = 23509/30000 | Total reward = 25.10
2022-01-26 14:18:20.512 | DEBUG    | __main__:trials:26 - Trial = 23510/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.513 | DEBUG    | __main__:trials:29 - Trial = 23510/30000 | Total reward = 22.11
2022-01-26 14:18:20.517 | DEBUG    | __main__:trials:24 - Trial = 23511/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.517 | DEBUG    | __main__:trials:29 - Trial = 23511/30000 | Total reward = 33.35
2022-01-26 14:18:20.521 | DEBUG    | __main__:trials:24 - Trial = 23512/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.522 | DEBUG    | __main__:trials:29 - Trial = 23512/30000 | Total reward = 44.62
2022-01-26 14:18:20.526 | DEBUG    | __main__:trials:24 - Trial = 23513/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.527 | DEBUG    | __main__:trials:29 - Trial = 23513/30000 | Total reward = 27.36
2022-01-26 14:18:20.531 | DEBUG    | __main__:trials:24 - Trial = 23514/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.532 | DEBUG    | __main__:trials:29 - Trial = 23514/30000 | Total reward = 41.06
2022-01-26 14:18:20.536 | DEBUG    | __main__:trials:24 - Trial = 23515/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.537 | DEBUG    | __main__:trials:29 - Trial = 23515/30000 | Total reward = 28.67
2022-01-26 14:18:20.541 | DEBUG    | __main__:trials:24 - Trial = 23516/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.542 | DEBUG    | __main__:trials:29 - Trial = 23516/30000 | Total reward = 47.65
2022-01-26 14:18:20.546 | DEBUG    | __main__:trials:26 - Trial = 23517/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.547 | DEBUG    | __main__:trials:29 - Trial = 23517/30000 | Total reward = 16.95
2022-01-26 14:18:20.550 | DEBUG    | __main__:trials:26 - Trial = 23518/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.552 | DEBUG    | __main__:trials:29 - Trial = 23518/30000 | Total reward = 22.12
2022-01-26 14:18:20.554 | DEBUG    | __main__:trials:26 - Trial = 23519/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.555 | DEBUG    | __main__:trials:29 - Trial = 23519/30000 | Total reward = 11.94
2022-01-26 14:18:20.559 | DEBUG    | __main__:trials:24 - Trial = 23520/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.561 | DEBUG    | __main__:trials:29 - Trial = 23520/30000 | Total reward = 44.58
2022-01-26 14:18:20.564 | DEBUG    | __main__:trials:24 - Trial = 23521/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.565 | DEBUG    | __main__:trials:29 - Trial = 23521/30000 | Total reward = 34.48
2022-01-26 14:18:20.568 | DEBUG    | __main__:trials:26 - Trial = 23522/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.570 | DEBUG    | __main__:trials:29 - Trial = 23522/30000 | Total reward = 19.13
2022-01-26 14:18:20.572 | DEBUG    | __main__:trials:24 - Trial = 23523/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.574 | DEBUG    | __main__:trials:29 - Trial = 23523/30000 | Total reward = 34.84
2022-01-26 14:18:20.577 | DEBUG    | __main__:trials:24 - Trial = 23524/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.578 | DEBUG    | __main__:trials:29 - Trial = 23524/30000 | Total reward = 55.81
2022-01-26 14:18:20.581 | DEBUG    | __main__:trials:24 - Trial = 23525/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.582 | DEBUG    | __main__:trials:29 - Trial = 23525/30000 | Total reward = 30.65
2022-01-26 14:18:20.586 | DEBUG    | __main__:trials:24 - Trial = 23526/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.587 | DEBUG    | __main__:trials:29 - Trial = 23526/30000 | Total reward = 33.86
2022-01-26 14:18:20.591 | DEBUG    | __main__:trials:26 - Trial = 23527/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.592 | DEBUG    | __main__:trials:29 - Trial = 23527/30000 | Total reward = 32.17
2022-01-26 14:18:20.596 | DEBUG    | __main__:trials:24 - Trial = 23528/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.597 | DEBUG    | __main__:trials:29 - Trial = 23528/30000 | Total reward = 42.64
2022-01-26 14:18:20.601 | DEBUG    | __main__:trials:24 - Trial = 23529/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.602 | DEBUG    | __main__:trials:29 - Trial = 23529/30000 | Total reward = 43.98
2022-01-26 14:18:20.606 | DEBUG    | __main__:trials:24 - Trial = 23530/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.608 | DEBUG    | __main__:trials:29 - Trial = 23530/30000 | Total reward = 42.95
2022-01-26 14:18:20.611 | DEBUG    | __main__:trials:24 - Trial = 23531/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.612 | DEBUG    | __main__:trials:29 - Trial = 23531/30000 | Total reward = 33.86
2022-01-26 14:18:20.616 | DEBUG    | __main__:trials:24 - Trial = 23532/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.618 | DEBUG    | __main__:trials:29 - Trial = 23532/30000 | Total reward = 28.00
2022-01-26 14:18:20.621 | DEBUG    | __main__:trials:24 - Trial = 23533/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.622 | DEBUG    | __main__:trials:29 - Trial = 23533/30000 | Total reward = 39.22
2022-01-26 14:18:20.626 | DEBUG    | __main__:trials:24 - Trial = 23534/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.627 | DEBUG    | __main__:trials:29 - Trial = 23534/30000 | Total reward = 33.86
2022-01-26 14:18:20.631 | DEBUG    | __main__:trials:24 - Trial = 23535/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.632 | DEBUG    | __main__:trials:29 - Trial = 23535/30000 | Total reward = 48.70
2022-01-26 14:18:20.636 | DEBUG    | __main__:trials:24 - Trial = 23536/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.637 | DEBUG    | __main__:trials:29 - Trial = 23536/30000 | Total reward = 42.95
2022-01-26 14:18:20.641 | DEBUG    | __main__:trials:24 - Trial = 23537/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.642 | DEBUG    | __main__:trials:29 - Trial = 23537/30000 | Total reward = 46.31
2022-01-26 14:18:20.647 | DEBUG    | __main__:trials:24 - Trial = 23538/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.649 | DEBUG    | __main__:trials:29 - Trial = 23538/30000 | Total reward = 41.63
2022-01-26 14:18:20.652 | DEBUG    | __main__:trials:24 - Trial = 23539/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.653 | DEBUG    | __main__:trials:29 - Trial = 23539/30000 | Total reward = 38.73
2022-01-26 14:18:20.657 | DEBUG    | __main__:trials:24 - Trial = 23540/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.658 | DEBUG    | __main__:trials:29 - Trial = 23540/30000 | Total reward = 44.68
2022-01-26 14:18:20.662 | DEBUG    | __main__:trials:24 - Trial = 23541/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.663 | DEBUG    | __main__:trials:29 - Trial = 23541/30000 | Total reward = 44.85
2022-01-26 14:18:20.667 | DEBUG    | __main__:trials:24 - Trial = 23542/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.668 | DEBUG    | __main__:trials:29 - Trial = 23542/30000 | Total reward = 48.46
2022-01-26 14:18:20.672 | DEBUG    | __main__:trials:26 - Trial = 23543/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.672 | DEBUG    | __main__:trials:29 - Trial = 23543/30000 | Total reward = 13.62
2022-01-26 14:18:20.677 | DEBUG    | __main__:trials:26 - Trial = 23544/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.678 | DEBUG    | __main__:trials:29 - Trial = 23544/30000 | Total reward = 23.85
2022-01-26 14:18:20.681 | DEBUG    | __main__:trials:24 - Trial = 23545/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.683 | DEBUG    | __main__:trials:29 - Trial = 23545/30000 | Total reward = 33.27
2022-01-26 14:18:20.686 | DEBUG    | __main__:trials:24 - Trial = 23546/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.686 | DEBUG    | __main__:trials:29 - Trial = 23546/30000 | Total reward = 49.99
2022-01-26 14:18:20.690 | DEBUG    | __main__:trials:24 - Trial = 23547/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.691 | DEBUG    | __main__:trials:29 - Trial = 23547/30000 | Total reward = 28.77
2022-01-26 14:18:20.694 | DEBUG    | __main__:trials:24 - Trial = 23548/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.696 | DEBUG    | __main__:trials:29 - Trial = 23548/30000 | Total reward = 31.53
2022-01-26 14:18:20.700 | DEBUG    | __main__:trials:24 - Trial = 23549/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.701 | DEBUG    | __main__:trials:29 - Trial = 23549/30000 | Total reward = 54.22
2022-01-26 14:18:20.705 | DEBUG    | __main__:trials:24 - Trial = 23550/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.707 | DEBUG    | __main__:trials:29 - Trial = 23550/30000 | Total reward = 33.03
2022-01-26 14:18:20.709 | DEBUG    | __main__:trials:26 - Trial = 23551/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.711 | DEBUG    | __main__:trials:29 - Trial = 23551/30000 | Total reward = 19.47
2022-01-26 14:18:20.715 | DEBUG    | __main__:trials:24 - Trial = 23552/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.716 | DEBUG    | __main__:trials:29 - Trial = 23552/30000 | Total reward = 44.56
2022-01-26 14:18:20.719 | DEBUG    | __main__:trials:24 - Trial = 23553/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.721 | DEBUG    | __main__:trials:29 - Trial = 23553/30000 | Total reward = 30.95
2022-01-26 14:18:20.725 | DEBUG    | __main__:trials:24 - Trial = 23554/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.725 | DEBUG    | __main__:trials:29 - Trial = 23554/30000 | Total reward = 46.79
2022-01-26 14:18:20.729 | DEBUG    | __main__:trials:24 - Trial = 23555/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.731 | DEBUG    | __main__:trials:29 - Trial = 23555/30000 | Total reward = 31.58
2022-01-26 14:18:20.734 | DEBUG    | __main__:trials:24 - Trial = 23556/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.735 | DEBUG    | __main__:trials:29 - Trial = 23556/30000 | Total reward = 33.49
2022-01-26 14:18:20.739 | DEBUG    | __main__:trials:26 - Trial = 23557/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.740 | DEBUG    | __main__:trials:29 - Trial = 23557/30000 | Total reward = 33.28
2022-01-26 14:18:20.744 | DEBUG    | __main__:trials:24 - Trial = 23558/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.746 | DEBUG    | __main__:trials:29 - Trial = 23558/30000 | Total reward = 39.44
2022-01-26 14:18:20.749 | DEBUG    | __main__:trials:24 - Trial = 23559/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.751 | DEBUG    | __main__:trials:29 - Trial = 23559/30000 | Total reward = 28.42
2022-01-26 14:18:20.755 | DEBUG    | __main__:trials:24 - Trial = 23560/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.755 | DEBUG    | __main__:trials:29 - Trial = 23560/30000 | Total reward = 37.91
2022-01-26 14:18:20.760 | DEBUG    | __main__:trials:24 - Trial = 23561/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.760 | DEBUG    | __main__:trials:29 - Trial = 23561/30000 | Total reward = 51.20
2022-01-26 14:18:20.764 | DEBUG    | __main__:trials:26 - Trial = 23562/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.765 | DEBUG    | __main__:trials:29 - Trial = 23562/30000 | Total reward = 16.18
2022-01-26 14:18:20.768 | DEBUG    | __main__:trials:24 - Trial = 23563/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.769 | DEBUG    | __main__:trials:29 - Trial = 23563/30000 | Total reward = 30.40
2022-01-26 14:18:20.773 | DEBUG    | __main__:trials:24 - Trial = 23564/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.773 | DEBUG    | __main__:trials:29 - Trial = 23564/30000 | Total reward = 32.82
2022-01-26 14:18:20.777 | DEBUG    | __main__:trials:24 - Trial = 23565/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.778 | DEBUG    | __main__:trials:29 - Trial = 23565/30000 | Total reward = 34.09
2022-01-26 14:18:20.781 | DEBUG    | __main__:trials:24 - Trial = 23566/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.783 | DEBUG    | __main__:trials:29 - Trial = 23566/30000 | Total reward = 37.31
2022-01-26 14:18:20.786 | DEBUG    | __main__:trials:24 - Trial = 23567/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.787 | DEBUG    | __main__:trials:29 - Trial = 23567/30000 | Total reward = 49.98
2022-01-26 14:18:20.790 | DEBUG    | __main__:trials:24 - Trial = 23568/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.792 | DEBUG    | __main__:trials:29 - Trial = 23568/30000 | Total reward = 29.78
2022-01-26 14:18:20.795 | DEBUG    | __main__:trials:24 - Trial = 23569/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.796 | DEBUG    | __main__:trials:29 - Trial = 23569/30000 | Total reward = 54.09
2022-01-26 14:18:20.800 | DEBUG    | __main__:trials:24 - Trial = 23570/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.801 | DEBUG    | __main__:trials:29 - Trial = 23570/30000 | Total reward = 46.12
2022-01-26 14:18:20.809 | DEBUG    | __main__:trials:24 - Trial = 23571/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.810 | DEBUG    | __main__:trials:29 - Trial = 23571/30000 | Total reward = 37.48
2022-01-26 14:18:20.813 | DEBUG    | __main__:trials:26 - Trial = 23572/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.814 | DEBUG    | __main__:trials:29 - Trial = 23572/30000 | Total reward = 28.06
2022-01-26 14:18:20.818 | DEBUG    | __main__:trials:24 - Trial = 23573/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.819 | DEBUG    | __main__:trials:29 - Trial = 23573/30000 | Total reward = 47.65
2022-01-26 14:18:20.822 | DEBUG    | __main__:trials:24 - Trial = 23574/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.824 | DEBUG    | __main__:trials:29 - Trial = 23574/30000 | Total reward = 25.00
2022-01-26 14:18:20.828 | DEBUG    | __main__:trials:24 - Trial = 23575/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.828 | DEBUG    | __main__:trials:29 - Trial = 23575/30000 | Total reward = 10.19
2022-01-26 14:18:20.832 | DEBUG    | __main__:trials:24 - Trial = 23576/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.834 | DEBUG    | __main__:trials:29 - Trial = 23576/30000 | Total reward = 36.84
2022-01-26 14:18:20.837 | DEBUG    | __main__:trials:24 - Trial = 23577/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.838 | DEBUG    | __main__:trials:29 - Trial = 23577/30000 | Total reward = 47.14
2022-01-26 14:18:20.841 | DEBUG    | __main__:trials:24 - Trial = 23578/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.843 | DEBUG    | __main__:trials:29 - Trial = 23578/30000 | Total reward = 33.27
2022-01-26 14:18:20.846 | DEBUG    | __main__:trials:24 - Trial = 23579/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.848 | DEBUG    | __main__:trials:29 - Trial = 23579/30000 | Total reward = 36.26
2022-01-26 14:18:20.852 | DEBUG    | __main__:trials:24 - Trial = 23580/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.853 | DEBUG    | __main__:trials:29 - Trial = 23580/30000 | Total reward = 37.15
2022-01-26 14:18:20.857 | DEBUG    | __main__:trials:24 - Trial = 23581/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.857 | DEBUG    | __main__:trials:29 - Trial = 23581/30000 | Total reward = 41.96
2022-01-26 14:18:20.861 | DEBUG    | __main__:trials:24 - Trial = 23582/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.863 | DEBUG    | __main__:trials:29 - Trial = 23582/30000 | Total reward = 45.26
2022-01-26 14:18:20.867 | DEBUG    | __main__:trials:24 - Trial = 23583/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.868 | DEBUG    | __main__:trials:29 - Trial = 23583/30000 | Total reward = 24.15
2022-01-26 14:18:20.871 | DEBUG    | __main__:trials:24 - Trial = 23584/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.873 | DEBUG    | __main__:trials:29 - Trial = 23584/30000 | Total reward = 24.16
2022-01-26 14:18:20.876 | DEBUG    | __main__:trials:26 - Trial = 23585/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.878 | DEBUG    | __main__:trials:29 - Trial = 23585/30000 | Total reward = 17.79
2022-01-26 14:18:20.881 | DEBUG    | __main__:trials:24 - Trial = 23586/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.883 | DEBUG    | __main__:trials:29 - Trial = 23586/30000 | Total reward = 31.68
2022-01-26 14:18:20.887 | DEBUG    | __main__:trials:24 - Trial = 23587/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.887 | DEBUG    | __main__:trials:29 - Trial = 23587/30000 | Total reward = 46.80
2022-01-26 14:18:20.892 | DEBUG    | __main__:trials:24 - Trial = 23588/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.893 | DEBUG    | __main__:trials:29 - Trial = 23588/30000 | Total reward = 36.39
2022-01-26 14:18:20.896 | DEBUG    | __main__:trials:24 - Trial = 23589/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.898 | DEBUG    | __main__:trials:29 - Trial = 23589/30000 | Total reward = 37.47
2022-01-26 14:18:20.901 | DEBUG    | __main__:trials:24 - Trial = 23590/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.903 | DEBUG    | __main__:trials:29 - Trial = 23590/30000 | Total reward = 53.27
2022-01-26 14:18:20.906 | DEBUG    | __main__:trials:24 - Trial = 23591/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.907 | DEBUG    | __main__:trials:29 - Trial = 23591/30000 | Total reward = 40.00
2022-01-26 14:18:20.910 | DEBUG    | __main__:trials:24 - Trial = 23592/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.912 | DEBUG    | __main__:trials:29 - Trial = 23592/30000 | Total reward = 35.39
2022-01-26 14:18:20.916 | DEBUG    | __main__:trials:24 - Trial = 23593/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.917 | DEBUG    | __main__:trials:29 - Trial = 23593/30000 | Total reward = 39.21
2022-01-26 14:18:20.921 | DEBUG    | __main__:trials:26 - Trial = 23594/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.922 | DEBUG    | __main__:trials:29 - Trial = 23594/30000 | Total reward = 32.56
2022-01-26 14:18:20.925 | DEBUG    | __main__:trials:24 - Trial = 23595/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.926 | DEBUG    | __main__:trials:29 - Trial = 23595/30000 | Total reward = 38.33
2022-01-26 14:18:20.929 | DEBUG    | __main__:trials:24 - Trial = 23596/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.931 | DEBUG    | __main__:trials:29 - Trial = 23596/30000 | Total reward = 33.51
2022-01-26 14:18:20.934 | DEBUG    | __main__:trials:24 - Trial = 23597/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.935 | DEBUG    | __main__:trials:29 - Trial = 23597/30000 | Total reward = 34.15
2022-01-26 14:18:20.938 | DEBUG    | __main__:trials:24 - Trial = 23598/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.940 | DEBUG    | __main__:trials:29 - Trial = 23598/30000 | Total reward = 37.40
2022-01-26 14:18:20.943 | DEBUG    | __main__:trials:26 - Trial = 23599/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.944 | DEBUG    | __main__:trials:29 - Trial = 23599/30000 | Total reward = 31.59
2022-01-26 14:18:20.948 | DEBUG    | __main__:trials:24 - Trial = 23600/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.949 | DEBUG    | __main__:trials:29 - Trial = 23600/30000 | Total reward = 33.66
2022-01-26 14:18:20.953 | DEBUG    | __main__:trials:24 - Trial = 23601/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.954 | DEBUG    | __main__:trials:29 - Trial = 23601/30000 | Total reward = 37.12
2022-01-26 14:18:20.958 | DEBUG    | __main__:trials:24 - Trial = 23602/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.958 | DEBUG    | __main__:trials:29 - Trial = 23602/30000 | Total reward = 34.45
2022-01-26 14:18:20.963 | DEBUG    | __main__:trials:24 - Trial = 23603/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.964 | DEBUG    | __main__:trials:29 - Trial = 23603/30000 | Total reward = 37.63
2022-01-26 14:18:20.966 | DEBUG    | __main__:trials:26 - Trial = 23604/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.968 | DEBUG    | __main__:trials:29 - Trial = 23604/30000 | Total reward = 20.78
2022-01-26 14:18:20.971 | DEBUG    | __main__:trials:26 - Trial = 23605/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.972 | DEBUG    | __main__:trials:29 - Trial = 23605/30000 | Total reward = 15.22
2022-01-26 14:18:20.975 | DEBUG    | __main__:trials:24 - Trial = 23606/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.977 | DEBUG    | __main__:trials:29 - Trial = 23606/30000 | Total reward = 32.38
2022-01-26 14:18:20.980 | DEBUG    | __main__:trials:26 - Trial = 23607/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:20.981 | DEBUG    | __main__:trials:29 - Trial = 23607/30000 | Total reward = 28.27
2022-01-26 14:18:20.985 | DEBUG    | __main__:trials:24 - Trial = 23608/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.987 | DEBUG    | __main__:trials:29 - Trial = 23608/30000 | Total reward = 43.56
2022-01-26 14:18:20.990 | DEBUG    | __main__:trials:24 - Trial = 23609/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.992 | DEBUG    | __main__:trials:29 - Trial = 23609/30000 | Total reward = 39.41
2022-01-26 14:18:20.994 | DEBUG    | __main__:trials:24 - Trial = 23610/30000 | Max number of steps (20) reached
2022-01-26 14:18:20.996 | DEBUG    | __main__:trials:29 - Trial = 23610/30000 | Total reward = 36.85
2022-01-26 14:18:20.999 | DEBUG    | __main__:trials:24 - Trial = 23611/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.001 | DEBUG    | __main__:trials:29 - Trial = 23611/30000 | Total reward = 38.59
2022-01-26 14:18:21.004 | DEBUG    | __main__:trials:24 - Trial = 23612/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.006 | DEBUG    | __main__:trials:29 - Trial = 23612/30000 | Total reward = 34.83
2022-01-26 14:18:21.009 | DEBUG    | __main__:trials:24 - Trial = 23613/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.011 | DEBUG    | __main__:trials:29 - Trial = 23613/30000 | Total reward = 49.62
2022-01-26 14:18:21.014 | DEBUG    | __main__:trials:24 - Trial = 23614/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.015 | DEBUG    | __main__:trials:29 - Trial = 23614/30000 | Total reward = 35.91
2022-01-26 14:18:21.019 | DEBUG    | __main__:trials:24 - Trial = 23615/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.021 | DEBUG    | __main__:trials:29 - Trial = 23615/30000 | Total reward = 26.52
2022-01-26 14:18:21.024 | DEBUG    | __main__:trials:24 - Trial = 23616/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.026 | DEBUG    | __main__:trials:29 - Trial = 23616/30000 | Total reward = 36.56
2022-01-26 14:18:21.029 | DEBUG    | __main__:trials:24 - Trial = 23617/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.031 | DEBUG    | __main__:trials:29 - Trial = 23617/30000 | Total reward = 38.57
2022-01-26 14:18:21.034 | DEBUG    | __main__:trials:24 - Trial = 23618/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.036 | DEBUG    | __main__:trials:29 - Trial = 23618/30000 | Total reward = 36.48
2022-01-26 14:18:21.039 | DEBUG    | __main__:trials:26 - Trial = 23619/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.040 | DEBUG    | __main__:trials:29 - Trial = 23619/30000 | Total reward = 27.47
2022-01-26 14:18:21.044 | DEBUG    | __main__:trials:26 - Trial = 23620/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.045 | DEBUG    | __main__:trials:29 - Trial = 23620/30000 | Total reward = 33.87
2022-01-26 14:18:21.048 | DEBUG    | __main__:trials:26 - Trial = 23621/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.050 | DEBUG    | __main__:trials:29 - Trial = 23621/30000 | Total reward = 18.04
2022-01-26 14:18:21.054 | DEBUG    | __main__:trials:24 - Trial = 23622/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.055 | DEBUG    | __main__:trials:29 - Trial = 23622/30000 | Total reward = 43.57
2022-01-26 14:18:21.058 | DEBUG    | __main__:trials:24 - Trial = 23623/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.060 | DEBUG    | __main__:trials:29 - Trial = 23623/30000 | Total reward = 36.50
2022-01-26 14:18:21.063 | DEBUG    | __main__:trials:24 - Trial = 23624/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.064 | DEBUG    | __main__:trials:29 - Trial = 23624/30000 | Total reward = 35.21
2022-01-26 14:18:21.068 | DEBUG    | __main__:trials:24 - Trial = 23625/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.070 | DEBUG    | __main__:trials:29 - Trial = 23625/30000 | Total reward = 38.76
2022-01-26 14:18:21.073 | DEBUG    | __main__:trials:24 - Trial = 23626/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.074 | DEBUG    | __main__:trials:29 - Trial = 23626/30000 | Total reward = 38.84
2022-01-26 14:18:21.078 | DEBUG    | __main__:trials:24 - Trial = 23627/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.080 | DEBUG    | __main__:trials:29 - Trial = 23627/30000 | Total reward = 47.66
2022-01-26 14:18:21.083 | DEBUG    | __main__:trials:24 - Trial = 23628/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.085 | DEBUG    | __main__:trials:29 - Trial = 23628/30000 | Total reward = 37.61
2022-01-26 14:18:21.088 | DEBUG    | __main__:trials:24 - Trial = 23629/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.090 | DEBUG    | __main__:trials:29 - Trial = 23629/30000 | Total reward = 33.50
2022-01-26 14:18:21.093 | DEBUG    | __main__:trials:26 - Trial = 23630/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.094 | DEBUG    | __main__:trials:29 - Trial = 23630/30000 | Total reward = 26.14
2022-01-26 14:18:21.097 | DEBUG    | __main__:trials:24 - Trial = 23631/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.098 | DEBUG    | __main__:trials:29 - Trial = 23631/30000 | Total reward = 36.36
2022-01-26 14:18:21.102 | DEBUG    | __main__:trials:24 - Trial = 23632/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.104 | DEBUG    | __main__:trials:29 - Trial = 23632/30000 | Total reward = 38.06
2022-01-26 14:18:21.107 | DEBUG    | __main__:trials:24 - Trial = 23633/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.108 | DEBUG    | __main__:trials:29 - Trial = 23633/30000 | Total reward = 44.55
2022-01-26 14:18:21.112 | DEBUG    | __main__:trials:24 - Trial = 23634/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.114 | DEBUG    | __main__:trials:29 - Trial = 23634/30000 | Total reward = 34.78
2022-01-26 14:18:21.118 | DEBUG    | __main__:trials:24 - Trial = 23635/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.119 | DEBUG    | __main__:trials:29 - Trial = 23635/30000 | Total reward = 25.34
2022-01-26 14:18:21.122 | DEBUG    | __main__:trials:24 - Trial = 23636/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.124 | DEBUG    | __main__:trials:29 - Trial = 23636/30000 | Total reward = 39.56
2022-01-26 14:18:21.127 | DEBUG    | __main__:trials:24 - Trial = 23637/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.129 | DEBUG    | __main__:trials:29 - Trial = 23637/30000 | Total reward = 35.40
2022-01-26 14:18:21.132 | DEBUG    | __main__:trials:24 - Trial = 23638/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.133 | DEBUG    | __main__:trials:29 - Trial = 23638/30000 | Total reward = 33.72
2022-01-26 14:18:21.137 | DEBUG    | __main__:trials:24 - Trial = 23639/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.138 | DEBUG    | __main__:trials:29 - Trial = 23639/30000 | Total reward = 43.32
2022-01-26 14:18:21.142 | DEBUG    | __main__:trials:24 - Trial = 23640/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.143 | DEBUG    | __main__:trials:29 - Trial = 23640/30000 | Total reward = 35.30
2022-01-26 14:18:21.148 | DEBUG    | __main__:trials:24 - Trial = 23641/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.148 | DEBUG    | __main__:trials:29 - Trial = 23641/30000 | Total reward = 40.56
2022-01-26 14:18:21.152 | DEBUG    | __main__:trials:24 - Trial = 23642/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.154 | DEBUG    | __main__:trials:29 - Trial = 23642/30000 | Total reward = 45.17
2022-01-26 14:18:21.157 | DEBUG    | __main__:trials:24 - Trial = 23643/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.159 | DEBUG    | __main__:trials:29 - Trial = 23643/30000 | Total reward = 37.48
2022-01-26 14:18:21.163 | DEBUG    | __main__:trials:24 - Trial = 23644/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.164 | DEBUG    | __main__:trials:29 - Trial = 23644/30000 | Total reward = 49.01
2022-01-26 14:18:21.168 | DEBUG    | __main__:trials:24 - Trial = 23645/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.168 | DEBUG    | __main__:trials:29 - Trial = 23645/30000 | Total reward = 39.30
2022-01-26 14:18:21.172 | DEBUG    | __main__:trials:24 - Trial = 23646/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.174 | DEBUG    | __main__:trials:29 - Trial = 23646/30000 | Total reward = 41.61
2022-01-26 14:18:21.177 | DEBUG    | __main__:trials:24 - Trial = 23647/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.179 | DEBUG    | __main__:trials:29 - Trial = 23647/30000 | Total reward = 38.45
2022-01-26 14:18:21.182 | DEBUG    | __main__:trials:24 - Trial = 23648/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.184 | DEBUG    | __main__:trials:29 - Trial = 23648/30000 | Total reward = 35.59
2022-01-26 14:18:21.188 | DEBUG    | __main__:trials:24 - Trial = 23649/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.188 | DEBUG    | __main__:trials:29 - Trial = 23649/30000 | Total reward = 34.89
2022-01-26 14:18:21.192 | DEBUG    | __main__:trials:26 - Trial = 23650/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.194 | DEBUG    | __main__:trials:29 - Trial = 23650/30000 | Total reward = 28.68
2022-01-26 14:18:21.197 | DEBUG    | __main__:trials:24 - Trial = 23651/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.199 | DEBUG    | __main__:trials:29 - Trial = 23651/30000 | Total reward = 37.91
2022-01-26 14:18:21.203 | DEBUG    | __main__:trials:24 - Trial = 23652/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.204 | DEBUG    | __main__:trials:29 - Trial = 23652/30000 | Total reward = 26.61
2022-01-26 14:18:21.208 | DEBUG    | __main__:trials:24 - Trial = 23653/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.209 | DEBUG    | __main__:trials:29 - Trial = 23653/30000 | Total reward = 40.22
2022-01-26 14:18:21.213 | DEBUG    | __main__:trials:26 - Trial = 23654/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.214 | DEBUG    | __main__:trials:29 - Trial = 23654/30000 | Total reward = 26.73
2022-01-26 14:18:21.218 | DEBUG    | __main__:trials:24 - Trial = 23655/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.219 | DEBUG    | __main__:trials:29 - Trial = 23655/30000 | Total reward = 36.61
2022-01-26 14:18:21.223 | DEBUG    | __main__:trials:24 - Trial = 23656/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.223 | DEBUG    | __main__:trials:29 - Trial = 23656/30000 | Total reward = 39.56
2022-01-26 14:18:21.228 | DEBUG    | __main__:trials:24 - Trial = 23657/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.228 | DEBUG    | __main__:trials:29 - Trial = 23657/30000 | Total reward = 39.80
2022-01-26 14:18:21.232 | DEBUG    | __main__:trials:24 - Trial = 23658/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.233 | DEBUG    | __main__:trials:29 - Trial = 23658/30000 | Total reward = 47.25
2022-01-26 14:18:21.238 | DEBUG    | __main__:trials:24 - Trial = 23659/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.239 | DEBUG    | __main__:trials:29 - Trial = 23659/30000 | Total reward = 44.22
2022-01-26 14:18:21.242 | DEBUG    | __main__:trials:24 - Trial = 23660/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.244 | DEBUG    | __main__:trials:29 - Trial = 23660/30000 | Total reward = 44.19
2022-01-26 14:18:21.247 | DEBUG    | __main__:trials:24 - Trial = 23661/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.249 | DEBUG    | __main__:trials:29 - Trial = 23661/30000 | Total reward = 37.98
2022-01-26 14:18:21.252 | DEBUG    | __main__:trials:24 - Trial = 23662/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.253 | DEBUG    | __main__:trials:29 - Trial = 23662/30000 | Total reward = 28.90
2022-01-26 14:18:21.256 | DEBUG    | __main__:trials:24 - Trial = 23663/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.257 | DEBUG    | __main__:trials:29 - Trial = 23663/30000 | Total reward = 40.23
2022-01-26 14:18:21.260 | DEBUG    | __main__:trials:24 - Trial = 23664/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.261 | DEBUG    | __main__:trials:29 - Trial = 23664/30000 | Total reward = 33.42
2022-01-26 14:18:21.264 | DEBUG    | __main__:trials:24 - Trial = 23665/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.265 | DEBUG    | __main__:trials:29 - Trial = 23665/30000 | Total reward = 42.38
2022-01-26 14:18:21.268 | DEBUG    | __main__:trials:24 - Trial = 23666/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.269 | DEBUG    | __main__:trials:29 - Trial = 23666/30000 | Total reward = 38.02
2022-01-26 14:18:21.272 | DEBUG    | __main__:trials:24 - Trial = 23667/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.274 | DEBUG    | __main__:trials:29 - Trial = 23667/30000 | Total reward = 39.75
2022-01-26 14:18:21.278 | DEBUG    | __main__:trials:26 - Trial = 23668/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.278 | DEBUG    | __main__:trials:29 - Trial = 23668/30000 | Total reward = 22.08
2022-01-26 14:18:21.282 | DEBUG    | __main__:trials:24 - Trial = 23669/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.283 | DEBUG    | __main__:trials:29 - Trial = 23669/30000 | Total reward = 40.06
2022-01-26 14:18:21.287 | DEBUG    | __main__:trials:24 - Trial = 23670/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.288 | DEBUG    | __main__:trials:29 - Trial = 23670/30000 | Total reward = 35.16
2022-01-26 14:18:21.293 | DEBUG    | __main__:trials:24 - Trial = 23671/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.294 | DEBUG    | __main__:trials:29 - Trial = 23671/30000 | Total reward = 42.64
2022-01-26 14:18:21.298 | DEBUG    | __main__:trials:24 - Trial = 23672/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.299 | DEBUG    | __main__:trials:29 - Trial = 23672/30000 | Total reward = 29.75
2022-01-26 14:18:21.302 | DEBUG    | __main__:trials:24 - Trial = 23673/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.304 | DEBUG    | __main__:trials:29 - Trial = 23673/30000 | Total reward = 46.58
2022-01-26 14:18:21.307 | DEBUG    | __main__:trials:24 - Trial = 23674/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.308 | DEBUG    | __main__:trials:29 - Trial = 23674/30000 | Total reward = 36.85
2022-01-26 14:18:21.312 | DEBUG    | __main__:trials:24 - Trial = 23675/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.314 | DEBUG    | __main__:trials:29 - Trial = 23675/30000 | Total reward = 41.15
2022-01-26 14:18:21.318 | DEBUG    | __main__:trials:24 - Trial = 23676/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.319 | DEBUG    | __main__:trials:29 - Trial = 23676/30000 | Total reward = 45.43
2022-01-26 14:18:21.323 | DEBUG    | __main__:trials:24 - Trial = 23677/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.324 | DEBUG    | __main__:trials:29 - Trial = 23677/30000 | Total reward = 40.00
2022-01-26 14:18:21.328 | DEBUG    | __main__:trials:24 - Trial = 23678/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.328 | DEBUG    | __main__:trials:29 - Trial = 23678/30000 | Total reward = 34.75
2022-01-26 14:18:21.333 | DEBUG    | __main__:trials:24 - Trial = 23679/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.333 | DEBUG    | __main__:trials:29 - Trial = 23679/30000 | Total reward = 43.67
2022-01-26 14:18:21.338 | DEBUG    | __main__:trials:24 - Trial = 23680/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.338 | DEBUG    | __main__:trials:29 - Trial = 23680/30000 | Total reward = 38.08
2022-01-26 14:18:21.343 | DEBUG    | __main__:trials:24 - Trial = 23681/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.345 | DEBUG    | __main__:trials:29 - Trial = 23681/30000 | Total reward = 36.59
2022-01-26 14:18:21.348 | DEBUG    | __main__:trials:24 - Trial = 23682/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.350 | DEBUG    | __main__:trials:29 - Trial = 23682/30000 | Total reward = 44.88
2022-01-26 14:18:21.353 | DEBUG    | __main__:trials:24 - Trial = 23683/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.354 | DEBUG    | __main__:trials:29 - Trial = 23683/30000 | Total reward = 34.58
2022-01-26 14:18:21.357 | DEBUG    | __main__:trials:26 - Trial = 23684/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.359 | DEBUG    | __main__:trials:29 - Trial = 23684/30000 | Total reward = 22.80
2022-01-26 14:18:21.362 | DEBUG    | __main__:trials:24 - Trial = 23685/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.363 | DEBUG    | __main__:trials:29 - Trial = 23685/30000 | Total reward = 36.91
2022-01-26 14:18:21.367 | DEBUG    | __main__:trials:24 - Trial = 23686/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.368 | DEBUG    | __main__:trials:29 - Trial = 23686/30000 | Total reward = 46.91
2022-01-26 14:18:21.372 | DEBUG    | __main__:trials:24 - Trial = 23687/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.374 | DEBUG    | __main__:trials:29 - Trial = 23687/30000 | Total reward = 34.42
2022-01-26 14:18:21.377 | DEBUG    | __main__:trials:24 - Trial = 23688/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.379 | DEBUG    | __main__:trials:29 - Trial = 23688/30000 | Total reward = 35.59
2022-01-26 14:18:21.382 | DEBUG    | __main__:trials:24 - Trial = 23689/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.383 | DEBUG    | __main__:trials:29 - Trial = 23689/30000 | Total reward = 40.00
2022-01-26 14:18:21.388 | DEBUG    | __main__:trials:24 - Trial = 23690/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.389 | DEBUG    | __main__:trials:29 - Trial = 23690/30000 | Total reward = 39.38
2022-01-26 14:18:21.392 | DEBUG    | __main__:trials:24 - Trial = 23691/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.394 | DEBUG    | __main__:trials:29 - Trial = 23691/30000 | Total reward = 38.63
2022-01-26 14:18:21.397 | DEBUG    | __main__:trials:26 - Trial = 23692/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.398 | DEBUG    | __main__:trials:29 - Trial = 23692/30000 | Total reward = 22.67
2022-01-26 14:18:21.402 | DEBUG    | __main__:trials:24 - Trial = 23693/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.403 | DEBUG    | __main__:trials:29 - Trial = 23693/30000 | Total reward = 37.29
2022-01-26 14:18:21.407 | DEBUG    | __main__:trials:24 - Trial = 23694/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.408 | DEBUG    | __main__:trials:29 - Trial = 23694/30000 | Total reward = 44.07
2022-01-26 14:18:21.412 | DEBUG    | __main__:trials:24 - Trial = 23695/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.413 | DEBUG    | __main__:trials:29 - Trial = 23695/30000 | Total reward = 51.33
2022-01-26 14:18:21.416 | DEBUG    | __main__:trials:26 - Trial = 23696/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.418 | DEBUG    | __main__:trials:29 - Trial = 23696/30000 | Total reward = 24.85
2022-01-26 14:18:21.421 | DEBUG    | __main__:trials:24 - Trial = 23697/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.422 | DEBUG    | __main__:trials:29 - Trial = 23697/30000 | Total reward = 47.02
2022-01-26 14:18:21.426 | DEBUG    | __main__:trials:24 - Trial = 23698/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.427 | DEBUG    | __main__:trials:29 - Trial = 23698/30000 | Total reward = 39.90
2022-01-26 14:18:21.431 | DEBUG    | __main__:trials:24 - Trial = 23699/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.432 | DEBUG    | __main__:trials:29 - Trial = 23699/30000 | Total reward = 45.15
2022-01-26 14:18:21.436 | DEBUG    | __main__:trials:24 - Trial = 23700/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.437 | DEBUG    | __main__:trials:29 - Trial = 23700/30000 | Total reward = 40.23
2022-01-26 14:18:21.440 | DEBUG    | __main__:trials:24 - Trial = 23701/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.442 | DEBUG    | __main__:trials:29 - Trial = 23701/30000 | Total reward = 39.87
2022-01-26 14:18:21.445 | DEBUG    | __main__:trials:26 - Trial = 23702/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.447 | DEBUG    | __main__:trials:29 - Trial = 23702/30000 | Total reward = 27.41
2022-01-26 14:18:21.450 | DEBUG    | __main__:trials:24 - Trial = 23703/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.452 | DEBUG    | __main__:trials:29 - Trial = 23703/30000 | Total reward = 37.29
2022-01-26 14:18:21.456 | DEBUG    | __main__:trials:24 - Trial = 23704/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.456 | DEBUG    | __main__:trials:29 - Trial = 23704/30000 | Total reward = 51.58
2022-01-26 14:18:21.461 | DEBUG    | __main__:trials:24 - Trial = 23705/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.462 | DEBUG    | __main__:trials:29 - Trial = 23705/30000 | Total reward = 60.86
2022-01-26 14:18:21.466 | DEBUG    | __main__:trials:24 - Trial = 23706/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.467 | DEBUG    | __main__:trials:29 - Trial = 23706/30000 | Total reward = 36.36
2022-01-26 14:18:21.470 | DEBUG    | __main__:trials:24 - Trial = 23707/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.472 | DEBUG    | __main__:trials:29 - Trial = 23707/30000 | Total reward = 40.13
2022-01-26 14:18:21.475 | DEBUG    | __main__:trials:24 - Trial = 23708/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.477 | DEBUG    | __main__:trials:29 - Trial = 23708/30000 | Total reward = 54.54
2022-01-26 14:18:21.479 | DEBUG    | __main__:trials:24 - Trial = 23709/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.481 | DEBUG    | __main__:trials:29 - Trial = 23709/30000 | Total reward = 41.55
2022-01-26 14:18:21.485 | DEBUG    | __main__:trials:24 - Trial = 23710/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.486 | DEBUG    | __main__:trials:29 - Trial = 23710/30000 | Total reward = 48.52
2022-01-26 14:18:21.490 | DEBUG    | __main__:trials:24 - Trial = 23711/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.492 | DEBUG    | __main__:trials:29 - Trial = 23711/30000 | Total reward = 42.69
2022-01-26 14:18:21.495 | DEBUG    | __main__:trials:24 - Trial = 23712/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.496 | DEBUG    | __main__:trials:29 - Trial = 23712/30000 | Total reward = 40.00
2022-01-26 14:18:21.500 | DEBUG    | __main__:trials:24 - Trial = 23713/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.501 | DEBUG    | __main__:trials:29 - Trial = 23713/30000 | Total reward = 35.07
2022-01-26 14:18:21.505 | DEBUG    | __main__:trials:26 - Trial = 23714/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.506 | DEBUG    | __main__:trials:29 - Trial = 23714/30000 | Total reward = 26.14
2022-01-26 14:18:21.511 | DEBUG    | __main__:trials:24 - Trial = 23715/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.511 | DEBUG    | __main__:trials:29 - Trial = 23715/30000 | Total reward = 40.00
2022-01-26 14:18:21.516 | DEBUG    | __main__:trials:24 - Trial = 23716/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.518 | DEBUG    | __main__:trials:29 - Trial = 23716/30000 | Total reward = 36.14
2022-01-26 14:18:21.521 | DEBUG    | __main__:trials:24 - Trial = 23717/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.523 | DEBUG    | __main__:trials:29 - Trial = 23717/30000 | Total reward = 45.32
2022-01-26 14:18:21.526 | DEBUG    | __main__:trials:24 - Trial = 23718/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.527 | DEBUG    | __main__:trials:29 - Trial = 23718/30000 | Total reward = 38.12
2022-01-26 14:18:21.532 | DEBUG    | __main__:trials:24 - Trial = 23719/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.533 | DEBUG    | __main__:trials:29 - Trial = 23719/30000 | Total reward = 37.97
2022-01-26 14:18:21.537 | DEBUG    | __main__:trials:24 - Trial = 23720/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.538 | DEBUG    | __main__:trials:29 - Trial = 23720/30000 | Total reward = 35.05
2022-01-26 14:18:21.541 | DEBUG    | __main__:trials:24 - Trial = 23721/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.543 | DEBUG    | __main__:trials:29 - Trial = 23721/30000 | Total reward = 43.69
2022-01-26 14:18:21.547 | DEBUG    | __main__:trials:24 - Trial = 23722/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.548 | DEBUG    | __main__:trials:29 - Trial = 23722/30000 | Total reward = 47.31
2022-01-26 14:18:21.551 | DEBUG    | __main__:trials:24 - Trial = 23723/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.553 | DEBUG    | __main__:trials:29 - Trial = 23723/30000 | Total reward = 36.50
2022-01-26 14:18:21.557 | DEBUG    | __main__:trials:24 - Trial = 23724/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.557 | DEBUG    | __main__:trials:29 - Trial = 23724/30000 | Total reward = 31.81
2022-01-26 14:18:21.562 | DEBUG    | __main__:trials:24 - Trial = 23725/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.563 | DEBUG    | __main__:trials:29 - Trial = 23725/30000 | Total reward = 44.41
2022-01-26 14:18:21.567 | DEBUG    | __main__:trials:24 - Trial = 23726/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.568 | DEBUG    | __main__:trials:29 - Trial = 23726/30000 | Total reward = 42.11
2022-01-26 14:18:21.572 | DEBUG    | __main__:trials:24 - Trial = 23727/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.573 | DEBUG    | __main__:trials:29 - Trial = 23727/30000 | Total reward = 39.80
2022-01-26 14:18:21.578 | DEBUG    | __main__:trials:24 - Trial = 23728/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.579 | DEBUG    | __main__:trials:29 - Trial = 23728/30000 | Total reward = 33.71
2022-01-26 14:18:21.582 | DEBUG    | __main__:trials:26 - Trial = 23729/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.584 | DEBUG    | __main__:trials:29 - Trial = 23729/30000 | Total reward = 27.12
2022-01-26 14:18:21.588 | DEBUG    | __main__:trials:24 - Trial = 23730/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.590 | DEBUG    | __main__:trials:29 - Trial = 23730/30000 | Total reward = 50.38
2022-01-26 14:18:21.593 | DEBUG    | __main__:trials:24 - Trial = 23731/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.594 | DEBUG    | __main__:trials:29 - Trial = 23731/30000 | Total reward = 37.94
2022-01-26 14:18:21.598 | DEBUG    | __main__:trials:24 - Trial = 23732/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.599 | DEBUG    | __main__:trials:29 - Trial = 23732/30000 | Total reward = 40.22
2022-01-26 14:18:21.602 | DEBUG    | __main__:trials:24 - Trial = 23733/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.604 | DEBUG    | __main__:trials:29 - Trial = 23733/30000 | Total reward = 40.00
2022-01-26 14:18:21.608 | DEBUG    | __main__:trials:24 - Trial = 23734/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.608 | DEBUG    | __main__:trials:29 - Trial = 23734/30000 | Total reward = 32.58
2022-01-26 14:18:21.612 | DEBUG    | __main__:trials:24 - Trial = 23735/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.614 | DEBUG    | __main__:trials:29 - Trial = 23735/30000 | Total reward = 28.22
2022-01-26 14:18:21.617 | DEBUG    | __main__:trials:24 - Trial = 23736/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.618 | DEBUG    | __main__:trials:29 - Trial = 23736/30000 | Total reward = 49.97
2022-01-26 14:18:21.622 | DEBUG    | __main__:trials:24 - Trial = 23737/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.623 | DEBUG    | __main__:trials:29 - Trial = 23737/30000 | Total reward = 45.93
2022-01-26 14:18:21.627 | DEBUG    | __main__:trials:24 - Trial = 23738/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.629 | DEBUG    | __main__:trials:29 - Trial = 23738/30000 | Total reward = 39.91
2022-01-26 14:18:21.633 | DEBUG    | __main__:trials:24 - Trial = 23739/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.634 | DEBUG    | __main__:trials:29 - Trial = 23739/30000 | Total reward = 47.94
2022-01-26 14:18:21.638 | DEBUG    | __main__:trials:24 - Trial = 23740/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.639 | DEBUG    | __main__:trials:29 - Trial = 23740/30000 | Total reward = 60.32
2022-01-26 14:18:21.643 | DEBUG    | __main__:trials:24 - Trial = 23741/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.645 | DEBUG    | __main__:trials:29 - Trial = 23741/30000 | Total reward = 31.39
2022-01-26 14:18:21.648 | DEBUG    | __main__:trials:24 - Trial = 23742/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.649 | DEBUG    | __main__:trials:29 - Trial = 23742/30000 | Total reward = 50.98
2022-01-26 14:18:21.653 | DEBUG    | __main__:trials:24 - Trial = 23743/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.654 | DEBUG    | __main__:trials:29 - Trial = 23743/30000 | Total reward = 43.28
2022-01-26 14:18:21.658 | DEBUG    | __main__:trials:24 - Trial = 23744/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.659 | DEBUG    | __main__:trials:29 - Trial = 23744/30000 | Total reward = 40.89
2022-01-26 14:18:21.663 | DEBUG    | __main__:trials:26 - Trial = 23745/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.664 | DEBUG    | __main__:trials:29 - Trial = 23745/30000 | Total reward = 16.70
2022-01-26 14:18:21.668 | DEBUG    | __main__:trials:24 - Trial = 23746/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.669 | DEBUG    | __main__:trials:29 - Trial = 23746/30000 | Total reward = 51.02
2022-01-26 14:18:21.673 | DEBUG    | __main__:trials:24 - Trial = 23747/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.674 | DEBUG    | __main__:trials:29 - Trial = 23747/30000 | Total reward = 34.31
2022-01-26 14:18:21.678 | DEBUG    | __main__:trials:24 - Trial = 23748/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.680 | DEBUG    | __main__:trials:29 - Trial = 23748/30000 | Total reward = 32.87
2022-01-26 14:18:21.683 | DEBUG    | __main__:trials:24 - Trial = 23749/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.685 | DEBUG    | __main__:trials:29 - Trial = 23749/30000 | Total reward = 47.34
2022-01-26 14:18:21.688 | DEBUG    | __main__:trials:24 - Trial = 23750/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.690 | DEBUG    | __main__:trials:29 - Trial = 23750/30000 | Total reward = 37.73
2022-01-26 14:18:21.693 | DEBUG    | __main__:trials:24 - Trial = 23751/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.695 | DEBUG    | __main__:trials:29 - Trial = 23751/30000 | Total reward = 42.56
2022-01-26 14:18:21.699 | DEBUG    | __main__:trials:24 - Trial = 23752/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.700 | DEBUG    | __main__:trials:29 - Trial = 23752/30000 | Total reward = 32.75
2022-01-26 14:18:21.704 | DEBUG    | __main__:trials:24 - Trial = 23753/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.705 | DEBUG    | __main__:trials:29 - Trial = 23753/30000 | Total reward = 30.45
2022-01-26 14:18:21.709 | DEBUG    | __main__:trials:24 - Trial = 23754/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.710 | DEBUG    | __main__:trials:29 - Trial = 23754/30000 | Total reward = 24.07
2022-01-26 14:18:21.713 | DEBUG    | __main__:trials:24 - Trial = 23755/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.714 | DEBUG    | __main__:trials:29 - Trial = 23755/30000 | Total reward = 35.74
2022-01-26 14:18:21.719 | DEBUG    | __main__:trials:24 - Trial = 23756/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.721 | DEBUG    | __main__:trials:29 - Trial = 23756/30000 | Total reward = 37.76
2022-01-26 14:18:21.724 | DEBUG    | __main__:trials:24 - Trial = 23757/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.726 | DEBUG    | __main__:trials:29 - Trial = 23757/30000 | Total reward = 34.83
2022-01-26 14:18:21.730 | DEBUG    | __main__:trials:24 - Trial = 23758/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.731 | DEBUG    | __main__:trials:29 - Trial = 23758/30000 | Total reward = 41.13
2022-01-26 14:18:21.736 | DEBUG    | __main__:trials:24 - Trial = 23759/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.737 | DEBUG    | __main__:trials:29 - Trial = 23759/30000 | Total reward = 44.77
2022-01-26 14:18:21.741 | DEBUG    | __main__:trials:24 - Trial = 23760/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.742 | DEBUG    | __main__:trials:29 - Trial = 23760/30000 | Total reward = 36.58
2022-01-26 14:18:21.745 | DEBUG    | __main__:trials:24 - Trial = 23761/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.748 | DEBUG    | __main__:trials:29 - Trial = 23761/30000 | Total reward = 40.00
2022-01-26 14:18:21.753 | DEBUG    | __main__:trials:24 - Trial = 23762/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.756 | DEBUG    | __main__:trials:29 - Trial = 23762/30000 | Total reward = 45.64
2022-01-26 14:18:21.759 | DEBUG    | __main__:trials:24 - Trial = 23763/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.762 | DEBUG    | __main__:trials:29 - Trial = 23763/30000 | Total reward = 38.36
2022-01-26 14:18:21.766 | DEBUG    | __main__:trials:24 - Trial = 23764/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.769 | DEBUG    | __main__:trials:29 - Trial = 23764/30000 | Total reward = 40.20
2022-01-26 14:18:21.773 | DEBUG    | __main__:trials:24 - Trial = 23765/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.775 | DEBUG    | __main__:trials:29 - Trial = 23765/30000 | Total reward = 38.07
2022-01-26 14:18:21.778 | DEBUG    | __main__:trials:24 - Trial = 23766/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.781 | DEBUG    | __main__:trials:29 - Trial = 23766/30000 | Total reward = 40.22
2022-01-26 14:18:21.786 | DEBUG    | __main__:trials:24 - Trial = 23767/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.789 | DEBUG    | __main__:trials:29 - Trial = 23767/30000 | Total reward = 36.90
2022-01-26 14:18:21.792 | DEBUG    | __main__:trials:24 - Trial = 23768/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.795 | DEBUG    | __main__:trials:29 - Trial = 23768/30000 | Total reward = 48.54
2022-01-26 14:18:21.799 | DEBUG    | __main__:trials:24 - Trial = 23769/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.800 | DEBUG    | __main__:trials:29 - Trial = 23769/30000 | Total reward = 49.55
2022-01-26 14:18:21.804 | DEBUG    | __main__:trials:24 - Trial = 23770/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.806 | DEBUG    | __main__:trials:29 - Trial = 23770/30000 | Total reward = 33.89
2022-01-26 14:18:21.809 | DEBUG    | __main__:trials:24 - Trial = 23771/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.811 | DEBUG    | __main__:trials:29 - Trial = 23771/30000 | Total reward = 40.54
2022-01-26 14:18:21.814 | DEBUG    | __main__:trials:24 - Trial = 23772/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.816 | DEBUG    | __main__:trials:29 - Trial = 23772/30000 | Total reward = 48.28
2022-01-26 14:18:21.819 | DEBUG    | __main__:trials:24 - Trial = 23773/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.821 | DEBUG    | __main__:trials:29 - Trial = 23773/30000 | Total reward = 32.09
2022-01-26 14:18:21.824 | DEBUG    | __main__:trials:24 - Trial = 23774/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.826 | DEBUG    | __main__:trials:29 - Trial = 23774/30000 | Total reward = 45.95
2022-01-26 14:18:21.830 | DEBUG    | __main__:trials:24 - Trial = 23775/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.832 | DEBUG    | __main__:trials:29 - Trial = 23775/30000 | Total reward = 49.55
2022-01-26 14:18:21.836 | DEBUG    | __main__:trials:24 - Trial = 23776/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.837 | DEBUG    | __main__:trials:29 - Trial = 23776/30000 | Total reward = 40.30
2022-01-26 14:18:21.841 | DEBUG    | __main__:trials:24 - Trial = 23777/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.843 | DEBUG    | __main__:trials:29 - Trial = 23777/30000 | Total reward = 36.66
2022-01-26 14:18:21.846 | DEBUG    | __main__:trials:24 - Trial = 23778/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.848 | DEBUG    | __main__:trials:29 - Trial = 23778/30000 | Total reward = 46.26
2022-01-26 14:18:21.852 | DEBUG    | __main__:trials:24 - Trial = 23779/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.853 | DEBUG    | __main__:trials:29 - Trial = 23779/30000 | Total reward = 38.22
2022-01-26 14:18:21.857 | DEBUG    | __main__:trials:24 - Trial = 23780/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.859 | DEBUG    | __main__:trials:29 - Trial = 23780/30000 | Total reward = 31.21
2022-01-26 14:18:21.862 | DEBUG    | __main__:trials:24 - Trial = 23781/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.864 | DEBUG    | __main__:trials:29 - Trial = 23781/30000 | Total reward = 39.80
2022-01-26 14:18:21.868 | DEBUG    | __main__:trials:24 - Trial = 23782/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.869 | DEBUG    | __main__:trials:29 - Trial = 23782/30000 | Total reward = 31.13
2022-01-26 14:18:21.872 | DEBUG    | __main__:trials:24 - Trial = 23783/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.874 | DEBUG    | __main__:trials:29 - Trial = 23783/30000 | Total reward = 39.95
2022-01-26 14:18:21.877 | DEBUG    | __main__:trials:24 - Trial = 23784/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.879 | DEBUG    | __main__:trials:29 - Trial = 23784/30000 | Total reward = 38.64
2022-01-26 14:18:21.882 | DEBUG    | __main__:trials:24 - Trial = 23785/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.884 | DEBUG    | __main__:trials:29 - Trial = 23785/30000 | Total reward = 33.23
2022-01-26 14:18:21.887 | DEBUG    | __main__:trials:24 - Trial = 23786/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.889 | DEBUG    | __main__:trials:29 - Trial = 23786/30000 | Total reward = 40.84
2022-01-26 14:18:21.892 | DEBUG    | __main__:trials:24 - Trial = 23787/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.894 | DEBUG    | __main__:trials:29 - Trial = 23787/30000 | Total reward = 34.99
2022-01-26 14:18:21.898 | DEBUG    | __main__:trials:24 - Trial = 23788/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.899 | DEBUG    | __main__:trials:29 - Trial = 23788/30000 | Total reward = 34.41
2022-01-26 14:18:21.903 | DEBUG    | __main__:trials:24 - Trial = 23789/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.905 | DEBUG    | __main__:trials:29 - Trial = 23789/30000 | Total reward = 25.56
2022-01-26 14:18:21.908 | DEBUG    | __main__:trials:24 - Trial = 23790/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.910 | DEBUG    | __main__:trials:29 - Trial = 23790/30000 | Total reward = 40.00
2022-01-26 14:18:21.914 | DEBUG    | __main__:trials:24 - Trial = 23791/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.915 | DEBUG    | __main__:trials:29 - Trial = 23791/30000 | Total reward = 40.05
2022-01-26 14:18:21.919 | DEBUG    | __main__:trials:24 - Trial = 23792/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.921 | DEBUG    | __main__:trials:29 - Trial = 23792/30000 | Total reward = 47.32
2022-01-26 14:18:21.924 | DEBUG    | __main__:trials:24 - Trial = 23793/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.925 | DEBUG    | __main__:trials:29 - Trial = 23793/30000 | Total reward = 17.04
2022-01-26 14:18:21.929 | DEBUG    | __main__:trials:26 - Trial = 23794/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.929 | DEBUG    | __main__:trials:29 - Trial = 23794/30000 | Total reward = 17.70
2022-01-26 14:18:21.933 | DEBUG    | __main__:trials:24 - Trial = 23795/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.934 | DEBUG    | __main__:trials:29 - Trial = 23795/30000 | Total reward = 30.25
2022-01-26 14:18:21.938 | DEBUG    | __main__:trials:24 - Trial = 23796/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.938 | DEBUG    | __main__:trials:29 - Trial = 23796/30000 | Total reward = 40.00
2022-01-26 14:18:21.942 | DEBUG    | __main__:trials:24 - Trial = 23797/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.943 | DEBUG    | __main__:trials:29 - Trial = 23797/30000 | Total reward = 34.10
2022-01-26 14:18:21.946 | DEBUG    | __main__:trials:26 - Trial = 23798/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.947 | DEBUG    | __main__:trials:29 - Trial = 23798/30000 | Total reward = 17.90
2022-01-26 14:18:21.951 | DEBUG    | __main__:trials:24 - Trial = 23799/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.951 | DEBUG    | __main__:trials:29 - Trial = 23799/30000 | Total reward = 51.17
2022-01-26 14:18:21.955 | DEBUG    | __main__:trials:24 - Trial = 23800/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.956 | DEBUG    | __main__:trials:29 - Trial = 23800/30000 | Total reward = 43.37
2022-01-26 14:18:21.960 | DEBUG    | __main__:trials:24 - Trial = 23801/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.961 | DEBUG    | __main__:trials:29 - Trial = 23801/30000 | Total reward = 43.64
2022-01-26 14:18:21.965 | DEBUG    | __main__:trials:24 - Trial = 23802/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.966 | DEBUG    | __main__:trials:29 - Trial = 23802/30000 | Total reward = 53.39
2022-01-26 14:18:21.970 | DEBUG    | __main__:trials:26 - Trial = 23803/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:21.971 | DEBUG    | __main__:trials:29 - Trial = 23803/30000 | Total reward = 29.40
2022-01-26 14:18:21.975 | DEBUG    | __main__:trials:24 - Trial = 23804/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.976 | DEBUG    | __main__:trials:29 - Trial = 23804/30000 | Total reward = 46.01
2022-01-26 14:18:21.980 | DEBUG    | __main__:trials:24 - Trial = 23805/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.981 | DEBUG    | __main__:trials:29 - Trial = 23805/30000 | Total reward = 37.15
2022-01-26 14:18:21.985 | DEBUG    | __main__:trials:24 - Trial = 23806/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.986 | DEBUG    | __main__:trials:29 - Trial = 23806/30000 | Total reward = 33.88
2022-01-26 14:18:21.990 | DEBUG    | __main__:trials:24 - Trial = 23807/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.992 | DEBUG    | __main__:trials:29 - Trial = 23807/30000 | Total reward = 26.79
2022-01-26 14:18:21.995 | DEBUG    | __main__:trials:24 - Trial = 23808/30000 | Max number of steps (20) reached
2022-01-26 14:18:21.997 | DEBUG    | __main__:trials:29 - Trial = 23808/30000 | Total reward = 36.72
2022-01-26 14:18:22.000 | DEBUG    | __main__:trials:24 - Trial = 23809/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.002 | DEBUG    | __main__:trials:29 - Trial = 23809/30000 | Total reward = 36.23
2022-01-26 14:18:22.006 | DEBUG    | __main__:trials:24 - Trial = 23810/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.007 | DEBUG    | __main__:trials:29 - Trial = 23810/30000 | Total reward = 32.52
2022-01-26 14:18:22.011 | DEBUG    | __main__:trials:24 - Trial = 23811/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.012 | DEBUG    | __main__:trials:29 - Trial = 23811/30000 | Total reward = 36.72
2022-01-26 14:18:22.016 | DEBUG    | __main__:trials:26 - Trial = 23812/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.018 | DEBUG    | __main__:trials:29 - Trial = 23812/30000 | Total reward = 28.69
2022-01-26 14:18:22.021 | DEBUG    | __main__:trials:26 - Trial = 23813/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.023 | DEBUG    | __main__:trials:29 - Trial = 23813/30000 | Total reward = 24.66
2022-01-26 14:18:22.028 | DEBUG    | __main__:trials:24 - Trial = 23814/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.029 | DEBUG    | __main__:trials:29 - Trial = 23814/30000 | Total reward = 39.48
2022-01-26 14:18:22.033 | DEBUG    | __main__:trials:24 - Trial = 23815/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.034 | DEBUG    | __main__:trials:29 - Trial = 23815/30000 | Total reward = 31.58
2022-01-26 14:18:22.037 | DEBUG    | __main__:trials:24 - Trial = 23816/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.039 | DEBUG    | __main__:trials:29 - Trial = 23816/30000 | Total reward = 42.85
2022-01-26 14:18:22.042 | DEBUG    | __main__:trials:24 - Trial = 23817/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.044 | DEBUG    | __main__:trials:29 - Trial = 23817/30000 | Total reward = 40.00
2022-01-26 14:18:22.047 | DEBUG    | __main__:trials:24 - Trial = 23818/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.049 | DEBUG    | __main__:trials:29 - Trial = 23818/30000 | Total reward = 37.43
2022-01-26 14:18:22.053 | DEBUG    | __main__:trials:24 - Trial = 23819/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.054 | DEBUG    | __main__:trials:29 - Trial = 23819/30000 | Total reward = 28.14
2022-01-26 14:18:22.057 | DEBUG    | __main__:trials:24 - Trial = 23820/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.058 | DEBUG    | __main__:trials:29 - Trial = 23820/30000 | Total reward = 40.00
2022-01-26 14:18:22.061 | DEBUG    | __main__:trials:24 - Trial = 23821/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.063 | DEBUG    | __main__:trials:29 - Trial = 23821/30000 | Total reward = 6.22
2022-01-26 14:18:22.066 | DEBUG    | __main__:trials:24 - Trial = 23822/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.067 | DEBUG    | __main__:trials:29 - Trial = 23822/30000 | Total reward = 29.80
2022-01-26 14:18:22.072 | DEBUG    | __main__:trials:24 - Trial = 23823/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.073 | DEBUG    | __main__:trials:29 - Trial = 23823/30000 | Total reward = 59.75
2022-01-26 14:18:22.077 | DEBUG    | __main__:trials:24 - Trial = 23824/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.078 | DEBUG    | __main__:trials:29 - Trial = 23824/30000 | Total reward = 40.00
2022-01-26 14:18:22.082 | DEBUG    | __main__:trials:24 - Trial = 23825/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.084 | DEBUG    | __main__:trials:29 - Trial = 23825/30000 | Total reward = 38.67
2022-01-26 14:18:22.088 | DEBUG    | __main__:trials:24 - Trial = 23826/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.089 | DEBUG    | __main__:trials:29 - Trial = 23826/30000 | Total reward = 34.04
2022-01-26 14:18:22.093 | DEBUG    | __main__:trials:24 - Trial = 23827/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.094 | DEBUG    | __main__:trials:29 - Trial = 23827/30000 | Total reward = 27.48
2022-01-26 14:18:22.098 | DEBUG    | __main__:trials:24 - Trial = 23828/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.100 | DEBUG    | __main__:trials:29 - Trial = 23828/30000 | Total reward = 53.50
2022-01-26 14:18:22.103 | DEBUG    | __main__:trials:24 - Trial = 23829/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.105 | DEBUG    | __main__:trials:29 - Trial = 23829/30000 | Total reward = 31.63
2022-01-26 14:18:22.109 | DEBUG    | __main__:trials:24 - Trial = 23830/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.109 | DEBUG    | __main__:trials:29 - Trial = 23830/30000 | Total reward = 39.59
2022-01-26 14:18:22.112 | DEBUG    | __main__:trials:24 - Trial = 23831/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.114 | DEBUG    | __main__:trials:29 - Trial = 23831/30000 | Total reward = 33.50
2022-01-26 14:18:22.118 | DEBUG    | __main__:trials:24 - Trial = 23832/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.119 | DEBUG    | __main__:trials:29 - Trial = 23832/30000 | Total reward = 39.84
2022-01-26 14:18:22.123 | DEBUG    | __main__:trials:24 - Trial = 23833/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.125 | DEBUG    | __main__:trials:29 - Trial = 23833/30000 | Total reward = 49.93
2022-01-26 14:18:22.128 | DEBUG    | __main__:trials:24 - Trial = 23834/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.130 | DEBUG    | __main__:trials:29 - Trial = 23834/30000 | Total reward = 43.97
2022-01-26 14:18:22.133 | DEBUG    | __main__:trials:24 - Trial = 23835/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.135 | DEBUG    | __main__:trials:29 - Trial = 23835/30000 | Total reward = 40.18
2022-01-26 14:18:22.139 | DEBUG    | __main__:trials:24 - Trial = 23836/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.140 | DEBUG    | __main__:trials:29 - Trial = 23836/30000 | Total reward = 39.08
2022-01-26 14:18:22.144 | DEBUG    | __main__:trials:24 - Trial = 23837/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.146 | DEBUG    | __main__:trials:29 - Trial = 23837/30000 | Total reward = 38.17
2022-01-26 14:18:22.149 | DEBUG    | __main__:trials:26 - Trial = 23838/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.151 | DEBUG    | __main__:trials:29 - Trial = 23838/30000 | Total reward = 19.23
2022-01-26 14:18:22.154 | DEBUG    | __main__:trials:24 - Trial = 23839/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.156 | DEBUG    | __main__:trials:29 - Trial = 23839/30000 | Total reward = 36.07
2022-01-26 14:18:22.159 | DEBUG    | __main__:trials:24 - Trial = 23840/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.161 | DEBUG    | __main__:trials:29 - Trial = 23840/30000 | Total reward = 50.84
2022-01-26 14:18:22.164 | DEBUG    | __main__:trials:24 - Trial = 23841/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.166 | DEBUG    | __main__:trials:29 - Trial = 23841/30000 | Total reward = 45.87
2022-01-26 14:18:22.170 | DEBUG    | __main__:trials:24 - Trial = 23842/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.171 | DEBUG    | __main__:trials:29 - Trial = 23842/30000 | Total reward = 42.77
2022-01-26 14:18:22.175 | DEBUG    | __main__:trials:24 - Trial = 23843/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.177 | DEBUG    | __main__:trials:29 - Trial = 23843/30000 | Total reward = 40.33
2022-01-26 14:18:22.180 | DEBUG    | __main__:trials:24 - Trial = 23844/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.182 | DEBUG    | __main__:trials:29 - Trial = 23844/30000 | Total reward = 39.74
2022-01-26 14:18:22.185 | DEBUG    | __main__:trials:24 - Trial = 23845/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.186 | DEBUG    | __main__:trials:29 - Trial = 23845/30000 | Total reward = 31.30
2022-01-26 14:18:22.190 | DEBUG    | __main__:trials:24 - Trial = 23846/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.191 | DEBUG    | __main__:trials:29 - Trial = 23846/30000 | Total reward = 28.61
2022-01-26 14:18:22.195 | DEBUG    | __main__:trials:24 - Trial = 23847/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.196 | DEBUG    | __main__:trials:29 - Trial = 23847/30000 | Total reward = 40.81
2022-01-26 14:18:22.200 | DEBUG    | __main__:trials:24 - Trial = 23848/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.202 | DEBUG    | __main__:trials:29 - Trial = 23848/30000 | Total reward = 37.15
2022-01-26 14:18:22.205 | DEBUG    | __main__:trials:24 - Trial = 23849/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.207 | DEBUG    | __main__:trials:29 - Trial = 23849/30000 | Total reward = 48.03
2022-01-26 14:18:22.211 | DEBUG    | __main__:trials:24 - Trial = 23850/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.212 | DEBUG    | __main__:trials:29 - Trial = 23850/30000 | Total reward = 34.87
2022-01-26 14:18:22.216 | DEBUG    | __main__:trials:24 - Trial = 23851/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.218 | DEBUG    | __main__:trials:29 - Trial = 23851/30000 | Total reward = 34.33
2022-01-26 14:18:22.221 | DEBUG    | __main__:trials:24 - Trial = 23852/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.223 | DEBUG    | __main__:trials:29 - Trial = 23852/30000 | Total reward = 41.68
2022-01-26 14:18:22.227 | DEBUG    | __main__:trials:24 - Trial = 23853/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.228 | DEBUG    | __main__:trials:29 - Trial = 23853/30000 | Total reward = 49.13
2022-01-26 14:18:22.231 | DEBUG    | __main__:trials:24 - Trial = 23854/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.233 | DEBUG    | __main__:trials:29 - Trial = 23854/30000 | Total reward = 38.14
2022-01-26 14:18:22.237 | DEBUG    | __main__:trials:24 - Trial = 23855/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.238 | DEBUG    | __main__:trials:29 - Trial = 23855/30000 | Total reward = 50.21
2022-01-26 14:18:22.242 | DEBUG    | __main__:trials:24 - Trial = 23856/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.243 | DEBUG    | __main__:trials:29 - Trial = 23856/30000 | Total reward = 32.04
2022-01-26 14:18:22.247 | DEBUG    | __main__:trials:24 - Trial = 23857/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.248 | DEBUG    | __main__:trials:29 - Trial = 23857/30000 | Total reward = 45.38
2022-01-26 14:18:22.252 | DEBUG    | __main__:trials:24 - Trial = 23858/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.254 | DEBUG    | __main__:trials:29 - Trial = 23858/30000 | Total reward = 39.25
2022-01-26 14:18:22.258 | DEBUG    | __main__:trials:24 - Trial = 23859/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.259 | DEBUG    | __main__:trials:29 - Trial = 23859/30000 | Total reward = 32.21
2022-01-26 14:18:22.263 | DEBUG    | __main__:trials:24 - Trial = 23860/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.265 | DEBUG    | __main__:trials:29 - Trial = 23860/30000 | Total reward = 39.80
2022-01-26 14:18:22.268 | DEBUG    | __main__:trials:24 - Trial = 23861/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.270 | DEBUG    | __main__:trials:29 - Trial = 23861/30000 | Total reward = 26.30
2022-01-26 14:18:22.274 | DEBUG    | __main__:trials:24 - Trial = 23862/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.275 | DEBUG    | __main__:trials:29 - Trial = 23862/30000 | Total reward = 37.61
2022-01-26 14:18:22.278 | DEBUG    | __main__:trials:26 - Trial = 23863/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.280 | DEBUG    | __main__:trials:29 - Trial = 23863/30000 | Total reward = 20.79
2022-01-26 14:18:22.284 | DEBUG    | __main__:trials:24 - Trial = 23864/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.285 | DEBUG    | __main__:trials:29 - Trial = 23864/30000 | Total reward = 34.89
2022-01-26 14:18:22.289 | DEBUG    | __main__:trials:24 - Trial = 23865/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.291 | DEBUG    | __main__:trials:29 - Trial = 23865/30000 | Total reward = 36.00
2022-01-26 14:18:22.295 | DEBUG    | __main__:trials:24 - Trial = 23866/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.296 | DEBUG    | __main__:trials:29 - Trial = 23866/30000 | Total reward = 36.02
2022-01-26 14:18:22.300 | DEBUG    | __main__:trials:24 - Trial = 23867/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.301 | DEBUG    | __main__:trials:29 - Trial = 23867/30000 | Total reward = 37.73
2022-01-26 14:18:22.305 | DEBUG    | __main__:trials:24 - Trial = 23868/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.306 | DEBUG    | __main__:trials:29 - Trial = 23868/30000 | Total reward = 36.69
2022-01-26 14:18:22.309 | DEBUG    | __main__:trials:24 - Trial = 23869/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.310 | DEBUG    | __main__:trials:29 - Trial = 23869/30000 | Total reward = 37.58
2022-01-26 14:18:22.313 | DEBUG    | __main__:trials:24 - Trial = 23870/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.314 | DEBUG    | __main__:trials:29 - Trial = 23870/30000 | Total reward = 30.92
2022-01-26 14:18:22.317 | DEBUG    | __main__:trials:24 - Trial = 23871/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.319 | DEBUG    | __main__:trials:29 - Trial = 23871/30000 | Total reward = 40.79
2022-01-26 14:18:22.323 | DEBUG    | __main__:trials:24 - Trial = 23872/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.324 | DEBUG    | __main__:trials:29 - Trial = 23872/30000 | Total reward = 34.70
2022-01-26 14:18:22.327 | DEBUG    | __main__:trials:26 - Trial = 23873/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.329 | DEBUG    | __main__:trials:29 - Trial = 23873/30000 | Total reward = 13.53
2022-01-26 14:18:22.332 | DEBUG    | __main__:trials:24 - Trial = 23874/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.334 | DEBUG    | __main__:trials:29 - Trial = 23874/30000 | Total reward = 39.95
2022-01-26 14:18:22.338 | DEBUG    | __main__:trials:24 - Trial = 23875/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.339 | DEBUG    | __main__:trials:29 - Trial = 23875/30000 | Total reward = 45.59
2022-01-26 14:18:22.343 | DEBUG    | __main__:trials:24 - Trial = 23876/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.345 | DEBUG    | __main__:trials:29 - Trial = 23876/30000 | Total reward = 40.72
2022-01-26 14:18:22.348 | DEBUG    | __main__:trials:24 - Trial = 23877/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.350 | DEBUG    | __main__:trials:29 - Trial = 23877/30000 | Total reward = 37.11
2022-01-26 14:18:22.354 | DEBUG    | __main__:trials:24 - Trial = 23878/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.355 | DEBUG    | __main__:trials:29 - Trial = 23878/30000 | Total reward = 36.34
2022-01-26 14:18:22.359 | DEBUG    | __main__:trials:24 - Trial = 23879/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.361 | DEBUG    | __main__:trials:29 - Trial = 23879/30000 | Total reward = 39.19
2022-01-26 14:18:22.363 | DEBUG    | __main__:trials:24 - Trial = 23880/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.365 | DEBUG    | __main__:trials:29 - Trial = 23880/30000 | Total reward = 50.48
2022-01-26 14:18:22.369 | DEBUG    | __main__:trials:24 - Trial = 23881/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.371 | DEBUG    | __main__:trials:29 - Trial = 23881/30000 | Total reward = 39.70
2022-01-26 14:18:22.375 | DEBUG    | __main__:trials:24 - Trial = 23882/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.375 | DEBUG    | __main__:trials:29 - Trial = 23882/30000 | Total reward = 34.96
2022-01-26 14:18:22.380 | DEBUG    | __main__:trials:24 - Trial = 23883/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.381 | DEBUG    | __main__:trials:29 - Trial = 23883/30000 | Total reward = 39.62
2022-01-26 14:18:22.385 | DEBUG    | __main__:trials:24 - Trial = 23884/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.386 | DEBUG    | __main__:trials:29 - Trial = 23884/30000 | Total reward = 40.03
2022-01-26 14:18:22.390 | DEBUG    | __main__:trials:24 - Trial = 23885/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.392 | DEBUG    | __main__:trials:29 - Trial = 23885/30000 | Total reward = 45.36
2022-01-26 14:18:22.394 | DEBUG    | __main__:trials:26 - Trial = 23886/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.395 | DEBUG    | __main__:trials:29 - Trial = 23886/30000 | Total reward = 14.91
2022-01-26 14:18:22.399 | DEBUG    | __main__:trials:24 - Trial = 23887/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.400 | DEBUG    | __main__:trials:29 - Trial = 23887/30000 | Total reward = 50.08
2022-01-26 14:18:22.404 | DEBUG    | __main__:trials:24 - Trial = 23888/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.405 | DEBUG    | __main__:trials:29 - Trial = 23888/30000 | Total reward = 33.15
2022-01-26 14:18:22.408 | DEBUG    | __main__:trials:26 - Trial = 23889/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.409 | DEBUG    | __main__:trials:29 - Trial = 23889/30000 | Total reward = 16.87
2022-01-26 14:18:22.413 | DEBUG    | __main__:trials:24 - Trial = 23890/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.414 | DEBUG    | __main__:trials:29 - Trial = 23890/30000 | Total reward = 33.03
2022-01-26 14:18:22.417 | DEBUG    | __main__:trials:24 - Trial = 23891/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.418 | DEBUG    | __main__:trials:29 - Trial = 23891/30000 | Total reward = 47.37
2022-01-26 14:18:22.422 | DEBUG    | __main__:trials:24 - Trial = 23892/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.423 | DEBUG    | __main__:trials:29 - Trial = 23892/30000 | Total reward = 32.73
2022-01-26 14:18:22.427 | DEBUG    | __main__:trials:24 - Trial = 23893/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.429 | DEBUG    | __main__:trials:29 - Trial = 23893/30000 | Total reward = 37.73
2022-01-26 14:18:22.432 | DEBUG    | __main__:trials:24 - Trial = 23894/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.434 | DEBUG    | __main__:trials:29 - Trial = 23894/30000 | Total reward = 41.85
2022-01-26 14:18:22.438 | DEBUG    | __main__:trials:24 - Trial = 23895/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.438 | DEBUG    | __main__:trials:29 - Trial = 23895/30000 | Total reward = 29.72
2022-01-26 14:18:22.442 | DEBUG    | __main__:trials:24 - Trial = 23896/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.444 | DEBUG    | __main__:trials:29 - Trial = 23896/30000 | Total reward = 38.26
2022-01-26 14:18:22.447 | DEBUG    | __main__:trials:24 - Trial = 23897/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.449 | DEBUG    | __main__:trials:29 - Trial = 23897/30000 | Total reward = 36.21
2022-01-26 14:18:22.452 | DEBUG    | __main__:trials:26 - Trial = 23898/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.452 | DEBUG    | __main__:trials:29 - Trial = 23898/30000 | Total reward = 14.97
2022-01-26 14:18:22.456 | DEBUG    | __main__:trials:24 - Trial = 23899/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.458 | DEBUG    | __main__:trials:29 - Trial = 23899/30000 | Total reward = 36.46
2022-01-26 14:18:22.461 | DEBUG    | __main__:trials:24 - Trial = 23900/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.462 | DEBUG    | __main__:trials:29 - Trial = 23900/30000 | Total reward = 32.52
2022-01-26 14:18:22.466 | DEBUG    | __main__:trials:24 - Trial = 23901/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.468 | DEBUG    | __main__:trials:29 - Trial = 23901/30000 | Total reward = 40.47
2022-01-26 14:18:22.471 | DEBUG    | __main__:trials:24 - Trial = 23902/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.472 | DEBUG    | __main__:trials:29 - Trial = 23902/30000 | Total reward = 38.97
2022-01-26 14:18:22.476 | DEBUG    | __main__:trials:26 - Trial = 23903/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.478 | DEBUG    | __main__:trials:29 - Trial = 23903/30000 | Total reward = 30.17
2022-01-26 14:18:22.481 | DEBUG    | __main__:trials:24 - Trial = 23904/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.482 | DEBUG    | __main__:trials:29 - Trial = 23904/30000 | Total reward = 28.70
2022-01-26 14:18:22.486 | DEBUG    | __main__:trials:24 - Trial = 23905/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.488 | DEBUG    | __main__:trials:29 - Trial = 23905/30000 | Total reward = 38.82
2022-01-26 14:18:22.491 | DEBUG    | __main__:trials:24 - Trial = 23906/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.493 | DEBUG    | __main__:trials:29 - Trial = 23906/30000 | Total reward = 49.04
2022-01-26 14:18:22.496 | DEBUG    | __main__:trials:24 - Trial = 23907/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.498 | DEBUG    | __main__:trials:29 - Trial = 23907/30000 | Total reward = 34.81
2022-01-26 14:18:22.502 | DEBUG    | __main__:trials:24 - Trial = 23908/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.503 | DEBUG    | __main__:trials:29 - Trial = 23908/30000 | Total reward = 48.66
2022-01-26 14:18:22.507 | DEBUG    | __main__:trials:24 - Trial = 23909/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.508 | DEBUG    | __main__:trials:29 - Trial = 23909/30000 | Total reward = 36.72
2022-01-26 14:18:22.512 | DEBUG    | __main__:trials:24 - Trial = 23910/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.514 | DEBUG    | __main__:trials:29 - Trial = 23910/30000 | Total reward = 33.28
2022-01-26 14:18:22.518 | DEBUG    | __main__:trials:24 - Trial = 23911/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.519 | DEBUG    | __main__:trials:29 - Trial = 23911/30000 | Total reward = 40.90
2022-01-26 14:18:22.523 | DEBUG    | __main__:trials:24 - Trial = 23912/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.524 | DEBUG    | __main__:trials:29 - Trial = 23912/30000 | Total reward = 43.88
2022-01-26 14:18:22.528 | DEBUG    | __main__:trials:24 - Trial = 23913/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.530 | DEBUG    | __main__:trials:29 - Trial = 23913/30000 | Total reward = 35.58
2022-01-26 14:18:22.533 | DEBUG    | __main__:trials:24 - Trial = 23914/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.535 | DEBUG    | __main__:trials:29 - Trial = 23914/30000 | Total reward = 37.38
2022-01-26 14:18:22.539 | DEBUG    | __main__:trials:24 - Trial = 23915/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.540 | DEBUG    | __main__:trials:29 - Trial = 23915/30000 | Total reward = 39.12
2022-01-26 14:18:22.544 | DEBUG    | __main__:trials:24 - Trial = 23916/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.546 | DEBUG    | __main__:trials:29 - Trial = 23916/30000 | Total reward = 45.75
2022-01-26 14:18:22.549 | DEBUG    | __main__:trials:24 - Trial = 23917/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.551 | DEBUG    | __main__:trials:29 - Trial = 23917/30000 | Total reward = 36.51
2022-01-26 14:18:22.554 | DEBUG    | __main__:trials:24 - Trial = 23918/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.556 | DEBUG    | __main__:trials:29 - Trial = 23918/30000 | Total reward = 39.80
2022-01-26 14:18:22.559 | DEBUG    | __main__:trials:24 - Trial = 23919/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.560 | DEBUG    | __main__:trials:29 - Trial = 23919/30000 | Total reward = 37.73
2022-01-26 14:18:22.564 | DEBUG    | __main__:trials:26 - Trial = 23920/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.566 | DEBUG    | __main__:trials:29 - Trial = 23920/30000 | Total reward = 30.57
2022-01-26 14:18:22.569 | DEBUG    | __main__:trials:24 - Trial = 23921/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.570 | DEBUG    | __main__:trials:29 - Trial = 23921/30000 | Total reward = 44.85
2022-01-26 14:18:22.574 | DEBUG    | __main__:trials:24 - Trial = 23922/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.575 | DEBUG    | __main__:trials:29 - Trial = 23922/30000 | Total reward = 31.85
2022-01-26 14:18:22.579 | DEBUG    | __main__:trials:24 - Trial = 23923/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.581 | DEBUG    | __main__:trials:29 - Trial = 23923/30000 | Total reward = 37.40
2022-01-26 14:18:22.584 | DEBUG    | __main__:trials:24 - Trial = 23924/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.586 | DEBUG    | __main__:trials:29 - Trial = 23924/30000 | Total reward = 39.91
2022-01-26 14:18:22.590 | DEBUG    | __main__:trials:24 - Trial = 23925/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.591 | DEBUG    | __main__:trials:29 - Trial = 23925/30000 | Total reward = 37.99
2022-01-26 14:18:22.595 | DEBUG    | __main__:trials:24 - Trial = 23926/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.596 | DEBUG    | __main__:trials:29 - Trial = 23926/30000 | Total reward = 47.92
2022-01-26 14:18:22.600 | DEBUG    | __main__:trials:24 - Trial = 23927/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.602 | DEBUG    | __main__:trials:29 - Trial = 23927/30000 | Total reward = 38.50
2022-01-26 14:18:22.605 | DEBUG    | __main__:trials:24 - Trial = 23928/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.606 | DEBUG    | __main__:trials:29 - Trial = 23928/30000 | Total reward = 35.20
2022-01-26 14:18:22.610 | DEBUG    | __main__:trials:24 - Trial = 23929/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.612 | DEBUG    | __main__:trials:29 - Trial = 23929/30000 | Total reward = 40.19
2022-01-26 14:18:22.615 | DEBUG    | __main__:trials:24 - Trial = 23930/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.617 | DEBUG    | __main__:trials:29 - Trial = 23930/30000 | Total reward = 35.40
2022-01-26 14:18:22.620 | DEBUG    | __main__:trials:24 - Trial = 23931/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.622 | DEBUG    | __main__:trials:29 - Trial = 23931/30000 | Total reward = 27.82
2022-01-26 14:18:22.625 | DEBUG    | __main__:trials:24 - Trial = 23932/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.627 | DEBUG    | __main__:trials:29 - Trial = 23932/30000 | Total reward = 33.15
2022-01-26 14:18:22.631 | DEBUG    | __main__:trials:24 - Trial = 23933/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.632 | DEBUG    | __main__:trials:29 - Trial = 23933/30000 | Total reward = 38.96
2022-01-26 14:18:22.636 | DEBUG    | __main__:trials:24 - Trial = 23934/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.637 | DEBUG    | __main__:trials:29 - Trial = 23934/30000 | Total reward = 40.00
2022-01-26 14:18:22.641 | DEBUG    | __main__:trials:24 - Trial = 23935/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.642 | DEBUG    | __main__:trials:29 - Trial = 23935/30000 | Total reward = 40.47
2022-01-26 14:18:22.646 | DEBUG    | __main__:trials:24 - Trial = 23936/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.647 | DEBUG    | __main__:trials:29 - Trial = 23936/30000 | Total reward = 32.32
2022-01-26 14:18:22.650 | DEBUG    | __main__:trials:24 - Trial = 23937/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.652 | DEBUG    | __main__:trials:29 - Trial = 23937/30000 | Total reward = 40.00
2022-01-26 14:18:22.656 | DEBUG    | __main__:trials:24 - Trial = 23938/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.656 | DEBUG    | __main__:trials:29 - Trial = 23938/30000 | Total reward = 36.65
2022-01-26 14:18:22.660 | DEBUG    | __main__:trials:24 - Trial = 23939/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.662 | DEBUG    | __main__:trials:29 - Trial = 23939/30000 | Total reward = 35.80
2022-01-26 14:18:22.666 | DEBUG    | __main__:trials:24 - Trial = 23940/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.667 | DEBUG    | __main__:trials:29 - Trial = 23940/30000 | Total reward = 39.56
2022-01-26 14:18:22.671 | DEBUG    | __main__:trials:24 - Trial = 23941/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.672 | DEBUG    | __main__:trials:29 - Trial = 23941/30000 | Total reward = 34.47
2022-01-26 14:18:22.676 | DEBUG    | __main__:trials:26 - Trial = 23942/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.677 | DEBUG    | __main__:trials:29 - Trial = 23942/30000 | Total reward = 30.09
2022-01-26 14:18:22.682 | DEBUG    | __main__:trials:24 - Trial = 23943/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.683 | DEBUG    | __main__:trials:29 - Trial = 23943/30000 | Total reward = 31.32
2022-01-26 14:18:22.686 | DEBUG    | __main__:trials:24 - Trial = 23944/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.688 | DEBUG    | __main__:trials:29 - Trial = 23944/30000 | Total reward = 39.62
2022-01-26 14:18:22.692 | DEBUG    | __main__:trials:24 - Trial = 23945/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.693 | DEBUG    | __main__:trials:29 - Trial = 23945/30000 | Total reward = 39.99
2022-01-26 14:18:22.696 | DEBUG    | __main__:trials:24 - Trial = 23946/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.698 | DEBUG    | __main__:trials:29 - Trial = 23946/30000 | Total reward = 30.57
2022-01-26 14:18:22.702 | DEBUG    | __main__:trials:24 - Trial = 23947/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.703 | DEBUG    | __main__:trials:29 - Trial = 23947/30000 | Total reward = 39.80
2022-01-26 14:18:22.706 | DEBUG    | __main__:trials:24 - Trial = 23948/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.708 | DEBUG    | __main__:trials:29 - Trial = 23948/30000 | Total reward = 40.00
2022-01-26 14:18:22.712 | DEBUG    | __main__:trials:24 - Trial = 23949/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.713 | DEBUG    | __main__:trials:29 - Trial = 23949/30000 | Total reward = 38.52
2022-01-26 14:18:22.717 | DEBUG    | __main__:trials:26 - Trial = 23950/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.718 | DEBUG    | __main__:trials:29 - Trial = 23950/30000 | Total reward = 28.46
2022-01-26 14:18:22.722 | DEBUG    | __main__:trials:24 - Trial = 23951/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.724 | DEBUG    | __main__:trials:29 - Trial = 23951/30000 | Total reward = 50.49
2022-01-26 14:18:22.727 | DEBUG    | __main__:trials:24 - Trial = 23952/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.729 | DEBUG    | __main__:trials:29 - Trial = 23952/30000 | Total reward = 37.07
2022-01-26 14:18:22.733 | DEBUG    | __main__:trials:24 - Trial = 23953/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.734 | DEBUG    | __main__:trials:29 - Trial = 23953/30000 | Total reward = 39.39
2022-01-26 14:18:22.738 | DEBUG    | __main__:trials:24 - Trial = 23954/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.738 | DEBUG    | __main__:trials:29 - Trial = 23954/30000 | Total reward = 37.81
2022-01-26 14:18:22.743 | DEBUG    | __main__:trials:24 - Trial = 23955/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.744 | DEBUG    | __main__:trials:29 - Trial = 23955/30000 | Total reward = 25.32
2022-01-26 14:18:22.748 | DEBUG    | __main__:trials:24 - Trial = 23956/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.750 | DEBUG    | __main__:trials:29 - Trial = 23956/30000 | Total reward = 31.43
2022-01-26 14:18:22.753 | DEBUG    | __main__:trials:24 - Trial = 23957/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.755 | DEBUG    | __main__:trials:29 - Trial = 23957/30000 | Total reward = 41.21
2022-01-26 14:18:22.759 | DEBUG    | __main__:trials:24 - Trial = 23958/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.760 | DEBUG    | __main__:trials:29 - Trial = 23958/30000 | Total reward = 29.35
2022-01-26 14:18:22.764 | DEBUG    | __main__:trials:24 - Trial = 23959/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.765 | DEBUG    | __main__:trials:29 - Trial = 23959/30000 | Total reward = 38.35
2022-01-26 14:18:22.769 | DEBUG    | __main__:trials:24 - Trial = 23960/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.770 | DEBUG    | __main__:trials:29 - Trial = 23960/30000 | Total reward = 37.44
2022-01-26 14:18:22.774 | DEBUG    | __main__:trials:24 - Trial = 23961/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.775 | DEBUG    | __main__:trials:29 - Trial = 23961/30000 | Total reward = 38.05
2022-01-26 14:18:22.779 | DEBUG    | __main__:trials:24 - Trial = 23962/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.780 | DEBUG    | __main__:trials:29 - Trial = 23962/30000 | Total reward = 52.46
2022-01-26 14:18:22.784 | DEBUG    | __main__:trials:24 - Trial = 23963/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.785 | DEBUG    | __main__:trials:29 - Trial = 23963/30000 | Total reward = 40.60
2022-01-26 14:18:22.788 | DEBUG    | __main__:trials:24 - Trial = 23964/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.789 | DEBUG    | __main__:trials:29 - Trial = 23964/30000 | Total reward = 29.86
2022-01-26 14:18:22.792 | DEBUG    | __main__:trials:24 - Trial = 23965/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.793 | DEBUG    | __main__:trials:29 - Trial = 23965/30000 | Total reward = 36.52
2022-01-26 14:18:22.796 | DEBUG    | __main__:trials:24 - Trial = 23966/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.797 | DEBUG    | __main__:trials:29 - Trial = 23966/30000 | Total reward = 39.98
2022-01-26 14:18:22.800 | DEBUG    | __main__:trials:24 - Trial = 23967/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.801 | DEBUG    | __main__:trials:29 - Trial = 23967/30000 | Total reward = 38.13
2022-01-26 14:18:22.804 | DEBUG    | __main__:trials:24 - Trial = 23968/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.805 | DEBUG    | __main__:trials:29 - Trial = 23968/30000 | Total reward = 47.08
2022-01-26 14:18:22.808 | DEBUG    | __main__:trials:24 - Trial = 23969/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.810 | DEBUG    | __main__:trials:29 - Trial = 23969/30000 | Total reward = 37.14
2022-01-26 14:18:22.814 | DEBUG    | __main__:trials:24 - Trial = 23970/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.815 | DEBUG    | __main__:trials:29 - Trial = 23970/30000 | Total reward = 34.83
2022-01-26 14:18:22.819 | DEBUG    | __main__:trials:24 - Trial = 23971/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.820 | DEBUG    | __main__:trials:29 - Trial = 23971/30000 | Total reward = 36.29
2022-01-26 14:18:22.824 | DEBUG    | __main__:trials:24 - Trial = 23972/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.825 | DEBUG    | __main__:trials:29 - Trial = 23972/30000 | Total reward = 45.91
2022-01-26 14:18:22.829 | DEBUG    | __main__:trials:24 - Trial = 23973/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.831 | DEBUG    | __main__:trials:29 - Trial = 23973/30000 | Total reward = 41.25
2022-01-26 14:18:22.835 | DEBUG    | __main__:trials:24 - Trial = 23974/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.836 | DEBUG    | __main__:trials:29 - Trial = 23974/30000 | Total reward = 27.98
2022-01-26 14:18:22.839 | DEBUG    | __main__:trials:24 - Trial = 23975/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.841 | DEBUG    | __main__:trials:29 - Trial = 23975/30000 | Total reward = 39.80
2022-01-26 14:18:22.844 | DEBUG    | __main__:trials:24 - Trial = 23976/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.846 | DEBUG    | __main__:trials:29 - Trial = 23976/30000 | Total reward = 39.76
2022-01-26 14:18:22.849 | DEBUG    | __main__:trials:24 - Trial = 23977/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.851 | DEBUG    | __main__:trials:29 - Trial = 23977/30000 | Total reward = 23.16
2022-01-26 14:18:22.855 | DEBUG    | __main__:trials:24 - Trial = 23978/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.856 | DEBUG    | __main__:trials:29 - Trial = 23978/30000 | Total reward = 40.00
2022-01-26 14:18:22.859 | DEBUG    | __main__:trials:26 - Trial = 23979/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.861 | DEBUG    | __main__:trials:29 - Trial = 23979/30000 | Total reward = 17.46
2022-01-26 14:18:22.864 | DEBUG    | __main__:trials:24 - Trial = 23980/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.866 | DEBUG    | __main__:trials:29 - Trial = 23980/30000 | Total reward = 29.15
2022-01-26 14:18:22.870 | DEBUG    | __main__:trials:24 - Trial = 23981/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.871 | DEBUG    | __main__:trials:29 - Trial = 23981/30000 | Total reward = 38.10
2022-01-26 14:18:22.875 | DEBUG    | __main__:trials:24 - Trial = 23982/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.877 | DEBUG    | __main__:trials:29 - Trial = 23982/30000 | Total reward = 39.20
2022-01-26 14:18:22.880 | DEBUG    | __main__:trials:24 - Trial = 23983/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.882 | DEBUG    | __main__:trials:29 - Trial = 23983/30000 | Total reward = 37.82
2022-01-26 14:18:22.886 | DEBUG    | __main__:trials:24 - Trial = 23984/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.887 | DEBUG    | __main__:trials:29 - Trial = 23984/30000 | Total reward = 40.63
2022-01-26 14:18:22.891 | DEBUG    | __main__:trials:24 - Trial = 23985/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.891 | DEBUG    | __main__:trials:29 - Trial = 23985/30000 | Total reward = 30.36
2022-01-26 14:18:22.896 | DEBUG    | __main__:trials:24 - Trial = 23986/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.897 | DEBUG    | __main__:trials:29 - Trial = 23986/30000 | Total reward = 30.20
2022-01-26 14:18:22.901 | DEBUG    | __main__:trials:24 - Trial = 23987/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.902 | DEBUG    | __main__:trials:29 - Trial = 23987/30000 | Total reward = 28.19
2022-01-26 14:18:22.906 | DEBUG    | __main__:trials:24 - Trial = 23988/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.908 | DEBUG    | __main__:trials:29 - Trial = 23988/30000 | Total reward = 39.72
2022-01-26 14:18:22.911 | DEBUG    | __main__:trials:24 - Trial = 23989/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.912 | DEBUG    | __main__:trials:29 - Trial = 23989/30000 | Total reward = 39.80
2022-01-26 14:18:22.916 | DEBUG    | __main__:trials:26 - Trial = 23990/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.917 | DEBUG    | __main__:trials:29 - Trial = 23990/30000 | Total reward = 23.26
2022-01-26 14:18:22.921 | DEBUG    | __main__:trials:24 - Trial = 23991/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.922 | DEBUG    | __main__:trials:29 - Trial = 23991/30000 | Total reward = 45.69
2022-01-26 14:18:22.926 | DEBUG    | __main__:trials:24 - Trial = 23992/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.927 | DEBUG    | __main__:trials:29 - Trial = 23992/30000 | Total reward = 32.46
2022-01-26 14:18:22.931 | DEBUG    | __main__:trials:24 - Trial = 23993/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.933 | DEBUG    | __main__:trials:29 - Trial = 23993/30000 | Total reward = 39.25
2022-01-26 14:18:22.936 | DEBUG    | __main__:trials:24 - Trial = 23994/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.937 | DEBUG    | __main__:trials:29 - Trial = 23994/30000 | Total reward = 40.20
2022-01-26 14:18:22.940 | DEBUG    | __main__:trials:26 - Trial = 23995/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.941 | DEBUG    | __main__:trials:29 - Trial = 23995/30000 | Total reward = 15.71
2022-01-26 14:18:22.944 | DEBUG    | __main__:trials:24 - Trial = 23996/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.945 | DEBUG    | __main__:trials:29 - Trial = 23996/30000 | Total reward = 61.75
2022-01-26 14:18:22.949 | DEBUG    | __main__:trials:24 - Trial = 23997/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.949 | DEBUG    | __main__:trials:29 - Trial = 23997/30000 | Total reward = 33.94
2022-01-26 14:18:22.953 | DEBUG    | __main__:trials:24 - Trial = 23998/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.955 | DEBUG    | __main__:trials:29 - Trial = 23998/30000 | Total reward = 33.69
2022-01-26 14:18:22.958 | DEBUG    | __main__:trials:24 - Trial = 23999/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.959 | DEBUG    | __main__:trials:29 - Trial = 23999/30000 | Total reward = 51.95
2022-01-26 14:18:22.963 | DEBUG    | __main__:trials:24 - Trial = 24000/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.964 | DEBUG    | __main__:trials:29 - Trial = 24000/30000 | Total reward = 38.70
2022-01-26 14:18:22.968 | DEBUG    | __main__:trials:26 - Trial = 24001/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.969 | DEBUG    | __main__:trials:29 - Trial = 24001/30000 | Total reward = 26.41
2022-01-26 14:18:22.973 | DEBUG    | __main__:trials:26 - Trial = 24002/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:22.975 | DEBUG    | __main__:trials:29 - Trial = 24002/30000 | Total reward = 20.70
2022-01-26 14:18:22.978 | DEBUG    | __main__:trials:24 - Trial = 24003/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.979 | DEBUG    | __main__:trials:29 - Trial = 24003/30000 | Total reward = 34.90
2022-01-26 14:18:22.983 | DEBUG    | __main__:trials:24 - Trial = 24004/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.985 | DEBUG    | __main__:trials:29 - Trial = 24004/30000 | Total reward = 40.00
2022-01-26 14:18:22.988 | DEBUG    | __main__:trials:24 - Trial = 24005/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.989 | DEBUG    | __main__:trials:29 - Trial = 24005/30000 | Total reward = 38.32
2022-01-26 14:18:22.993 | DEBUG    | __main__:trials:24 - Trial = 24006/30000 | Max number of steps (20) reached
2022-01-26 14:18:22.995 | DEBUG    | __main__:trials:29 - Trial = 24006/30000 | Total reward = 39.20
2022-01-26 14:18:22.999 | DEBUG    | __main__:trials:24 - Trial = 24007/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.000 | DEBUG    | __main__:trials:29 - Trial = 24007/30000 | Total reward = 38.83
2022-01-26 14:18:23.004 | DEBUG    | __main__:trials:24 - Trial = 24008/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.005 | DEBUG    | __main__:trials:29 - Trial = 24008/30000 | Total reward = 32.10
2022-01-26 14:18:23.009 | DEBUG    | __main__:trials:24 - Trial = 24009/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.010 | DEBUG    | __main__:trials:29 - Trial = 24009/30000 | Total reward = 39.80
2022-01-26 14:18:23.014 | DEBUG    | __main__:trials:24 - Trial = 24010/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.014 | DEBUG    | __main__:trials:29 - Trial = 24010/30000 | Total reward = 33.89
2022-01-26 14:18:23.019 | DEBUG    | __main__:trials:24 - Trial = 24011/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.020 | DEBUG    | __main__:trials:29 - Trial = 24011/30000 | Total reward = 31.27
2022-01-26 14:18:23.023 | DEBUG    | __main__:trials:24 - Trial = 24012/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.025 | DEBUG    | __main__:trials:29 - Trial = 24012/30000 | Total reward = 40.00
2022-01-26 14:18:23.029 | DEBUG    | __main__:trials:24 - Trial = 24013/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.030 | DEBUG    | __main__:trials:29 - Trial = 24013/30000 | Total reward = 37.52
2022-01-26 14:18:23.034 | DEBUG    | __main__:trials:24 - Trial = 24014/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.035 | DEBUG    | __main__:trials:29 - Trial = 24014/30000 | Total reward = 20.95
2022-01-26 14:18:23.039 | DEBUG    | __main__:trials:24 - Trial = 24015/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.040 | DEBUG    | __main__:trials:29 - Trial = 24015/30000 | Total reward = 39.96
2022-01-26 14:18:23.044 | DEBUG    | __main__:trials:24 - Trial = 24016/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.046 | DEBUG    | __main__:trials:29 - Trial = 24016/30000 | Total reward = 37.62
2022-01-26 14:18:23.049 | DEBUG    | __main__:trials:24 - Trial = 24017/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.050 | DEBUG    | __main__:trials:29 - Trial = 24017/30000 | Total reward = 30.16
2022-01-26 14:18:23.055 | DEBUG    | __main__:trials:24 - Trial = 24018/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.055 | DEBUG    | __main__:trials:29 - Trial = 24018/30000 | Total reward = 37.82
2022-01-26 14:18:23.059 | DEBUG    | __main__:trials:24 - Trial = 24019/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.061 | DEBUG    | __main__:trials:29 - Trial = 24019/30000 | Total reward = 39.15
2022-01-26 14:18:23.064 | DEBUG    | __main__:trials:24 - Trial = 24020/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.065 | DEBUG    | __main__:trials:29 - Trial = 24020/30000 | Total reward = 42.39
2022-01-26 14:18:23.068 | DEBUG    | __main__:trials:24 - Trial = 24021/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.070 | DEBUG    | __main__:trials:29 - Trial = 24021/30000 | Total reward = 34.81
2022-01-26 14:18:23.074 | DEBUG    | __main__:trials:24 - Trial = 24022/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.074 | DEBUG    | __main__:trials:29 - Trial = 24022/30000 | Total reward = 27.93
2022-01-26 14:18:23.078 | DEBUG    | __main__:trials:24 - Trial = 24023/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.078 | DEBUG    | __main__:trials:29 - Trial = 24023/30000 | Total reward = 34.22
2022-01-26 14:18:23.082 | DEBUG    | __main__:trials:24 - Trial = 24024/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.084 | DEBUG    | __main__:trials:29 - Trial = 24024/30000 | Total reward = 37.80
2022-01-26 14:18:23.087 | DEBUG    | __main__:trials:24 - Trial = 24025/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.088 | DEBUG    | __main__:trials:29 - Trial = 24025/30000 | Total reward = 39.42
2022-01-26 14:18:23.091 | DEBUG    | __main__:trials:24 - Trial = 24026/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.093 | DEBUG    | __main__:trials:29 - Trial = 24026/30000 | Total reward = 34.34
2022-01-26 14:18:23.096 | DEBUG    | __main__:trials:24 - Trial = 24027/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.098 | DEBUG    | __main__:trials:29 - Trial = 24027/30000 | Total reward = 38.86
2022-01-26 14:18:23.101 | DEBUG    | __main__:trials:24 - Trial = 24028/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.102 | DEBUG    | __main__:trials:29 - Trial = 24028/30000 | Total reward = 41.49
2022-01-26 14:18:23.106 | DEBUG    | __main__:trials:24 - Trial = 24029/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.108 | DEBUG    | __main__:trials:29 - Trial = 24029/30000 | Total reward = 36.78
2022-01-26 14:18:23.111 | DEBUG    | __main__:trials:26 - Trial = 24030/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.111 | DEBUG    | __main__:trials:29 - Trial = 24030/30000 | Total reward = 19.80
2022-01-26 14:18:23.116 | DEBUG    | __main__:trials:24 - Trial = 24031/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.117 | DEBUG    | __main__:trials:29 - Trial = 24031/30000 | Total reward = 40.65
2022-01-26 14:18:23.120 | DEBUG    | __main__:trials:24 - Trial = 24032/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.122 | DEBUG    | __main__:trials:29 - Trial = 24032/30000 | Total reward = 35.82
2022-01-26 14:18:23.126 | DEBUG    | __main__:trials:24 - Trial = 24033/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.127 | DEBUG    | __main__:trials:29 - Trial = 24033/30000 | Total reward = 28.72
2022-01-26 14:18:23.131 | DEBUG    | __main__:trials:24 - Trial = 24034/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.131 | DEBUG    | __main__:trials:29 - Trial = 24034/30000 | Total reward = 40.47
2022-01-26 14:18:23.136 | DEBUG    | __main__:trials:24 - Trial = 24035/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.138 | DEBUG    | __main__:trials:29 - Trial = 24035/30000 | Total reward = 40.28
2022-01-26 14:18:23.141 | DEBUG    | __main__:trials:24 - Trial = 24036/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.143 | DEBUG    | __main__:trials:29 - Trial = 24036/30000 | Total reward = 38.89
2022-01-26 14:18:23.146 | DEBUG    | __main__:trials:24 - Trial = 24037/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.148 | DEBUG    | __main__:trials:29 - Trial = 24037/30000 | Total reward = 34.31
2022-01-26 14:18:23.151 | DEBUG    | __main__:trials:24 - Trial = 24038/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.152 | DEBUG    | __main__:trials:29 - Trial = 24038/30000 | Total reward = 39.64
2022-01-26 14:18:23.156 | DEBUG    | __main__:trials:24 - Trial = 24039/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.157 | DEBUG    | __main__:trials:29 - Trial = 24039/30000 | Total reward = 35.37
2022-01-26 14:18:23.161 | DEBUG    | __main__:trials:24 - Trial = 24040/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.162 | DEBUG    | __main__:trials:29 - Trial = 24040/30000 | Total reward = 33.26
2022-01-26 14:18:23.166 | DEBUG    | __main__:trials:26 - Trial = 24041/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.166 | DEBUG    | __main__:trials:29 - Trial = 24041/30000 | Total reward = 32.29
2022-01-26 14:18:23.171 | DEBUG    | __main__:trials:24 - Trial = 24042/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.173 | DEBUG    | __main__:trials:29 - Trial = 24042/30000 | Total reward = 35.51
2022-01-26 14:18:23.176 | DEBUG    | __main__:trials:24 - Trial = 24043/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.177 | DEBUG    | __main__:trials:29 - Trial = 24043/30000 | Total reward = 40.43
2022-01-26 14:18:23.180 | DEBUG    | __main__:trials:24 - Trial = 24044/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.182 | DEBUG    | __main__:trials:29 - Trial = 24044/30000 | Total reward = 40.00
2022-01-26 14:18:23.185 | DEBUG    | __main__:trials:24 - Trial = 24045/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.186 | DEBUG    | __main__:trials:29 - Trial = 24045/30000 | Total reward = 38.21
2022-01-26 14:18:23.189 | DEBUG    | __main__:trials:24 - Trial = 24046/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.191 | DEBUG    | __main__:trials:29 - Trial = 24046/30000 | Total reward = 40.38
2022-01-26 14:18:23.194 | DEBUG    | __main__:trials:24 - Trial = 24047/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.196 | DEBUG    | __main__:trials:29 - Trial = 24047/30000 | Total reward = 35.04
2022-01-26 14:18:23.199 | DEBUG    | __main__:trials:24 - Trial = 24048/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.200 | DEBUG    | __main__:trials:29 - Trial = 24048/30000 | Total reward = 40.00
2022-01-26 14:18:23.204 | DEBUG    | __main__:trials:24 - Trial = 24049/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.205 | DEBUG    | __main__:trials:29 - Trial = 24049/30000 | Total reward = 39.80
2022-01-26 14:18:23.208 | DEBUG    | __main__:trials:24 - Trial = 24050/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.209 | DEBUG    | __main__:trials:29 - Trial = 24050/30000 | Total reward = 37.48
2022-01-26 14:18:23.213 | DEBUG    | __main__:trials:24 - Trial = 24051/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.214 | DEBUG    | __main__:trials:29 - Trial = 24051/30000 | Total reward = 49.21
2022-01-26 14:18:23.218 | DEBUG    | __main__:trials:24 - Trial = 24052/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.219 | DEBUG    | __main__:trials:29 - Trial = 24052/30000 | Total reward = 38.82
2022-01-26 14:18:23.223 | DEBUG    | __main__:trials:24 - Trial = 24053/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.224 | DEBUG    | __main__:trials:29 - Trial = 24053/30000 | Total reward = 38.23
2022-01-26 14:18:23.228 | DEBUG    | __main__:trials:24 - Trial = 24054/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.230 | DEBUG    | __main__:trials:29 - Trial = 24054/30000 | Total reward = 37.15
2022-01-26 14:18:23.233 | DEBUG    | __main__:trials:24 - Trial = 24055/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.234 | DEBUG    | __main__:trials:29 - Trial = 24055/30000 | Total reward = 42.01
2022-01-26 14:18:23.237 | DEBUG    | __main__:trials:24 - Trial = 24056/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.238 | DEBUG    | __main__:trials:29 - Trial = 24056/30000 | Total reward = 39.07
2022-01-26 14:18:23.241 | DEBUG    | __main__:trials:26 - Trial = 24057/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.242 | DEBUG    | __main__:trials:29 - Trial = 24057/30000 | Total reward = 13.98
2022-01-26 14:18:23.245 | DEBUG    | __main__:trials:24 - Trial = 24058/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.247 | DEBUG    | __main__:trials:29 - Trial = 24058/30000 | Total reward = 39.59
2022-01-26 14:18:23.250 | DEBUG    | __main__:trials:24 - Trial = 24059/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.251 | DEBUG    | __main__:trials:29 - Trial = 24059/30000 | Total reward = 33.28
2022-01-26 14:18:23.254 | DEBUG    | __main__:trials:24 - Trial = 24060/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.256 | DEBUG    | __main__:trials:29 - Trial = 24060/30000 | Total reward = 43.24
2022-01-26 14:18:23.260 | DEBUG    | __main__:trials:24 - Trial = 24061/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.260 | DEBUG    | __main__:trials:29 - Trial = 24061/30000 | Total reward = 43.58
2022-01-26 14:18:23.265 | DEBUG    | __main__:trials:24 - Trial = 24062/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.266 | DEBUG    | __main__:trials:29 - Trial = 24062/30000 | Total reward = 48.20
2022-01-26 14:18:23.269 | DEBUG    | __main__:trials:24 - Trial = 24063/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.270 | DEBUG    | __main__:trials:29 - Trial = 24063/30000 | Total reward = 36.10
2022-01-26 14:18:23.273 | DEBUG    | __main__:trials:24 - Trial = 24064/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.275 | DEBUG    | __main__:trials:29 - Trial = 24064/30000 | Total reward = 30.91
2022-01-26 14:18:23.278 | DEBUG    | __main__:trials:24 - Trial = 24065/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.279 | DEBUG    | __main__:trials:29 - Trial = 24065/30000 | Total reward = 38.23
2022-01-26 14:18:23.282 | DEBUG    | __main__:trials:26 - Trial = 24066/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.284 | DEBUG    | __main__:trials:29 - Trial = 24066/30000 | Total reward = 19.70
2022-01-26 14:18:23.287 | DEBUG    | __main__:trials:24 - Trial = 24067/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.288 | DEBUG    | __main__:trials:29 - Trial = 24067/30000 | Total reward = 39.71
2022-01-26 14:18:23.292 | DEBUG    | __main__:trials:24 - Trial = 24068/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.294 | DEBUG    | __main__:trials:29 - Trial = 24068/30000 | Total reward = 60.65
2022-01-26 14:18:23.298 | DEBUG    | __main__:trials:24 - Trial = 24069/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.298 | DEBUG    | __main__:trials:29 - Trial = 24069/30000 | Total reward = 26.33
2022-01-26 14:18:23.303 | DEBUG    | __main__:trials:26 - Trial = 24070/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.303 | DEBUG    | __main__:trials:29 - Trial = 24070/30000 | Total reward = 20.48
2022-01-26 14:18:23.307 | DEBUG    | __main__:trials:24 - Trial = 24071/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.309 | DEBUG    | __main__:trials:29 - Trial = 24071/30000 | Total reward = 29.72
2022-01-26 14:18:23.312 | DEBUG    | __main__:trials:24 - Trial = 24072/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.314 | DEBUG    | __main__:trials:29 - Trial = 24072/30000 | Total reward = 39.58
2022-01-26 14:18:23.318 | DEBUG    | __main__:trials:26 - Trial = 24073/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.319 | DEBUG    | __main__:trials:29 - Trial = 24073/30000 | Total reward = 35.41
2022-01-26 14:18:23.323 | DEBUG    | __main__:trials:24 - Trial = 24074/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.325 | DEBUG    | __main__:trials:29 - Trial = 24074/30000 | Total reward = 25.17
2022-01-26 14:18:23.328 | DEBUG    | __main__:trials:24 - Trial = 24075/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.329 | DEBUG    | __main__:trials:29 - Trial = 24075/30000 | Total reward = 43.70
2022-01-26 14:18:23.334 | DEBUG    | __main__:trials:24 - Trial = 24076/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.335 | DEBUG    | __main__:trials:29 - Trial = 24076/30000 | Total reward = 34.85
2022-01-26 14:18:23.338 | DEBUG    | __main__:trials:24 - Trial = 24077/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.340 | DEBUG    | __main__:trials:29 - Trial = 24077/30000 | Total reward = 21.44
2022-01-26 14:18:23.343 | DEBUG    | __main__:trials:24 - Trial = 24078/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.345 | DEBUG    | __main__:trials:29 - Trial = 24078/30000 | Total reward = 37.18
2022-01-26 14:18:23.348 | DEBUG    | __main__:trials:24 - Trial = 24079/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.350 | DEBUG    | __main__:trials:29 - Trial = 24079/30000 | Total reward = 40.00
2022-01-26 14:18:23.354 | DEBUG    | __main__:trials:24 - Trial = 24080/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.355 | DEBUG    | __main__:trials:29 - Trial = 24080/30000 | Total reward = 43.07
2022-01-26 14:18:23.359 | DEBUG    | __main__:trials:26 - Trial = 24081/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.360 | DEBUG    | __main__:trials:29 - Trial = 24081/30000 | Total reward = 31.29
2022-01-26 14:18:23.364 | DEBUG    | __main__:trials:24 - Trial = 24082/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.366 | DEBUG    | __main__:trials:29 - Trial = 24082/30000 | Total reward = 41.49
2022-01-26 14:18:23.370 | DEBUG    | __main__:trials:24 - Trial = 24083/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.371 | DEBUG    | __main__:trials:29 - Trial = 24083/30000 | Total reward = 41.23
2022-01-26 14:18:23.375 | DEBUG    | __main__:trials:24 - Trial = 24084/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.376 | DEBUG    | __main__:trials:29 - Trial = 24084/30000 | Total reward = 40.00
2022-01-26 14:18:23.380 | DEBUG    | __main__:trials:24 - Trial = 24085/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.382 | DEBUG    | __main__:trials:29 - Trial = 24085/30000 | Total reward = 40.10
2022-01-26 14:18:23.385 | DEBUG    | __main__:trials:24 - Trial = 24086/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.387 | DEBUG    | __main__:trials:29 - Trial = 24086/30000 | Total reward = 35.02
2022-01-26 14:18:23.390 | DEBUG    | __main__:trials:24 - Trial = 24087/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.392 | DEBUG    | __main__:trials:29 - Trial = 24087/30000 | Total reward = 28.43
2022-01-26 14:18:23.395 | DEBUG    | __main__:trials:24 - Trial = 24088/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.397 | DEBUG    | __main__:trials:29 - Trial = 24088/30000 | Total reward = 26.91
2022-01-26 14:18:23.401 | DEBUG    | __main__:trials:24 - Trial = 24089/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.402 | DEBUG    | __main__:trials:29 - Trial = 24089/30000 | Total reward = 37.50
2022-01-26 14:18:23.406 | DEBUG    | __main__:trials:24 - Trial = 24090/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.407 | DEBUG    | __main__:trials:29 - Trial = 24090/30000 | Total reward = 35.86
2022-01-26 14:18:23.410 | DEBUG    | __main__:trials:24 - Trial = 24091/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.411 | DEBUG    | __main__:trials:29 - Trial = 24091/30000 | Total reward = 39.81
2022-01-26 14:18:23.414 | DEBUG    | __main__:trials:24 - Trial = 24092/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.416 | DEBUG    | __main__:trials:29 - Trial = 24092/30000 | Total reward = 40.00
2022-01-26 14:18:23.419 | DEBUG    | __main__:trials:24 - Trial = 24093/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.421 | DEBUG    | __main__:trials:29 - Trial = 24093/30000 | Total reward = 34.69
2022-01-26 14:18:23.423 | DEBUG    | __main__:trials:26 - Trial = 24094/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.424 | DEBUG    | __main__:trials:29 - Trial = 24094/30000 | Total reward = 14.30
2022-01-26 14:18:23.428 | DEBUG    | __main__:trials:24 - Trial = 24095/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.428 | DEBUG    | __main__:trials:29 - Trial = 24095/30000 | Total reward = 38.55
2022-01-26 14:18:23.432 | DEBUG    | __main__:trials:24 - Trial = 24096/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.432 | DEBUG    | __main__:trials:29 - Trial = 24096/30000 | Total reward = 26.01
2022-01-26 14:18:23.436 | DEBUG    | __main__:trials:24 - Trial = 24097/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.437 | DEBUG    | __main__:trials:29 - Trial = 24097/30000 | Total reward = 46.78
2022-01-26 14:18:23.440 | DEBUG    | __main__:trials:24 - Trial = 24098/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.442 | DEBUG    | __main__:trials:29 - Trial = 24098/30000 | Total reward = 50.16
2022-01-26 14:18:23.445 | DEBUG    | __main__:trials:24 - Trial = 24099/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.446 | DEBUG    | __main__:trials:29 - Trial = 24099/30000 | Total reward = 41.23
2022-01-26 14:18:23.449 | DEBUG    | __main__:trials:24 - Trial = 24100/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.451 | DEBUG    | __main__:trials:29 - Trial = 24100/30000 | Total reward = 55.91
2022-01-26 14:18:23.454 | DEBUG    | __main__:trials:26 - Trial = 24101/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.455 | DEBUG    | __main__:trials:29 - Trial = 24101/30000 | Total reward = 23.37
2022-01-26 14:18:23.459 | DEBUG    | __main__:trials:24 - Trial = 24102/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.460 | DEBUG    | __main__:trials:29 - Trial = 24102/30000 | Total reward = 28.10
2022-01-26 14:18:23.464 | DEBUG    | __main__:trials:24 - Trial = 24103/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.465 | DEBUG    | __main__:trials:29 - Trial = 24103/30000 | Total reward = 38.25
2022-01-26 14:18:23.469 | DEBUG    | __main__:trials:24 - Trial = 24104/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.470 | DEBUG    | __main__:trials:29 - Trial = 24104/30000 | Total reward = 40.00
2022-01-26 14:18:23.473 | DEBUG    | __main__:trials:24 - Trial = 24105/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.475 | DEBUG    | __main__:trials:29 - Trial = 24105/30000 | Total reward = 35.62
2022-01-26 14:18:23.479 | DEBUG    | __main__:trials:24 - Trial = 24106/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.480 | DEBUG    | __main__:trials:29 - Trial = 24106/30000 | Total reward = 33.21
2022-01-26 14:18:23.483 | DEBUG    | __main__:trials:24 - Trial = 24107/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.484 | DEBUG    | __main__:trials:29 - Trial = 24107/30000 | Total reward = 39.92
2022-01-26 14:18:23.487 | DEBUG    | __main__:trials:24 - Trial = 24108/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.489 | DEBUG    | __main__:trials:29 - Trial = 24108/30000 | Total reward = 36.65
2022-01-26 14:18:23.492 | DEBUG    | __main__:trials:24 - Trial = 24109/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.493 | DEBUG    | __main__:trials:29 - Trial = 24109/30000 | Total reward = 32.80
2022-01-26 14:18:23.497 | DEBUG    | __main__:trials:24 - Trial = 24110/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.498 | DEBUG    | __main__:trials:29 - Trial = 24110/30000 | Total reward = 22.26
2022-01-26 14:18:23.501 | DEBUG    | __main__:trials:24 - Trial = 24111/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.503 | DEBUG    | __main__:trials:29 - Trial = 24111/30000 | Total reward = 37.85
2022-01-26 14:18:23.506 | DEBUG    | __main__:trials:24 - Trial = 24112/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.507 | DEBUG    | __main__:trials:29 - Trial = 24112/30000 | Total reward = 37.89
2022-01-26 14:18:23.510 | DEBUG    | __main__:trials:24 - Trial = 24113/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.511 | DEBUG    | __main__:trials:29 - Trial = 24113/30000 | Total reward = 22.58
2022-01-26 14:18:23.515 | DEBUG    | __main__:trials:24 - Trial = 24114/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.515 | DEBUG    | __main__:trials:29 - Trial = 24114/30000 | Total reward = 28.18
2022-01-26 14:18:23.519 | DEBUG    | __main__:trials:24 - Trial = 24115/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.521 | DEBUG    | __main__:trials:29 - Trial = 24115/30000 | Total reward = 37.65
2022-01-26 14:18:23.524 | DEBUG    | __main__:trials:24 - Trial = 24116/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.524 | DEBUG    | __main__:trials:29 - Trial = 24116/30000 | Total reward = 41.49
2022-01-26 14:18:23.528 | DEBUG    | __main__:trials:24 - Trial = 24117/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.530 | DEBUG    | __main__:trials:29 - Trial = 24117/30000 | Total reward = 34.87
2022-01-26 14:18:23.533 | DEBUG    | __main__:trials:24 - Trial = 24118/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.534 | DEBUG    | __main__:trials:29 - Trial = 24118/30000 | Total reward = 35.66
2022-01-26 14:18:23.537 | DEBUG    | __main__:trials:26 - Trial = 24119/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.538 | DEBUG    | __main__:trials:29 - Trial = 24119/30000 | Total reward = 15.20
2022-01-26 14:18:23.542 | DEBUG    | __main__:trials:24 - Trial = 24120/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.544 | DEBUG    | __main__:trials:29 - Trial = 24120/30000 | Total reward = 30.88
2022-01-26 14:18:23.546 | DEBUG    | __main__:trials:24 - Trial = 24121/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.548 | DEBUG    | __main__:trials:29 - Trial = 24121/30000 | Total reward = 55.96
2022-01-26 14:18:23.552 | DEBUG    | __main__:trials:24 - Trial = 24122/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.553 | DEBUG    | __main__:trials:29 - Trial = 24122/30000 | Total reward = 36.02
2022-01-26 14:18:23.556 | DEBUG    | __main__:trials:24 - Trial = 24123/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.558 | DEBUG    | __main__:trials:29 - Trial = 24123/30000 | Total reward = 29.18
2022-01-26 14:18:23.562 | DEBUG    | __main__:trials:24 - Trial = 24124/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.563 | DEBUG    | __main__:trials:29 - Trial = 24124/30000 | Total reward = 39.10
2022-01-26 14:18:23.566 | DEBUG    | __main__:trials:24 - Trial = 24125/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.568 | DEBUG    | __main__:trials:29 - Trial = 24125/30000 | Total reward = 30.43
2022-01-26 14:18:23.571 | DEBUG    | __main__:trials:24 - Trial = 24126/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.573 | DEBUG    | __main__:trials:29 - Trial = 24126/30000 | Total reward = 52.89
2022-01-26 14:18:23.576 | DEBUG    | __main__:trials:24 - Trial = 24127/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.577 | DEBUG    | __main__:trials:29 - Trial = 24127/30000 | Total reward = 17.31
2022-01-26 14:18:23.581 | DEBUG    | __main__:trials:24 - Trial = 24128/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.583 | DEBUG    | __main__:trials:29 - Trial = 24128/30000 | Total reward = 38.23
2022-01-26 14:18:23.586 | DEBUG    | __main__:trials:24 - Trial = 24129/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.587 | DEBUG    | __main__:trials:29 - Trial = 24129/30000 | Total reward = 34.23
2022-01-26 14:18:23.590 | DEBUG    | __main__:trials:26 - Trial = 24130/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.592 | DEBUG    | __main__:trials:29 - Trial = 24130/30000 | Total reward = 14.65
2022-01-26 14:18:23.595 | DEBUG    | __main__:trials:24 - Trial = 24131/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.596 | DEBUG    | __main__:trials:29 - Trial = 24131/30000 | Total reward = 37.39
2022-01-26 14:18:23.600 | DEBUG    | __main__:trials:24 - Trial = 24132/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.601 | DEBUG    | __main__:trials:29 - Trial = 24132/30000 | Total reward = 35.31
2022-01-26 14:18:23.605 | DEBUG    | __main__:trials:24 - Trial = 24133/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.607 | DEBUG    | __main__:trials:29 - Trial = 24133/30000 | Total reward = 32.60
2022-01-26 14:18:23.609 | DEBUG    | __main__:trials:26 - Trial = 24134/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.610 | DEBUG    | __main__:trials:29 - Trial = 24134/30000 | Total reward = 19.32
2022-01-26 14:18:23.613 | DEBUG    | __main__:trials:24 - Trial = 24135/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.615 | DEBUG    | __main__:trials:29 - Trial = 24135/30000 | Total reward = 50.15
2022-01-26 14:18:23.618 | DEBUG    | __main__:trials:24 - Trial = 24136/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.619 | DEBUG    | __main__:trials:29 - Trial = 24136/30000 | Total reward = 37.60
2022-01-26 14:18:23.622 | DEBUG    | __main__:trials:24 - Trial = 24137/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.623 | DEBUG    | __main__:trials:29 - Trial = 24137/30000 | Total reward = 38.26
2022-01-26 14:18:23.626 | DEBUG    | __main__:trials:24 - Trial = 24138/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.627 | DEBUG    | __main__:trials:29 - Trial = 24138/30000 | Total reward = 49.36
2022-01-26 14:18:23.630 | DEBUG    | __main__:trials:24 - Trial = 24139/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.632 | DEBUG    | __main__:trials:29 - Trial = 24139/30000 | Total reward = 35.04
2022-01-26 14:18:23.636 | DEBUG    | __main__:trials:24 - Trial = 24140/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.637 | DEBUG    | __main__:trials:29 - Trial = 24140/30000 | Total reward = 37.11
2022-01-26 14:18:23.639 | DEBUG    | __main__:trials:26 - Trial = 24141/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.641 | DEBUG    | __main__:trials:29 - Trial = 24141/30000 | Total reward = 15.71
2022-01-26 14:18:23.644 | DEBUG    | __main__:trials:24 - Trial = 24142/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.646 | DEBUG    | __main__:trials:29 - Trial = 24142/30000 | Total reward = 32.80
2022-01-26 14:18:23.649 | DEBUG    | __main__:trials:24 - Trial = 24143/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.651 | DEBUG    | __main__:trials:29 - Trial = 24143/30000 | Total reward = 37.65
2022-01-26 14:18:23.655 | DEBUG    | __main__:trials:24 - Trial = 24144/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.656 | DEBUG    | __main__:trials:29 - Trial = 24144/30000 | Total reward = 38.27
2022-01-26 14:18:23.660 | DEBUG    | __main__:trials:24 - Trial = 24145/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.661 | DEBUG    | __main__:trials:29 - Trial = 24145/30000 | Total reward = 37.83
2022-01-26 14:18:23.665 | DEBUG    | __main__:trials:24 - Trial = 24146/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.666 | DEBUG    | __main__:trials:29 - Trial = 24146/30000 | Total reward = 38.27
2022-01-26 14:18:23.670 | DEBUG    | __main__:trials:24 - Trial = 24147/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.671 | DEBUG    | __main__:trials:29 - Trial = 24147/30000 | Total reward = 34.79
2022-01-26 14:18:23.675 | DEBUG    | __main__:trials:24 - Trial = 24148/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.676 | DEBUG    | __main__:trials:29 - Trial = 24148/30000 | Total reward = 32.73
2022-01-26 14:18:23.680 | DEBUG    | __main__:trials:24 - Trial = 24149/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.681 | DEBUG    | __main__:trials:29 - Trial = 24149/30000 | Total reward = 37.89
2022-01-26 14:18:23.684 | DEBUG    | __main__:trials:24 - Trial = 24150/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.686 | DEBUG    | __main__:trials:29 - Trial = 24150/30000 | Total reward = 21.62
2022-01-26 14:18:23.690 | DEBUG    | __main__:trials:24 - Trial = 24151/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.691 | DEBUG    | __main__:trials:29 - Trial = 24151/30000 | Total reward = 37.71
2022-01-26 14:18:23.695 | DEBUG    | __main__:trials:24 - Trial = 24152/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.697 | DEBUG    | __main__:trials:29 - Trial = 24152/30000 | Total reward = 24.38
2022-01-26 14:18:23.700 | DEBUG    | __main__:trials:24 - Trial = 24153/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.702 | DEBUG    | __main__:trials:29 - Trial = 24153/30000 | Total reward = 33.51
2022-01-26 14:18:23.705 | DEBUG    | __main__:trials:26 - Trial = 24154/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.706 | DEBUG    | __main__:trials:29 - Trial = 24154/30000 | Total reward = 17.52
2022-01-26 14:18:23.710 | DEBUG    | __main__:trials:24 - Trial = 24155/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.711 | DEBUG    | __main__:trials:29 - Trial = 24155/30000 | Total reward = 38.56
2022-01-26 14:18:23.715 | DEBUG    | __main__:trials:24 - Trial = 24156/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.717 | DEBUG    | __main__:trials:29 - Trial = 24156/30000 | Total reward = 37.29
2022-01-26 14:18:23.720 | DEBUG    | __main__:trials:24 - Trial = 24157/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.722 | DEBUG    | __main__:trials:29 - Trial = 24157/30000 | Total reward = 33.12
2022-01-26 14:18:23.725 | DEBUG    | __main__:trials:24 - Trial = 24158/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.726 | DEBUG    | __main__:trials:29 - Trial = 24158/30000 | Total reward = 50.13
2022-01-26 14:18:23.731 | DEBUG    | __main__:trials:24 - Trial = 24159/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.732 | DEBUG    | __main__:trials:29 - Trial = 24159/30000 | Total reward = 39.04
2022-01-26 14:18:23.736 | DEBUG    | __main__:trials:24 - Trial = 24160/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.737 | DEBUG    | __main__:trials:29 - Trial = 24160/30000 | Total reward = 43.03
2022-01-26 14:18:23.741 | DEBUG    | __main__:trials:24 - Trial = 24161/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.742 | DEBUG    | __main__:trials:29 - Trial = 24161/30000 | Total reward = 35.12
2022-01-26 14:18:23.746 | DEBUG    | __main__:trials:24 - Trial = 24162/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.747 | DEBUG    | __main__:trials:29 - Trial = 24162/30000 | Total reward = 39.07
2022-01-26 14:18:23.750 | DEBUG    | __main__:trials:24 - Trial = 24163/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.752 | DEBUG    | __main__:trials:29 - Trial = 24163/30000 | Total reward = 38.28
2022-01-26 14:18:23.756 | DEBUG    | __main__:trials:24 - Trial = 24164/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.757 | DEBUG    | __main__:trials:29 - Trial = 24164/30000 | Total reward = 46.01
2022-01-26 14:18:23.760 | DEBUG    | __main__:trials:24 - Trial = 24165/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.762 | DEBUG    | __main__:trials:29 - Trial = 24165/30000 | Total reward = 37.46
2022-01-26 14:18:23.765 | DEBUG    | __main__:trials:24 - Trial = 24166/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.767 | DEBUG    | __main__:trials:29 - Trial = 24166/30000 | Total reward = 42.65
2022-01-26 14:18:23.770 | DEBUG    | __main__:trials:24 - Trial = 24167/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.772 | DEBUG    | __main__:trials:29 - Trial = 24167/30000 | Total reward = 41.85
2022-01-26 14:18:23.775 | DEBUG    | __main__:trials:24 - Trial = 24168/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.776 | DEBUG    | __main__:trials:29 - Trial = 24168/30000 | Total reward = 51.60
2022-01-26 14:18:23.780 | DEBUG    | __main__:trials:24 - Trial = 24169/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.781 | DEBUG    | __main__:trials:29 - Trial = 24169/30000 | Total reward = 38.21
2022-01-26 14:18:23.786 | DEBUG    | __main__:trials:24 - Trial = 24170/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.786 | DEBUG    | __main__:trials:29 - Trial = 24170/30000 | Total reward = 38.51
2022-01-26 14:18:23.790 | DEBUG    | __main__:trials:26 - Trial = 24171/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.792 | DEBUG    | __main__:trials:29 - Trial = 24171/30000 | Total reward = 22.11
2022-01-26 14:18:23.796 | DEBUG    | __main__:trials:24 - Trial = 24172/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.797 | DEBUG    | __main__:trials:29 - Trial = 24172/30000 | Total reward = 37.11
2022-01-26 14:18:23.801 | DEBUG    | __main__:trials:24 - Trial = 24173/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.803 | DEBUG    | __main__:trials:29 - Trial = 24173/30000 | Total reward = 40.05
2022-01-26 14:18:23.806 | DEBUG    | __main__:trials:24 - Trial = 24174/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.807 | DEBUG    | __main__:trials:29 - Trial = 24174/30000 | Total reward = 35.94
2022-01-26 14:18:23.811 | DEBUG    | __main__:trials:24 - Trial = 24175/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.812 | DEBUG    | __main__:trials:29 - Trial = 24175/30000 | Total reward = 36.18
2022-01-26 14:18:23.815 | DEBUG    | __main__:trials:24 - Trial = 24176/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.817 | DEBUG    | __main__:trials:29 - Trial = 24176/30000 | Total reward = 39.83
2022-01-26 14:18:23.820 | DEBUG    | __main__:trials:24 - Trial = 24177/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.822 | DEBUG    | __main__:trials:29 - Trial = 24177/30000 | Total reward = 38.51
2022-01-26 14:18:23.825 | DEBUG    | __main__:trials:24 - Trial = 24178/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.827 | DEBUG    | __main__:trials:29 - Trial = 24178/30000 | Total reward = 35.74
2022-01-26 14:18:23.830 | DEBUG    | __main__:trials:24 - Trial = 24179/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.832 | DEBUG    | __main__:trials:29 - Trial = 24179/30000 | Total reward = 37.84
2022-01-26 14:18:23.835 | DEBUG    | __main__:trials:24 - Trial = 24180/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.836 | DEBUG    | __main__:trials:29 - Trial = 24180/30000 | Total reward = 36.23
2022-01-26 14:18:23.840 | DEBUG    | __main__:trials:24 - Trial = 24181/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.841 | DEBUG    | __main__:trials:29 - Trial = 24181/30000 | Total reward = 35.14
2022-01-26 14:18:23.844 | DEBUG    | __main__:trials:24 - Trial = 24182/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.845 | DEBUG    | __main__:trials:29 - Trial = 24182/30000 | Total reward = 43.04
2022-01-26 14:18:23.849 | DEBUG    | __main__:trials:24 - Trial = 24183/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.849 | DEBUG    | __main__:trials:29 - Trial = 24183/30000 | Total reward = 34.45
2022-01-26 14:18:23.853 | DEBUG    | __main__:trials:24 - Trial = 24184/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.854 | DEBUG    | __main__:trials:29 - Trial = 24184/30000 | Total reward = 39.71
2022-01-26 14:18:23.858 | DEBUG    | __main__:trials:24 - Trial = 24185/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.859 | DEBUG    | __main__:trials:29 - Trial = 24185/30000 | Total reward = 37.81
2022-01-26 14:18:23.863 | DEBUG    | __main__:trials:24 - Trial = 24186/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.864 | DEBUG    | __main__:trials:29 - Trial = 24186/30000 | Total reward = 26.45
2022-01-26 14:18:23.868 | DEBUG    | __main__:trials:26 - Trial = 24187/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.869 | DEBUG    | __main__:trials:29 - Trial = 24187/30000 | Total reward = 16.39
2022-01-26 14:18:23.872 | DEBUG    | __main__:trials:24 - Trial = 24188/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.874 | DEBUG    | __main__:trials:29 - Trial = 24188/30000 | Total reward = 35.55
2022-01-26 14:18:23.877 | DEBUG    | __main__:trials:24 - Trial = 24189/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.879 | DEBUG    | __main__:trials:29 - Trial = 24189/30000 | Total reward = 49.18
2022-01-26 14:18:23.882 | DEBUG    | __main__:trials:26 - Trial = 24190/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.884 | DEBUG    | __main__:trials:29 - Trial = 24190/30000 | Total reward = 25.28
2022-01-26 14:18:23.888 | DEBUG    | __main__:trials:24 - Trial = 24191/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.890 | DEBUG    | __main__:trials:29 - Trial = 24191/30000 | Total reward = 39.46
2022-01-26 14:18:23.894 | DEBUG    | __main__:trials:24 - Trial = 24192/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.896 | DEBUG    | __main__:trials:29 - Trial = 24192/30000 | Total reward = 31.73
2022-01-26 14:18:23.899 | DEBUG    | __main__:trials:24 - Trial = 24193/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.901 | DEBUG    | __main__:trials:29 - Trial = 24193/30000 | Total reward = 32.87
2022-01-26 14:18:23.904 | DEBUG    | __main__:trials:26 - Trial = 24194/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.906 | DEBUG    | __main__:trials:29 - Trial = 24194/30000 | Total reward = 15.20
2022-01-26 14:18:23.908 | DEBUG    | __main__:trials:24 - Trial = 24195/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.910 | DEBUG    | __main__:trials:29 - Trial = 24195/30000 | Total reward = 49.16
2022-01-26 14:18:23.913 | DEBUG    | __main__:trials:24 - Trial = 24196/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.914 | DEBUG    | __main__:trials:29 - Trial = 24196/30000 | Total reward = 34.37
2022-01-26 14:18:23.917 | DEBUG    | __main__:trials:26 - Trial = 24197/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.918 | DEBUG    | __main__:trials:29 - Trial = 24197/30000 | Total reward = 19.27
2022-01-26 14:18:23.921 | DEBUG    | __main__:trials:24 - Trial = 24198/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.923 | DEBUG    | __main__:trials:29 - Trial = 24198/30000 | Total reward = 51.42
2022-01-26 14:18:23.925 | DEBUG    | __main__:trials:24 - Trial = 24199/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.926 | DEBUG    | __main__:trials:29 - Trial = 24199/30000 | Total reward = 37.85
2022-01-26 14:18:23.929 | DEBUG    | __main__:trials:24 - Trial = 24200/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.930 | DEBUG    | __main__:trials:29 - Trial = 24200/30000 | Total reward = 46.58
2022-01-26 14:18:23.933 | DEBUG    | __main__:trials:24 - Trial = 24201/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.934 | DEBUG    | __main__:trials:29 - Trial = 24201/30000 | Total reward = 32.85
2022-01-26 14:18:23.938 | DEBUG    | __main__:trials:24 - Trial = 24202/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.938 | DEBUG    | __main__:trials:29 - Trial = 24202/30000 | Total reward = 29.91
2022-01-26 14:18:23.942 | DEBUG    | __main__:trials:24 - Trial = 24203/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.943 | DEBUG    | __main__:trials:29 - Trial = 24203/30000 | Total reward = 34.50
2022-01-26 14:18:23.945 | DEBUG    | __main__:trials:26 - Trial = 24204/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.946 | DEBUG    | __main__:trials:29 - Trial = 24204/30000 | Total reward = 14.92
2022-01-26 14:18:23.949 | DEBUG    | __main__:trials:24 - Trial = 24205/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.950 | DEBUG    | __main__:trials:29 - Trial = 24205/30000 | Total reward = 39.04
2022-01-26 14:18:23.954 | DEBUG    | __main__:trials:24 - Trial = 24206/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.955 | DEBUG    | __main__:trials:29 - Trial = 24206/30000 | Total reward = 38.31
2022-01-26 14:18:23.958 | DEBUG    | __main__:trials:26 - Trial = 24207/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:23.960 | DEBUG    | __main__:trials:29 - Trial = 24207/30000 | Total reward = 30.69
2022-01-26 14:18:23.963 | DEBUG    | __main__:trials:24 - Trial = 24208/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.964 | DEBUG    | __main__:trials:29 - Trial = 24208/30000 | Total reward = 37.22
2022-01-26 14:18:23.967 | DEBUG    | __main__:trials:24 - Trial = 24209/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.969 | DEBUG    | __main__:trials:29 - Trial = 24209/30000 | Total reward = 35.84
2022-01-26 14:18:23.972 | DEBUG    | __main__:trials:24 - Trial = 24210/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.974 | DEBUG    | __main__:trials:29 - Trial = 24210/30000 | Total reward = 52.78
2022-01-26 14:18:23.978 | DEBUG    | __main__:trials:24 - Trial = 24211/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.979 | DEBUG    | __main__:trials:29 - Trial = 24211/30000 | Total reward = 19.47
2022-01-26 14:18:23.983 | DEBUG    | __main__:trials:24 - Trial = 24212/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.985 | DEBUG    | __main__:trials:29 - Trial = 24212/30000 | Total reward = 37.42
2022-01-26 14:18:23.988 | DEBUG    | __main__:trials:24 - Trial = 24213/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.990 | DEBUG    | __main__:trials:29 - Trial = 24213/30000 | Total reward = 38.37
2022-01-26 14:18:23.994 | DEBUG    | __main__:trials:24 - Trial = 24214/30000 | Max number of steps (20) reached
2022-01-26 14:18:23.995 | DEBUG    | __main__:trials:29 - Trial = 24214/30000 | Total reward = 34.40
2022-01-26 14:18:23.999 | DEBUG    | __main__:trials:24 - Trial = 24215/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.001 | DEBUG    | __main__:trials:29 - Trial = 24215/30000 | Total reward = 41.88
2022-01-26 14:18:24.004 | DEBUG    | __main__:trials:24 - Trial = 24216/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.006 | DEBUG    | __main__:trials:29 - Trial = 24216/30000 | Total reward = 58.04
2022-01-26 14:18:24.010 | DEBUG    | __main__:trials:24 - Trial = 24217/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.011 | DEBUG    | __main__:trials:29 - Trial = 24217/30000 | Total reward = 47.45
2022-01-26 14:18:24.015 | DEBUG    | __main__:trials:24 - Trial = 24218/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.017 | DEBUG    | __main__:trials:29 - Trial = 24218/30000 | Total reward = 35.35
2022-01-26 14:18:24.019 | DEBUG    | __main__:trials:26 - Trial = 24219/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.021 | DEBUG    | __main__:trials:29 - Trial = 24219/30000 | Total reward = 16.32
2022-01-26 14:18:24.024 | DEBUG    | __main__:trials:24 - Trial = 24220/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.026 | DEBUG    | __main__:trials:29 - Trial = 24220/30000 | Total reward = 23.30
2022-01-26 14:18:24.029 | DEBUG    | __main__:trials:24 - Trial = 24221/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.031 | DEBUG    | __main__:trials:29 - Trial = 24221/30000 | Total reward = 33.41
2022-01-26 14:18:24.034 | DEBUG    | __main__:trials:24 - Trial = 24222/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.036 | DEBUG    | __main__:trials:29 - Trial = 24222/30000 | Total reward = 42.10
2022-01-26 14:18:24.040 | DEBUG    | __main__:trials:24 - Trial = 24223/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.041 | DEBUG    | __main__:trials:29 - Trial = 24223/30000 | Total reward = 43.61
2022-01-26 14:18:24.045 | DEBUG    | __main__:trials:24 - Trial = 24224/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.046 | DEBUG    | __main__:trials:29 - Trial = 24224/30000 | Total reward = 42.56
2022-01-26 14:18:24.050 | DEBUG    | __main__:trials:24 - Trial = 24225/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.052 | DEBUG    | __main__:trials:29 - Trial = 24225/30000 | Total reward = 18.90
2022-01-26 14:18:24.055 | DEBUG    | __main__:trials:24 - Trial = 24226/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.056 | DEBUG    | __main__:trials:29 - Trial = 24226/30000 | Total reward = 37.77
2022-01-26 14:18:24.060 | DEBUG    | __main__:trials:24 - Trial = 24227/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.062 | DEBUG    | __main__:trials:29 - Trial = 24227/30000 | Total reward = 36.29
2022-01-26 14:18:24.066 | DEBUG    | __main__:trials:24 - Trial = 24228/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.066 | DEBUG    | __main__:trials:29 - Trial = 24228/30000 | Total reward = 52.75
2022-01-26 14:18:24.072 | DEBUG    | __main__:trials:24 - Trial = 24229/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.073 | DEBUG    | __main__:trials:29 - Trial = 24229/30000 | Total reward = 39.98
2022-01-26 14:18:24.076 | DEBUG    | __main__:trials:26 - Trial = 24230/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.078 | DEBUG    | __main__:trials:29 - Trial = 24230/30000 | Total reward = 16.51
2022-01-26 14:18:24.082 | DEBUG    | __main__:trials:24 - Trial = 24231/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.083 | DEBUG    | __main__:trials:29 - Trial = 24231/30000 | Total reward = 44.37
2022-01-26 14:18:24.086 | DEBUG    | __main__:trials:24 - Trial = 24232/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.088 | DEBUG    | __main__:trials:29 - Trial = 24232/30000 | Total reward = 37.06
2022-01-26 14:18:24.091 | DEBUG    | __main__:trials:24 - Trial = 24233/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.093 | DEBUG    | __main__:trials:29 - Trial = 24233/30000 | Total reward = 44.41
2022-01-26 14:18:24.096 | DEBUG    | __main__:trials:24 - Trial = 24234/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.098 | DEBUG    | __main__:trials:29 - Trial = 24234/30000 | Total reward = 32.40
2022-01-26 14:18:24.101 | DEBUG    | __main__:trials:26 - Trial = 24235/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.103 | DEBUG    | __main__:trials:29 - Trial = 24235/30000 | Total reward = 14.96
2022-01-26 14:18:24.107 | DEBUG    | __main__:trials:24 - Trial = 24236/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.108 | DEBUG    | __main__:trials:29 - Trial = 24236/30000 | Total reward = 35.38
2022-01-26 14:18:24.111 | DEBUG    | __main__:trials:24 - Trial = 24237/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.113 | DEBUG    | __main__:trials:29 - Trial = 24237/30000 | Total reward = 38.30
2022-01-26 14:18:24.117 | DEBUG    | __main__:trials:24 - Trial = 24238/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.118 | DEBUG    | __main__:trials:29 - Trial = 24238/30000 | Total reward = 33.12
2022-01-26 14:18:24.121 | DEBUG    | __main__:trials:26 - Trial = 24239/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.121 | DEBUG    | __main__:trials:29 - Trial = 24239/30000 | Total reward = 11.64
2022-01-26 14:18:24.125 | DEBUG    | __main__:trials:26 - Trial = 24240/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.126 | DEBUG    | __main__:trials:29 - Trial = 24240/30000 | Total reward = 29.18
2022-01-26 14:18:24.130 | DEBUG    | __main__:trials:24 - Trial = 24241/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.131 | DEBUG    | __main__:trials:29 - Trial = 24241/30000 | Total reward = 34.77
2022-01-26 14:18:24.135 | DEBUG    | __main__:trials:24 - Trial = 24242/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.137 | DEBUG    | __main__:trials:29 - Trial = 24242/30000 | Total reward = 47.63
2022-01-26 14:18:24.140 | DEBUG    | __main__:trials:24 - Trial = 24243/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.142 | DEBUG    | __main__:trials:29 - Trial = 24243/30000 | Total reward = 47.65
2022-01-26 14:18:24.146 | DEBUG    | __main__:trials:24 - Trial = 24244/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.147 | DEBUG    | __main__:trials:29 - Trial = 24244/30000 | Total reward = 38.70
2022-01-26 14:18:24.149 | DEBUG    | __main__:trials:26 - Trial = 24245/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.150 | DEBUG    | __main__:trials:29 - Trial = 24245/30000 | Total reward = 15.00
2022-01-26 14:18:24.153 | DEBUG    | __main__:trials:26 - Trial = 24246/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.153 | DEBUG    | __main__:trials:29 - Trial = 24246/30000 | Total reward = 18.94
2022-01-26 14:18:24.157 | DEBUG    | __main__:trials:24 - Trial = 24247/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.158 | DEBUG    | __main__:trials:29 - Trial = 24247/30000 | Total reward = 36.54
2022-01-26 14:18:24.161 | DEBUG    | __main__:trials:24 - Trial = 24248/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.162 | DEBUG    | __main__:trials:29 - Trial = 24248/30000 | Total reward = 41.29
2022-01-26 14:18:24.166 | DEBUG    | __main__:trials:24 - Trial = 24249/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.168 | DEBUG    | __main__:trials:29 - Trial = 24249/30000 | Total reward = 37.02
2022-01-26 14:18:24.172 | DEBUG    | __main__:trials:24 - Trial = 24250/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.173 | DEBUG    | __main__:trials:29 - Trial = 24250/30000 | Total reward = 37.05
2022-01-26 14:18:24.177 | DEBUG    | __main__:trials:24 - Trial = 24251/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.178 | DEBUG    | __main__:trials:29 - Trial = 24251/30000 | Total reward = 54.18
2022-01-26 14:18:24.182 | DEBUG    | __main__:trials:24 - Trial = 24252/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.184 | DEBUG    | __main__:trials:29 - Trial = 24252/30000 | Total reward = 34.27
2022-01-26 14:18:24.188 | DEBUG    | __main__:trials:24 - Trial = 24253/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.189 | DEBUG    | __main__:trials:29 - Trial = 24253/30000 | Total reward = 39.24
2022-01-26 14:18:24.192 | DEBUG    | __main__:trials:24 - Trial = 24254/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.194 | DEBUG    | __main__:trials:29 - Trial = 24254/30000 | Total reward = 35.04
2022-01-26 14:18:24.198 | DEBUG    | __main__:trials:24 - Trial = 24255/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.199 | DEBUG    | __main__:trials:29 - Trial = 24255/30000 | Total reward = 36.49
2022-01-26 14:18:24.203 | DEBUG    | __main__:trials:24 - Trial = 24256/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.204 | DEBUG    | __main__:trials:29 - Trial = 24256/30000 | Total reward = 35.45
2022-01-26 14:18:24.208 | DEBUG    | __main__:trials:24 - Trial = 24257/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.210 | DEBUG    | __main__:trials:29 - Trial = 24257/30000 | Total reward = 37.09
2022-01-26 14:18:24.214 | DEBUG    | __main__:trials:24 - Trial = 24258/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.215 | DEBUG    | __main__:trials:29 - Trial = 24258/30000 | Total reward = 36.09
2022-01-26 14:18:24.219 | DEBUG    | __main__:trials:24 - Trial = 24259/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.221 | DEBUG    | __main__:trials:29 - Trial = 24259/30000 | Total reward = 43.40
2022-01-26 14:18:24.224 | DEBUG    | __main__:trials:24 - Trial = 24260/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.226 | DEBUG    | __main__:trials:29 - Trial = 24260/30000 | Total reward = 37.64
2022-01-26 14:18:24.229 | DEBUG    | __main__:trials:24 - Trial = 24261/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.230 | DEBUG    | __main__:trials:29 - Trial = 24261/30000 | Total reward = 36.86
2022-01-26 14:18:24.234 | DEBUG    | __main__:trials:24 - Trial = 24262/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.234 | DEBUG    | __main__:trials:29 - Trial = 24262/30000 | Total reward = 31.67
2022-01-26 14:18:24.239 | DEBUG    | __main__:trials:24 - Trial = 24263/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.240 | DEBUG    | __main__:trials:29 - Trial = 24263/30000 | Total reward = 29.24
2022-01-26 14:18:24.243 | DEBUG    | __main__:trials:26 - Trial = 24264/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.244 | DEBUG    | __main__:trials:29 - Trial = 24264/30000 | Total reward = 16.79
2022-01-26 14:18:24.247 | DEBUG    | __main__:trials:26 - Trial = 24265/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.248 | DEBUG    | __main__:trials:29 - Trial = 24265/30000 | Total reward = 10.11
2022-01-26 14:18:24.252 | DEBUG    | __main__:trials:24 - Trial = 24266/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.254 | DEBUG    | __main__:trials:29 - Trial = 24266/30000 | Total reward = 46.20
2022-01-26 14:18:24.258 | DEBUG    | __main__:trials:24 - Trial = 24267/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.259 | DEBUG    | __main__:trials:29 - Trial = 24267/30000 | Total reward = 37.81
2022-01-26 14:18:24.262 | DEBUG    | __main__:trials:24 - Trial = 24268/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.264 | DEBUG    | __main__:trials:29 - Trial = 24268/30000 | Total reward = 35.18
2022-01-26 14:18:24.268 | DEBUG    | __main__:trials:24 - Trial = 24269/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.269 | DEBUG    | __main__:trials:29 - Trial = 24269/30000 | Total reward = 32.47
2022-01-26 14:18:24.273 | DEBUG    | __main__:trials:24 - Trial = 24270/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.275 | DEBUG    | __main__:trials:29 - Trial = 24270/30000 | Total reward = 35.80
2022-01-26 14:18:24.277 | DEBUG    | __main__:trials:24 - Trial = 24271/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.279 | DEBUG    | __main__:trials:29 - Trial = 24271/30000 | Total reward = 38.23
2022-01-26 14:18:24.283 | DEBUG    | __main__:trials:24 - Trial = 24272/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.285 | DEBUG    | __main__:trials:29 - Trial = 24272/30000 | Total reward = 31.89
2022-01-26 14:18:24.288 | DEBUG    | __main__:trials:24 - Trial = 24273/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.290 | DEBUG    | __main__:trials:29 - Trial = 24273/30000 | Total reward = 34.49
2022-01-26 14:18:24.293 | DEBUG    | __main__:trials:24 - Trial = 24274/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.295 | DEBUG    | __main__:trials:29 - Trial = 24274/30000 | Total reward = 34.97
2022-01-26 14:18:24.299 | DEBUG    | __main__:trials:24 - Trial = 24275/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.300 | DEBUG    | __main__:trials:29 - Trial = 24275/30000 | Total reward = 38.29
2022-01-26 14:18:24.303 | DEBUG    | __main__:trials:24 - Trial = 24276/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.305 | DEBUG    | __main__:trials:29 - Trial = 24276/30000 | Total reward = 37.92
2022-01-26 14:18:24.309 | DEBUG    | __main__:trials:24 - Trial = 24277/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.311 | DEBUG    | __main__:trials:29 - Trial = 24277/30000 | Total reward = 42.70
2022-01-26 14:18:24.315 | DEBUG    | __main__:trials:24 - Trial = 24278/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.316 | DEBUG    | __main__:trials:29 - Trial = 24278/30000 | Total reward = 44.98
2022-01-26 14:18:24.320 | DEBUG    | __main__:trials:24 - Trial = 24279/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.321 | DEBUG    | __main__:trials:29 - Trial = 24279/30000 | Total reward = 36.03
2022-01-26 14:18:24.324 | DEBUG    | __main__:trials:24 - Trial = 24280/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.326 | DEBUG    | __main__:trials:29 - Trial = 24280/30000 | Total reward = 37.43
2022-01-26 14:18:24.330 | DEBUG    | __main__:trials:24 - Trial = 24281/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.331 | DEBUG    | __main__:trials:29 - Trial = 24281/30000 | Total reward = 42.81
2022-01-26 14:18:24.335 | DEBUG    | __main__:trials:24 - Trial = 24282/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.337 | DEBUG    | __main__:trials:29 - Trial = 24282/30000 | Total reward = 52.06
2022-01-26 14:18:24.340 | DEBUG    | __main__:trials:24 - Trial = 24283/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.342 | DEBUG    | __main__:trials:29 - Trial = 24283/30000 | Total reward = 36.19
2022-01-26 14:18:24.345 | DEBUG    | __main__:trials:24 - Trial = 24284/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.347 | DEBUG    | __main__:trials:29 - Trial = 24284/30000 | Total reward = 35.51
2022-01-26 14:18:24.350 | DEBUG    | __main__:trials:26 - Trial = 24285/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.352 | DEBUG    | __main__:trials:29 - Trial = 24285/30000 | Total reward = 28.93
2022-01-26 14:18:24.356 | DEBUG    | __main__:trials:24 - Trial = 24286/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.357 | DEBUG    | __main__:trials:29 - Trial = 24286/30000 | Total reward = 37.94
2022-01-26 14:18:24.359 | DEBUG    | __main__:trials:26 - Trial = 24287/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.361 | DEBUG    | __main__:trials:29 - Trial = 24287/30000 | Total reward = 10.11
2022-01-26 14:18:24.365 | DEBUG    | __main__:trials:24 - Trial = 24288/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.366 | DEBUG    | __main__:trials:29 - Trial = 24288/30000 | Total reward = 33.35
2022-01-26 14:18:24.369 | DEBUG    | __main__:trials:24 - Trial = 24289/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.370 | DEBUG    | __main__:trials:29 - Trial = 24289/30000 | Total reward = 26.41
2022-01-26 14:18:24.373 | DEBUG    | __main__:trials:26 - Trial = 24290/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.374 | DEBUG    | __main__:trials:29 - Trial = 24290/30000 | Total reward = 28.91
2022-01-26 14:18:24.378 | DEBUG    | __main__:trials:24 - Trial = 24291/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.378 | DEBUG    | __main__:trials:29 - Trial = 24291/30000 | Total reward = 37.23
2022-01-26 14:18:24.382 | DEBUG    | __main__:trials:24 - Trial = 24292/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.384 | DEBUG    | __main__:trials:29 - Trial = 24292/30000 | Total reward = 37.40
2022-01-26 14:18:24.387 | DEBUG    | __main__:trials:24 - Trial = 24293/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.389 | DEBUG    | __main__:trials:29 - Trial = 24293/30000 | Total reward = 35.88
2022-01-26 14:18:24.392 | DEBUG    | __main__:trials:24 - Trial = 24294/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.394 | DEBUG    | __main__:trials:29 - Trial = 24294/30000 | Total reward = 32.99
2022-01-26 14:18:24.397 | DEBUG    | __main__:trials:24 - Trial = 24295/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.398 | DEBUG    | __main__:trials:29 - Trial = 24295/30000 | Total reward = 35.65
2022-01-26 14:18:24.402 | DEBUG    | __main__:trials:24 - Trial = 24296/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.404 | DEBUG    | __main__:trials:29 - Trial = 24296/30000 | Total reward = 36.81
2022-01-26 14:18:24.408 | DEBUG    | __main__:trials:24 - Trial = 24297/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.409 | DEBUG    | __main__:trials:29 - Trial = 24297/30000 | Total reward = 35.83
2022-01-26 14:18:24.412 | DEBUG    | __main__:trials:24 - Trial = 24298/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.414 | DEBUG    | __main__:trials:29 - Trial = 24298/30000 | Total reward = 33.20
2022-01-26 14:18:24.418 | DEBUG    | __main__:trials:24 - Trial = 24299/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.418 | DEBUG    | __main__:trials:29 - Trial = 24299/30000 | Total reward = 52.59
2022-01-26 14:18:24.423 | DEBUG    | __main__:trials:24 - Trial = 24300/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.424 | DEBUG    | __main__:trials:29 - Trial = 24300/30000 | Total reward = 32.10
2022-01-26 14:18:24.427 | DEBUG    | __main__:trials:26 - Trial = 24301/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.429 | DEBUG    | __main__:trials:29 - Trial = 24301/30000 | Total reward = 10.79
2022-01-26 14:18:24.432 | DEBUG    | __main__:trials:24 - Trial = 24302/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.434 | DEBUG    | __main__:trials:29 - Trial = 24302/30000 | Total reward = 53.01
2022-01-26 14:18:24.438 | DEBUG    | __main__:trials:24 - Trial = 24303/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.439 | DEBUG    | __main__:trials:29 - Trial = 24303/30000 | Total reward = 36.61
2022-01-26 14:18:24.443 | DEBUG    | __main__:trials:24 - Trial = 24304/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.445 | DEBUG    | __main__:trials:29 - Trial = 24304/30000 | Total reward = 37.23
2022-01-26 14:18:24.448 | DEBUG    | __main__:trials:24 - Trial = 24305/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.450 | DEBUG    | __main__:trials:29 - Trial = 24305/30000 | Total reward = 36.52
2022-01-26 14:18:24.453 | DEBUG    | __main__:trials:24 - Trial = 24306/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.455 | DEBUG    | __main__:trials:29 - Trial = 24306/30000 | Total reward = 36.98
2022-01-26 14:18:24.458 | DEBUG    | __main__:trials:26 - Trial = 24307/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.460 | DEBUG    | __main__:trials:29 - Trial = 24307/30000 | Total reward = 29.36
2022-01-26 14:18:24.463 | DEBUG    | __main__:trials:24 - Trial = 24308/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.465 | DEBUG    | __main__:trials:29 - Trial = 24308/30000 | Total reward = 31.15
2022-01-26 14:18:24.468 | DEBUG    | __main__:trials:24 - Trial = 24309/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.469 | DEBUG    | __main__:trials:29 - Trial = 24309/30000 | Total reward = 33.86
2022-01-26 14:18:24.472 | DEBUG    | __main__:trials:24 - Trial = 24310/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.473 | DEBUG    | __main__:trials:29 - Trial = 24310/30000 | Total reward = 46.27
2022-01-26 14:18:24.476 | DEBUG    | __main__:trials:24 - Trial = 24311/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.477 | DEBUG    | __main__:trials:29 - Trial = 24311/30000 | Total reward = 36.80
2022-01-26 14:18:24.481 | DEBUG    | __main__:trials:24 - Trial = 24312/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.481 | DEBUG    | __main__:trials:29 - Trial = 24312/30000 | Total reward = 36.44
2022-01-26 14:18:24.485 | DEBUG    | __main__:trials:24 - Trial = 24313/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.486 | DEBUG    | __main__:trials:29 - Trial = 24313/30000 | Total reward = 35.31
2022-01-26 14:18:24.490 | DEBUG    | __main__:trials:24 - Trial = 24314/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.491 | DEBUG    | __main__:trials:29 - Trial = 24314/30000 | Total reward = 39.67
2022-01-26 14:18:24.494 | DEBUG    | __main__:trials:24 - Trial = 24315/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.495 | DEBUG    | __main__:trials:29 - Trial = 24315/30000 | Total reward = 36.81
2022-01-26 14:18:24.498 | DEBUG    | __main__:trials:24 - Trial = 24316/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.499 | DEBUG    | __main__:trials:29 - Trial = 24316/30000 | Total reward = 33.95
2022-01-26 14:18:24.502 | DEBUG    | __main__:trials:24 - Trial = 24317/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.503 | DEBUG    | __main__:trials:29 - Trial = 24317/30000 | Total reward = 36.11
2022-01-26 14:18:24.506 | DEBUG    | __main__:trials:24 - Trial = 24318/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.508 | DEBUG    | __main__:trials:29 - Trial = 24318/30000 | Total reward = 35.04
2022-01-26 14:18:24.511 | DEBUG    | __main__:trials:24 - Trial = 24319/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.513 | DEBUG    | __main__:trials:29 - Trial = 24319/30000 | Total reward = 6.71
2022-01-26 14:18:24.516 | DEBUG    | __main__:trials:24 - Trial = 24320/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.519 | DEBUG    | __main__:trials:29 - Trial = 24320/30000 | Total reward = 36.10
2022-01-26 14:18:24.523 | DEBUG    | __main__:trials:24 - Trial = 24321/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.523 | DEBUG    | __main__:trials:29 - Trial = 24321/30000 | Total reward = 37.23
2022-01-26 14:18:24.527 | DEBUG    | __main__:trials:24 - Trial = 24322/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.529 | DEBUG    | __main__:trials:29 - Trial = 24322/30000 | Total reward = 36.95
2022-01-26 14:18:24.533 | DEBUG    | __main__:trials:24 - Trial = 24323/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.534 | DEBUG    | __main__:trials:29 - Trial = 24323/30000 | Total reward = 38.17
2022-01-26 14:18:24.537 | DEBUG    | __main__:trials:24 - Trial = 24324/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.538 | DEBUG    | __main__:trials:29 - Trial = 24324/30000 | Total reward = 34.72
2022-01-26 14:18:24.541 | DEBUG    | __main__:trials:24 - Trial = 24325/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.543 | DEBUG    | __main__:trials:29 - Trial = 24325/30000 | Total reward = 21.83
2022-01-26 14:18:24.546 | DEBUG    | __main__:trials:24 - Trial = 24326/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.548 | DEBUG    | __main__:trials:29 - Trial = 24326/30000 | Total reward = 16.20
2022-01-26 14:18:24.550 | DEBUG    | __main__:trials:26 - Trial = 24327/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.552 | DEBUG    | __main__:trials:29 - Trial = 24327/30000 | Total reward = 11.18
2022-01-26 14:18:24.555 | DEBUG    | __main__:trials:24 - Trial = 24328/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.557 | DEBUG    | __main__:trials:29 - Trial = 24328/30000 | Total reward = 45.96
2022-01-26 14:18:24.560 | DEBUG    | __main__:trials:24 - Trial = 24329/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.562 | DEBUG    | __main__:trials:29 - Trial = 24329/30000 | Total reward = 36.14
2022-01-26 14:18:24.565 | DEBUG    | __main__:trials:24 - Trial = 24330/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.567 | DEBUG    | __main__:trials:29 - Trial = 24330/30000 | Total reward = 38.13
2022-01-26 14:18:24.570 | DEBUG    | __main__:trials:24 - Trial = 24331/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.572 | DEBUG    | __main__:trials:29 - Trial = 24331/30000 | Total reward = 49.91
2022-01-26 14:18:24.576 | DEBUG    | __main__:trials:24 - Trial = 24332/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.577 | DEBUG    | __main__:trials:29 - Trial = 24332/30000 | Total reward = 22.46
2022-01-26 14:18:24.580 | DEBUG    | __main__:trials:24 - Trial = 24333/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.582 | DEBUG    | __main__:trials:29 - Trial = 24333/30000 | Total reward = 37.79
2022-01-26 14:18:24.586 | DEBUG    | __main__:trials:26 - Trial = 24334/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.587 | DEBUG    | __main__:trials:29 - Trial = 24334/30000 | Total reward = 23.98
2022-01-26 14:18:24.590 | DEBUG    | __main__:trials:24 - Trial = 24335/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.592 | DEBUG    | __main__:trials:29 - Trial = 24335/30000 | Total reward = 33.62
2022-01-26 14:18:24.595 | DEBUG    | __main__:trials:26 - Trial = 24336/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.597 | DEBUG    | __main__:trials:29 - Trial = 24336/30000 | Total reward = 22.11
2022-01-26 14:18:24.601 | DEBUG    | __main__:trials:24 - Trial = 24337/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.601 | DEBUG    | __main__:trials:29 - Trial = 24337/30000 | Total reward = 35.31
2022-01-26 14:18:24.605 | DEBUG    | __main__:trials:24 - Trial = 24338/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.605 | DEBUG    | __main__:trials:29 - Trial = 24338/30000 | Total reward = 34.97
2022-01-26 14:18:24.609 | DEBUG    | __main__:trials:24 - Trial = 24339/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.611 | DEBUG    | __main__:trials:29 - Trial = 24339/30000 | Total reward = 38.62
2022-01-26 14:18:24.614 | DEBUG    | __main__:trials:24 - Trial = 24340/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.616 | DEBUG    | __main__:trials:29 - Trial = 24340/30000 | Total reward = 43.78
2022-01-26 14:18:24.619 | DEBUG    | __main__:trials:24 - Trial = 24341/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.621 | DEBUG    | __main__:trials:29 - Trial = 24341/30000 | Total reward = 28.27
2022-01-26 14:18:24.624 | DEBUG    | __main__:trials:24 - Trial = 24342/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.626 | DEBUG    | __main__:trials:29 - Trial = 24342/30000 | Total reward = 31.48
2022-01-26 14:18:24.630 | DEBUG    | __main__:trials:24 - Trial = 24343/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.632 | DEBUG    | __main__:trials:29 - Trial = 24343/30000 | Total reward = 47.18
2022-01-26 14:18:24.634 | DEBUG    | __main__:trials:26 - Trial = 24344/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.636 | DEBUG    | __main__:trials:29 - Trial = 24344/30000 | Total reward = 21.74
2022-01-26 14:18:24.639 | DEBUG    | __main__:trials:24 - Trial = 24345/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.641 | DEBUG    | __main__:trials:29 - Trial = 24345/30000 | Total reward = 35.26
2022-01-26 14:18:24.645 | DEBUG    | __main__:trials:24 - Trial = 24346/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.647 | DEBUG    | __main__:trials:29 - Trial = 24346/30000 | Total reward = 37.65
2022-01-26 14:18:24.650 | DEBUG    | __main__:trials:24 - Trial = 24347/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.652 | DEBUG    | __main__:trials:29 - Trial = 24347/30000 | Total reward = 38.39
2022-01-26 14:18:24.656 | DEBUG    | __main__:trials:24 - Trial = 24348/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.658 | DEBUG    | __main__:trials:29 - Trial = 24348/30000 | Total reward = 40.05
2022-01-26 14:18:24.662 | DEBUG    | __main__:trials:24 - Trial = 24349/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.663 | DEBUG    | __main__:trials:29 - Trial = 24349/30000 | Total reward = 59.27
2022-01-26 14:18:24.667 | DEBUG    | __main__:trials:24 - Trial = 24350/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.669 | DEBUG    | __main__:trials:29 - Trial = 24350/30000 | Total reward = 27.69
2022-01-26 14:18:24.672 | DEBUG    | __main__:trials:26 - Trial = 24351/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.674 | DEBUG    | __main__:trials:29 - Trial = 24351/30000 | Total reward = 27.68
2022-01-26 14:18:24.678 | DEBUG    | __main__:trials:24 - Trial = 24352/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.678 | DEBUG    | __main__:trials:29 - Trial = 24352/30000 | Total reward = 29.98
2022-01-26 14:18:24.683 | DEBUG    | __main__:trials:24 - Trial = 24353/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.683 | DEBUG    | __main__:trials:29 - Trial = 24353/30000 | Total reward = 32.96
2022-01-26 14:18:24.688 | DEBUG    | __main__:trials:24 - Trial = 24354/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.689 | DEBUG    | __main__:trials:29 - Trial = 24354/30000 | Total reward = 32.15
2022-01-26 14:18:24.692 | DEBUG    | __main__:trials:24 - Trial = 24355/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.694 | DEBUG    | __main__:trials:29 - Trial = 24355/30000 | Total reward = 34.61
2022-01-26 14:18:24.698 | DEBUG    | __main__:trials:24 - Trial = 24356/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.699 | DEBUG    | __main__:trials:29 - Trial = 24356/30000 | Total reward = 30.95
2022-01-26 14:18:24.703 | DEBUG    | __main__:trials:24 - Trial = 24357/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.704 | DEBUG    | __main__:trials:29 - Trial = 24357/30000 | Total reward = 35.89
2022-01-26 14:18:24.707 | DEBUG    | __main__:trials:26 - Trial = 24358/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.708 | DEBUG    | __main__:trials:29 - Trial = 24358/30000 | Total reward = 18.97
2022-01-26 14:18:24.712 | DEBUG    | __main__:trials:24 - Trial = 24359/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.714 | DEBUG    | __main__:trials:29 - Trial = 24359/30000 | Total reward = 35.83
2022-01-26 14:18:24.717 | DEBUG    | __main__:trials:24 - Trial = 24360/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.719 | DEBUG    | __main__:trials:29 - Trial = 24360/30000 | Total reward = 36.21
2022-01-26 14:18:24.722 | DEBUG    | __main__:trials:24 - Trial = 24361/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.724 | DEBUG    | __main__:trials:29 - Trial = 24361/30000 | Total reward = 44.04
2022-01-26 14:18:24.727 | DEBUG    | __main__:trials:24 - Trial = 24362/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.729 | DEBUG    | __main__:trials:29 - Trial = 24362/30000 | Total reward = 29.67
2022-01-26 14:18:24.733 | DEBUG    | __main__:trials:24 - Trial = 24363/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.735 | DEBUG    | __main__:trials:29 - Trial = 24363/30000 | Total reward = 34.04
2022-01-26 14:18:24.738 | DEBUG    | __main__:trials:24 - Trial = 24364/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.740 | DEBUG    | __main__:trials:29 - Trial = 24364/30000 | Total reward = 47.95
2022-01-26 14:18:24.743 | DEBUG    | __main__:trials:24 - Trial = 24365/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.745 | DEBUG    | __main__:trials:29 - Trial = 24365/30000 | Total reward = 33.99
2022-01-26 14:18:24.748 | DEBUG    | __main__:trials:24 - Trial = 24366/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.750 | DEBUG    | __main__:trials:29 - Trial = 24366/30000 | Total reward = 34.05
2022-01-26 14:18:24.754 | DEBUG    | __main__:trials:24 - Trial = 24367/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.755 | DEBUG    | __main__:trials:29 - Trial = 24367/30000 | Total reward = 33.11
2022-01-26 14:18:24.759 | DEBUG    | __main__:trials:24 - Trial = 24368/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.761 | DEBUG    | __main__:trials:29 - Trial = 24368/30000 | Total reward = 52.29
2022-01-26 14:18:24.764 | DEBUG    | __main__:trials:24 - Trial = 24369/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.765 | DEBUG    | __main__:trials:29 - Trial = 24369/30000 | Total reward = 47.96
2022-01-26 14:18:24.769 | DEBUG    | __main__:trials:24 - Trial = 24370/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.770 | DEBUG    | __main__:trials:29 - Trial = 24370/30000 | Total reward = 35.68
2022-01-26 14:18:24.774 | DEBUG    | __main__:trials:24 - Trial = 24371/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.776 | DEBUG    | __main__:trials:29 - Trial = 24371/30000 | Total reward = 36.56
2022-01-26 14:18:24.780 | DEBUG    | __main__:trials:24 - Trial = 24372/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.781 | DEBUG    | __main__:trials:29 - Trial = 24372/30000 | Total reward = 31.84
2022-01-26 14:18:24.785 | DEBUG    | __main__:trials:24 - Trial = 24373/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.787 | DEBUG    | __main__:trials:29 - Trial = 24373/30000 | Total reward = 36.22
2022-01-26 14:18:24.789 | DEBUG    | __main__:trials:24 - Trial = 24374/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.791 | DEBUG    | __main__:trials:29 - Trial = 24374/30000 | Total reward = 36.51
2022-01-26 14:18:24.794 | DEBUG    | __main__:trials:24 - Trial = 24375/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.796 | DEBUG    | __main__:trials:29 - Trial = 24375/30000 | Total reward = 55.04
2022-01-26 14:18:24.799 | DEBUG    | __main__:trials:24 - Trial = 24376/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.801 | DEBUG    | __main__:trials:29 - Trial = 24376/30000 | Total reward = 25.42
2022-01-26 14:18:24.804 | DEBUG    | __main__:trials:24 - Trial = 24377/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.806 | DEBUG    | __main__:trials:29 - Trial = 24377/30000 | Total reward = 34.22
2022-01-26 14:18:24.809 | DEBUG    | __main__:trials:26 - Trial = 24378/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.810 | DEBUG    | __main__:trials:29 - Trial = 24378/30000 | Total reward = 26.83
2022-01-26 14:18:24.813 | DEBUG    | __main__:trials:24 - Trial = 24379/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.815 | DEBUG    | __main__:trials:29 - Trial = 24379/30000 | Total reward = 36.91
2022-01-26 14:18:24.817 | DEBUG    | __main__:trials:24 - Trial = 24380/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.819 | DEBUG    | __main__:trials:29 - Trial = 24380/30000 | Total reward = 36.51
2022-01-26 14:18:24.823 | DEBUG    | __main__:trials:24 - Trial = 24381/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.825 | DEBUG    | __main__:trials:29 - Trial = 24381/30000 | Total reward = 25.48
2022-01-26 14:18:24.829 | DEBUG    | __main__:trials:24 - Trial = 24382/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.830 | DEBUG    | __main__:trials:29 - Trial = 24382/30000 | Total reward = 32.22
2022-01-26 14:18:24.833 | DEBUG    | __main__:trials:24 - Trial = 24383/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.834 | DEBUG    | __main__:trials:29 - Trial = 24383/30000 | Total reward = 35.25
2022-01-26 14:18:24.837 | DEBUG    | __main__:trials:24 - Trial = 24384/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.839 | DEBUG    | __main__:trials:29 - Trial = 24384/30000 | Total reward = 39.71
2022-01-26 14:18:24.842 | DEBUG    | __main__:trials:24 - Trial = 24385/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.842 | DEBUG    | __main__:trials:29 - Trial = 24385/30000 | Total reward = 34.59
2022-01-26 14:18:24.846 | DEBUG    | __main__:trials:24 - Trial = 24386/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.846 | DEBUG    | __main__:trials:29 - Trial = 24386/30000 | Total reward = 37.59
2022-01-26 14:18:24.850 | DEBUG    | __main__:trials:26 - Trial = 24387/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.851 | DEBUG    | __main__:trials:29 - Trial = 24387/30000 | Total reward = 25.14
2022-01-26 14:18:24.855 | DEBUG    | __main__:trials:24 - Trial = 24388/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.857 | DEBUG    | __main__:trials:29 - Trial = 24388/30000 | Total reward = 36.90
2022-01-26 14:18:24.860 | DEBUG    | __main__:trials:24 - Trial = 24389/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.862 | DEBUG    | __main__:trials:29 - Trial = 24389/30000 | Total reward = 37.30
2022-01-26 14:18:24.865 | DEBUG    | __main__:trials:24 - Trial = 24390/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.867 | DEBUG    | __main__:trials:29 - Trial = 24390/30000 | Total reward = 51.39
2022-01-26 14:18:24.871 | DEBUG    | __main__:trials:24 - Trial = 24391/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.873 | DEBUG    | __main__:trials:29 - Trial = 24391/30000 | Total reward = 36.83
2022-01-26 14:18:24.876 | DEBUG    | __main__:trials:24 - Trial = 24392/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.878 | DEBUG    | __main__:trials:29 - Trial = 24392/30000 | Total reward = 32.64
2022-01-26 14:18:24.882 | DEBUG    | __main__:trials:24 - Trial = 24393/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.883 | DEBUG    | __main__:trials:29 - Trial = 24393/30000 | Total reward = 26.79
2022-01-26 14:18:24.886 | DEBUG    | __main__:trials:26 - Trial = 24394/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:24.888 | DEBUG    | __main__:trials:29 - Trial = 24394/30000 | Total reward = 19.29
2022-01-26 14:18:24.892 | DEBUG    | __main__:trials:24 - Trial = 24395/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.894 | DEBUG    | __main__:trials:29 - Trial = 24395/30000 | Total reward = 32.85
2022-01-26 14:18:24.897 | DEBUG    | __main__:trials:24 - Trial = 24396/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.899 | DEBUG    | __main__:trials:29 - Trial = 24396/30000 | Total reward = 37.90
2022-01-26 14:18:24.903 | DEBUG    | __main__:trials:24 - Trial = 24397/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.905 | DEBUG    | __main__:trials:29 - Trial = 24397/30000 | Total reward = 33.89
2022-01-26 14:18:24.908 | DEBUG    | __main__:trials:24 - Trial = 24398/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.909 | DEBUG    | __main__:trials:29 - Trial = 24398/30000 | Total reward = 32.79
2022-01-26 14:18:24.912 | DEBUG    | __main__:trials:24 - Trial = 24399/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.914 | DEBUG    | __main__:trials:29 - Trial = 24399/30000 | Total reward = 34.12
2022-01-26 14:18:24.918 | DEBUG    | __main__:trials:24 - Trial = 24400/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.919 | DEBUG    | __main__:trials:29 - Trial = 24400/30000 | Total reward = 37.91
2022-01-26 14:18:24.923 | DEBUG    | __main__:trials:24 - Trial = 24401/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.924 | DEBUG    | __main__:trials:29 - Trial = 24401/30000 | Total reward = 39.08
2022-01-26 14:18:24.928 | DEBUG    | __main__:trials:24 - Trial = 24402/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.929 | DEBUG    | __main__:trials:29 - Trial = 24402/30000 | Total reward = 45.06
2022-01-26 14:18:24.933 | DEBUG    | __main__:trials:24 - Trial = 24403/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.935 | DEBUG    | __main__:trials:29 - Trial = 24403/30000 | Total reward = 35.08
2022-01-26 14:18:24.938 | DEBUG    | __main__:trials:24 - Trial = 24404/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.940 | DEBUG    | __main__:trials:29 - Trial = 24404/30000 | Total reward = 31.74
2022-01-26 14:18:24.944 | DEBUG    | __main__:trials:24 - Trial = 24405/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.945 | DEBUG    | __main__:trials:29 - Trial = 24405/30000 | Total reward = 59.95
2022-01-26 14:18:24.949 | DEBUG    | __main__:trials:24 - Trial = 24406/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.950 | DEBUG    | __main__:trials:29 - Trial = 24406/30000 | Total reward = 35.26
2022-01-26 14:18:24.953 | DEBUG    | __main__:trials:24 - Trial = 24407/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.954 | DEBUG    | __main__:trials:29 - Trial = 24407/30000 | Total reward = 34.78
2022-01-26 14:18:24.959 | DEBUG    | __main__:trials:24 - Trial = 24408/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.960 | DEBUG    | __main__:trials:29 - Trial = 24408/30000 | Total reward = 32.77
2022-01-26 14:18:24.964 | DEBUG    | __main__:trials:24 - Trial = 24409/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.966 | DEBUG    | __main__:trials:29 - Trial = 24409/30000 | Total reward = 43.88
2022-01-26 14:18:24.969 | DEBUG    | __main__:trials:24 - Trial = 24410/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.970 | DEBUG    | __main__:trials:29 - Trial = 24410/30000 | Total reward = 36.39
2022-01-26 14:18:24.974 | DEBUG    | __main__:trials:24 - Trial = 24411/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.975 | DEBUG    | __main__:trials:29 - Trial = 24411/30000 | Total reward = 51.68
2022-01-26 14:18:24.979 | DEBUG    | __main__:trials:24 - Trial = 24412/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.981 | DEBUG    | __main__:trials:29 - Trial = 24412/30000 | Total reward = 38.46
2022-01-26 14:18:24.984 | DEBUG    | __main__:trials:24 - Trial = 24413/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.986 | DEBUG    | __main__:trials:29 - Trial = 24413/30000 | Total reward = 31.89
2022-01-26 14:18:24.989 | DEBUG    | __main__:trials:24 - Trial = 24414/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.991 | DEBUG    | __main__:trials:29 - Trial = 24414/30000 | Total reward = 38.32
2022-01-26 14:18:24.995 | DEBUG    | __main__:trials:24 - Trial = 24415/30000 | Max number of steps (20) reached
2022-01-26 14:18:24.995 | DEBUG    | __main__:trials:29 - Trial = 24415/30000 | Total reward = 31.46
2022-01-26 14:18:24.999 | DEBUG    | __main__:trials:24 - Trial = 24416/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.000 | DEBUG    | __main__:trials:29 - Trial = 24416/30000 | Total reward = 38.15
2022-01-26 14:18:25.004 | DEBUG    | __main__:trials:24 - Trial = 24417/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.006 | DEBUG    | __main__:trials:29 - Trial = 24417/30000 | Total reward = 41.64
2022-01-26 14:18:25.009 | DEBUG    | __main__:trials:24 - Trial = 24418/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.011 | DEBUG    | __main__:trials:29 - Trial = 24418/30000 | Total reward = 49.61
2022-01-26 14:18:25.015 | DEBUG    | __main__:trials:24 - Trial = 24419/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.016 | DEBUG    | __main__:trials:29 - Trial = 24419/30000 | Total reward = 36.26
2022-01-26 14:18:25.019 | DEBUG    | __main__:trials:24 - Trial = 24420/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.021 | DEBUG    | __main__:trials:29 - Trial = 24420/30000 | Total reward = 35.91
2022-01-26 14:18:25.025 | DEBUG    | __main__:trials:24 - Trial = 24421/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.027 | DEBUG    | __main__:trials:29 - Trial = 24421/30000 | Total reward = 39.86
2022-01-26 14:18:25.030 | DEBUG    | __main__:trials:24 - Trial = 24422/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.032 | DEBUG    | __main__:trials:29 - Trial = 24422/30000 | Total reward = 30.21
2022-01-26 14:18:25.035 | DEBUG    | __main__:trials:24 - Trial = 24423/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.037 | DEBUG    | __main__:trials:29 - Trial = 24423/30000 | Total reward = 32.17
2022-01-26 14:18:25.040 | DEBUG    | __main__:trials:24 - Trial = 24424/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.041 | DEBUG    | __main__:trials:29 - Trial = 24424/30000 | Total reward = 34.20
2022-01-26 14:18:25.044 | DEBUG    | __main__:trials:24 - Trial = 24425/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.045 | DEBUG    | __main__:trials:29 - Trial = 24425/30000 | Total reward = 36.30
2022-01-26 14:18:25.049 | DEBUG    | __main__:trials:24 - Trial = 24426/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.050 | DEBUG    | __main__:trials:29 - Trial = 24426/30000 | Total reward = 30.13
2022-01-26 14:18:25.054 | DEBUG    | __main__:trials:24 - Trial = 24427/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.055 | DEBUG    | __main__:trials:29 - Trial = 24427/30000 | Total reward = 51.14
2022-01-26 14:18:25.058 | DEBUG    | __main__:trials:24 - Trial = 24428/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.060 | DEBUG    | __main__:trials:29 - Trial = 24428/30000 | Total reward = 53.44
2022-01-26 14:18:25.063 | DEBUG    | __main__:trials:24 - Trial = 24429/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.065 | DEBUG    | __main__:trials:29 - Trial = 24429/30000 | Total reward = 35.14
2022-01-26 14:18:25.068 | DEBUG    | __main__:trials:24 - Trial = 24430/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.071 | DEBUG    | __main__:trials:29 - Trial = 24430/30000 | Total reward = 41.21
2022-01-26 14:18:25.074 | DEBUG    | __main__:trials:24 - Trial = 24431/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.076 | DEBUG    | __main__:trials:29 - Trial = 24431/30000 | Total reward = 47.08
2022-01-26 14:18:25.080 | DEBUG    | __main__:trials:24 - Trial = 24432/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.081 | DEBUG    | __main__:trials:29 - Trial = 24432/30000 | Total reward = 38.39
2022-01-26 14:18:25.085 | DEBUG    | __main__:trials:24 - Trial = 24433/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.086 | DEBUG    | __main__:trials:29 - Trial = 24433/30000 | Total reward = 39.47
2022-01-26 14:18:25.090 | DEBUG    | __main__:trials:24 - Trial = 24434/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.092 | DEBUG    | __main__:trials:29 - Trial = 24434/30000 | Total reward = 38.61
2022-01-26 14:18:25.096 | DEBUG    | __main__:trials:24 - Trial = 24435/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.097 | DEBUG    | __main__:trials:29 - Trial = 24435/30000 | Total reward = 35.75
2022-01-26 14:18:25.101 | DEBUG    | __main__:trials:24 - Trial = 24436/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.103 | DEBUG    | __main__:trials:29 - Trial = 24436/30000 | Total reward = 38.53
2022-01-26 14:18:25.106 | DEBUG    | __main__:trials:24 - Trial = 24437/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.108 | DEBUG    | __main__:trials:29 - Trial = 24437/30000 | Total reward = 40.46
2022-01-26 14:18:25.112 | DEBUG    | __main__:trials:24 - Trial = 24438/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.113 | DEBUG    | __main__:trials:29 - Trial = 24438/30000 | Total reward = 36.51
2022-01-26 14:18:25.117 | DEBUG    | __main__:trials:26 - Trial = 24439/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.118 | DEBUG    | __main__:trials:29 - Trial = 24439/30000 | Total reward = 19.38
2022-01-26 14:18:25.122 | DEBUG    | __main__:trials:24 - Trial = 24440/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.123 | DEBUG    | __main__:trials:29 - Trial = 24440/30000 | Total reward = 35.58
2022-01-26 14:18:25.126 | DEBUG    | __main__:trials:24 - Trial = 24441/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.127 | DEBUG    | __main__:trials:29 - Trial = 24441/30000 | Total reward = 34.75
2022-01-26 14:18:25.130 | DEBUG    | __main__:trials:24 - Trial = 24442/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.132 | DEBUG    | __main__:trials:29 - Trial = 24442/30000 | Total reward = 37.81
2022-01-26 14:18:25.136 | DEBUG    | __main__:trials:24 - Trial = 24443/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.137 | DEBUG    | __main__:trials:29 - Trial = 24443/30000 | Total reward = 48.77
2022-01-26 14:18:25.141 | DEBUG    | __main__:trials:24 - Trial = 24444/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.142 | DEBUG    | __main__:trials:29 - Trial = 24444/30000 | Total reward = 36.79
2022-01-26 14:18:25.146 | DEBUG    | __main__:trials:24 - Trial = 24445/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.148 | DEBUG    | __main__:trials:29 - Trial = 24445/30000 | Total reward = 52.72
2022-01-26 14:18:25.151 | DEBUG    | __main__:trials:26 - Trial = 24446/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.153 | DEBUG    | __main__:trials:29 - Trial = 24446/30000 | Total reward = 34.26
2022-01-26 14:18:25.157 | DEBUG    | __main__:trials:24 - Trial = 24447/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.157 | DEBUG    | __main__:trials:29 - Trial = 24447/30000 | Total reward = 32.85
2022-01-26 14:18:25.161 | DEBUG    | __main__:trials:24 - Trial = 24448/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.162 | DEBUG    | __main__:trials:29 - Trial = 24448/30000 | Total reward = 30.83
2022-01-26 14:18:25.165 | DEBUG    | __main__:trials:24 - Trial = 24449/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.167 | DEBUG    | __main__:trials:29 - Trial = 24449/30000 | Total reward = 37.95
2022-01-26 14:18:25.170 | DEBUG    | __main__:trials:24 - Trial = 24450/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.172 | DEBUG    | __main__:trials:29 - Trial = 24450/30000 | Total reward = 47.26
2022-01-26 14:18:25.175 | DEBUG    | __main__:trials:26 - Trial = 24451/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.177 | DEBUG    | __main__:trials:29 - Trial = 24451/30000 | Total reward = 9.68
2022-01-26 14:18:25.180 | DEBUG    | __main__:trials:24 - Trial = 24452/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.182 | DEBUG    | __main__:trials:29 - Trial = 24452/30000 | Total reward = 37.27
2022-01-26 14:18:25.186 | DEBUG    | __main__:trials:24 - Trial = 24453/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.187 | DEBUG    | __main__:trials:29 - Trial = 24453/30000 | Total reward = 29.14
2022-01-26 14:18:25.191 | DEBUG    | __main__:trials:24 - Trial = 24454/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.192 | DEBUG    | __main__:trials:29 - Trial = 24454/30000 | Total reward = 32.41
2022-01-26 14:18:25.195 | DEBUG    | __main__:trials:24 - Trial = 24455/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.196 | DEBUG    | __main__:trials:29 - Trial = 24455/30000 | Total reward = 31.62
2022-01-26 14:18:25.199 | DEBUG    | __main__:trials:24 - Trial = 24456/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.200 | DEBUG    | __main__:trials:29 - Trial = 24456/30000 | Total reward = 41.84
2022-01-26 14:18:25.204 | DEBUG    | __main__:trials:24 - Trial = 24457/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.205 | DEBUG    | __main__:trials:29 - Trial = 24457/30000 | Total reward = 39.41
2022-01-26 14:18:25.208 | DEBUG    | __main__:trials:24 - Trial = 24458/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.210 | DEBUG    | __main__:trials:29 - Trial = 24458/30000 | Total reward = 47.84
2022-01-26 14:18:25.213 | DEBUG    | __main__:trials:24 - Trial = 24459/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.214 | DEBUG    | __main__:trials:29 - Trial = 24459/30000 | Total reward = 42.63
2022-01-26 14:18:25.217 | DEBUG    | __main__:trials:26 - Trial = 24460/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.218 | DEBUG    | __main__:trials:29 - Trial = 24460/30000 | Total reward = 21.67
2022-01-26 14:18:25.221 | DEBUG    | __main__:trials:24 - Trial = 24461/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.223 | DEBUG    | __main__:trials:29 - Trial = 24461/30000 | Total reward = 35.08
2022-01-26 14:18:25.225 | DEBUG    | __main__:trials:26 - Trial = 24462/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.226 | DEBUG    | __main__:trials:29 - Trial = 24462/30000 | Total reward = 10.11
2022-01-26 14:18:25.229 | DEBUG    | __main__:trials:24 - Trial = 24463/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.230 | DEBUG    | __main__:trials:29 - Trial = 24463/30000 | Total reward = 50.68
2022-01-26 14:18:25.233 | DEBUG    | __main__:trials:24 - Trial = 24464/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.235 | DEBUG    | __main__:trials:29 - Trial = 24464/30000 | Total reward = 37.84
2022-01-26 14:18:25.238 | DEBUG    | __main__:trials:24 - Trial = 24465/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.240 | DEBUG    | __main__:trials:29 - Trial = 24465/30000 | Total reward = 36.44
2022-01-26 14:18:25.243 | DEBUG    | __main__:trials:24 - Trial = 24466/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.243 | DEBUG    | __main__:trials:29 - Trial = 24466/30000 | Total reward = 51.27
2022-01-26 14:18:25.247 | DEBUG    | __main__:trials:24 - Trial = 24467/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.248 | DEBUG    | __main__:trials:29 - Trial = 24467/30000 | Total reward = 40.61
2022-01-26 14:18:25.252 | DEBUG    | __main__:trials:24 - Trial = 24468/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.254 | DEBUG    | __main__:trials:29 - Trial = 24468/30000 | Total reward = 34.59
2022-01-26 14:18:25.257 | DEBUG    | __main__:trials:24 - Trial = 24469/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.259 | DEBUG    | __main__:trials:29 - Trial = 24469/30000 | Total reward = 39.20
2022-01-26 14:18:25.262 | DEBUG    | __main__:trials:24 - Trial = 24470/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.264 | DEBUG    | __main__:trials:29 - Trial = 24470/30000 | Total reward = 40.80
2022-01-26 14:18:25.268 | DEBUG    | __main__:trials:24 - Trial = 24471/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.269 | DEBUG    | __main__:trials:29 - Trial = 24471/30000 | Total reward = 30.16
2022-01-26 14:18:25.273 | DEBUG    | __main__:trials:24 - Trial = 24472/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.274 | DEBUG    | __main__:trials:29 - Trial = 24472/30000 | Total reward = 39.31
2022-01-26 14:18:25.278 | DEBUG    | __main__:trials:24 - Trial = 24473/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.280 | DEBUG    | __main__:trials:29 - Trial = 24473/30000 | Total reward = 35.72
2022-01-26 14:18:25.284 | DEBUG    | __main__:trials:24 - Trial = 24474/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.286 | DEBUG    | __main__:trials:29 - Trial = 24474/30000 | Total reward = 36.11
2022-01-26 14:18:25.289 | DEBUG    | __main__:trials:24 - Trial = 24475/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.291 | DEBUG    | __main__:trials:29 - Trial = 24475/30000 | Total reward = 38.31
2022-01-26 14:18:25.295 | DEBUG    | __main__:trials:24 - Trial = 24476/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.296 | DEBUG    | __main__:trials:29 - Trial = 24476/30000 | Total reward = 36.01
2022-01-26 14:18:25.299 | DEBUG    | __main__:trials:24 - Trial = 24477/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.301 | DEBUG    | __main__:trials:29 - Trial = 24477/30000 | Total reward = 33.64
2022-01-26 14:18:25.305 | DEBUG    | __main__:trials:24 - Trial = 24478/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.306 | DEBUG    | __main__:trials:29 - Trial = 24478/30000 | Total reward = 37.24
2022-01-26 14:18:25.310 | DEBUG    | __main__:trials:24 - Trial = 24479/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.312 | DEBUG    | __main__:trials:29 - Trial = 24479/30000 | Total reward = 37.99
2022-01-26 14:18:25.316 | DEBUG    | __main__:trials:24 - Trial = 24480/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.317 | DEBUG    | __main__:trials:29 - Trial = 24480/30000 | Total reward = 45.34
2022-01-26 14:18:25.320 | DEBUG    | __main__:trials:24 - Trial = 24481/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.322 | DEBUG    | __main__:trials:29 - Trial = 24481/30000 | Total reward = 38.74
2022-01-26 14:18:25.325 | DEBUG    | __main__:trials:24 - Trial = 24482/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.327 | DEBUG    | __main__:trials:29 - Trial = 24482/30000 | Total reward = 33.17
2022-01-26 14:18:25.331 | DEBUG    | __main__:trials:24 - Trial = 24483/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.333 | DEBUG    | __main__:trials:29 - Trial = 24483/30000 | Total reward = 33.86
2022-01-26 14:18:25.336 | DEBUG    | __main__:trials:24 - Trial = 24484/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.338 | DEBUG    | __main__:trials:29 - Trial = 24484/30000 | Total reward = 35.63
2022-01-26 14:18:25.341 | DEBUG    | __main__:trials:26 - Trial = 24485/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.342 | DEBUG    | __main__:trials:29 - Trial = 24485/30000 | Total reward = 9.11
2022-01-26 14:18:25.345 | DEBUG    | __main__:trials:26 - Trial = 24486/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.347 | DEBUG    | __main__:trials:29 - Trial = 24486/30000 | Total reward = 16.87
2022-01-26 14:18:25.351 | DEBUG    | __main__:trials:24 - Trial = 24487/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.353 | DEBUG    | __main__:trials:29 - Trial = 24487/30000 | Total reward = 37.93
2022-01-26 14:18:25.356 | DEBUG    | __main__:trials:24 - Trial = 24488/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.358 | DEBUG    | __main__:trials:29 - Trial = 24488/30000 | Total reward = 29.75
2022-01-26 14:18:25.361 | DEBUG    | __main__:trials:24 - Trial = 24489/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.362 | DEBUG    | __main__:trials:29 - Trial = 24489/30000 | Total reward = 35.21
2022-01-26 14:18:25.366 | DEBUG    | __main__:trials:24 - Trial = 24490/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.368 | DEBUG    | __main__:trials:29 - Trial = 24490/30000 | Total reward = 47.20
2022-01-26 14:18:25.371 | DEBUG    | __main__:trials:24 - Trial = 24491/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.373 | DEBUG    | __main__:trials:29 - Trial = 24491/30000 | Total reward = 43.01
2022-01-26 14:18:25.377 | DEBUG    | __main__:trials:24 - Trial = 24492/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.378 | DEBUG    | __main__:trials:29 - Trial = 24492/30000 | Total reward = 37.75
2022-01-26 14:18:25.381 | DEBUG    | __main__:trials:24 - Trial = 24493/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.382 | DEBUG    | __main__:trials:29 - Trial = 24493/30000 | Total reward = 36.14
2022-01-26 14:18:25.385 | DEBUG    | __main__:trials:24 - Trial = 24494/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.386 | DEBUG    | __main__:trials:29 - Trial = 24494/30000 | Total reward = 37.79
2022-01-26 14:18:25.389 | DEBUG    | __main__:trials:24 - Trial = 24495/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.390 | DEBUG    | __main__:trials:29 - Trial = 24495/30000 | Total reward = 36.18
2022-01-26 14:18:25.394 | DEBUG    | __main__:trials:24 - Trial = 24496/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.395 | DEBUG    | __main__:trials:29 - Trial = 24496/30000 | Total reward = 36.15
2022-01-26 14:18:25.399 | DEBUG    | __main__:trials:24 - Trial = 24497/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.401 | DEBUG    | __main__:trials:29 - Trial = 24497/30000 | Total reward = 51.07
2022-01-26 14:18:25.404 | DEBUG    | __main__:trials:24 - Trial = 24498/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.406 | DEBUG    | __main__:trials:29 - Trial = 24498/30000 | Total reward = 37.32
2022-01-26 14:18:25.410 | DEBUG    | __main__:trials:24 - Trial = 24499/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.411 | DEBUG    | __main__:trials:29 - Trial = 24499/30000 | Total reward = 31.66
2022-01-26 14:18:25.414 | DEBUG    | __main__:trials:24 - Trial = 24500/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.416 | DEBUG    | __main__:trials:29 - Trial = 24500/30000 | Total reward = 42.66
2022-01-26 14:18:25.420 | DEBUG    | __main__:trials:26 - Trial = 24501/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.422 | DEBUG    | __main__:trials:29 - Trial = 24501/30000 | Total reward = 30.68
2022-01-26 14:18:25.426 | DEBUG    | __main__:trials:24 - Trial = 24502/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.428 | DEBUG    | __main__:trials:29 - Trial = 24502/30000 | Total reward = 33.34
2022-01-26 14:18:25.431 | DEBUG    | __main__:trials:24 - Trial = 24503/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.433 | DEBUG    | __main__:trials:29 - Trial = 24503/30000 | Total reward = 35.09
2022-01-26 14:18:25.437 | DEBUG    | __main__:trials:24 - Trial = 24504/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.438 | DEBUG    | __main__:trials:29 - Trial = 24504/30000 | Total reward = 46.84
2022-01-26 14:18:25.442 | DEBUG    | __main__:trials:24 - Trial = 24505/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.444 | DEBUG    | __main__:trials:29 - Trial = 24505/30000 | Total reward = 34.76
2022-01-26 14:18:25.447 | DEBUG    | __main__:trials:24 - Trial = 24506/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.449 | DEBUG    | __main__:trials:29 - Trial = 24506/30000 | Total reward = 31.41
2022-01-26 14:18:25.453 | DEBUG    | __main__:trials:24 - Trial = 24507/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.454 | DEBUG    | __main__:trials:29 - Trial = 24507/30000 | Total reward = 42.58
2022-01-26 14:18:25.458 | DEBUG    | __main__:trials:26 - Trial = 24508/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.460 | DEBUG    | __main__:trials:29 - Trial = 24508/30000 | Total reward = 23.13
2022-01-26 14:18:25.464 | DEBUG    | __main__:trials:24 - Trial = 24509/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.465 | DEBUG    | __main__:trials:29 - Trial = 24509/30000 | Total reward = 34.38
2022-01-26 14:18:25.469 | DEBUG    | __main__:trials:24 - Trial = 24510/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.470 | DEBUG    | __main__:trials:29 - Trial = 24510/30000 | Total reward = 37.45
2022-01-26 14:18:25.474 | DEBUG    | __main__:trials:24 - Trial = 24511/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.475 | DEBUG    | __main__:trials:29 - Trial = 24511/30000 | Total reward = 35.23
2022-01-26 14:18:25.479 | DEBUG    | __main__:trials:24 - Trial = 24512/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.480 | DEBUG    | __main__:trials:29 - Trial = 24512/30000 | Total reward = 37.45
2022-01-26 14:18:25.484 | DEBUG    | __main__:trials:24 - Trial = 24513/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.486 | DEBUG    | __main__:trials:29 - Trial = 24513/30000 | Total reward = 40.09
2022-01-26 14:18:25.490 | DEBUG    | __main__:trials:24 - Trial = 24514/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.491 | DEBUG    | __main__:trials:29 - Trial = 24514/30000 | Total reward = 37.63
2022-01-26 14:18:25.495 | DEBUG    | __main__:trials:24 - Trial = 24515/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.496 | DEBUG    | __main__:trials:29 - Trial = 24515/30000 | Total reward = 38.21
2022-01-26 14:18:25.500 | DEBUG    | __main__:trials:24 - Trial = 24516/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.502 | DEBUG    | __main__:trials:29 - Trial = 24516/30000 | Total reward = 32.93
2022-01-26 14:18:25.505 | DEBUG    | __main__:trials:24 - Trial = 24517/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.507 | DEBUG    | __main__:trials:29 - Trial = 24517/30000 | Total reward = 37.65
2022-01-26 14:18:25.510 | DEBUG    | __main__:trials:24 - Trial = 24518/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.512 | DEBUG    | __main__:trials:29 - Trial = 24518/30000 | Total reward = 51.61
2022-01-26 14:18:25.516 | DEBUG    | __main__:trials:24 - Trial = 24519/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.516 | DEBUG    | __main__:trials:29 - Trial = 24519/30000 | Total reward = 37.70
2022-01-26 14:18:25.520 | DEBUG    | __main__:trials:24 - Trial = 24520/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.522 | DEBUG    | __main__:trials:29 - Trial = 24520/30000 | Total reward = 38.13
2022-01-26 14:18:25.526 | DEBUG    | __main__:trials:24 - Trial = 24521/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.527 | DEBUG    | __main__:trials:29 - Trial = 24521/30000 | Total reward = 55.75
2022-01-26 14:18:25.531 | DEBUG    | __main__:trials:24 - Trial = 24522/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.533 | DEBUG    | __main__:trials:29 - Trial = 24522/30000 | Total reward = 39.97
2022-01-26 14:18:25.537 | DEBUG    | __main__:trials:24 - Trial = 24523/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.538 | DEBUG    | __main__:trials:29 - Trial = 24523/30000 | Total reward = 34.44
2022-01-26 14:18:25.541 | DEBUG    | __main__:trials:24 - Trial = 24524/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.542 | DEBUG    | __main__:trials:29 - Trial = 24524/30000 | Total reward = 41.42
2022-01-26 14:18:25.545 | DEBUG    | __main__:trials:26 - Trial = 24525/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.547 | DEBUG    | __main__:trials:29 - Trial = 24525/30000 | Total reward = 17.12
2022-01-26 14:18:25.550 | DEBUG    | __main__:trials:24 - Trial = 24526/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.551 | DEBUG    | __main__:trials:29 - Trial = 24526/30000 | Total reward = 50.83
2022-01-26 14:18:25.555 | DEBUG    | __main__:trials:24 - Trial = 24527/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.557 | DEBUG    | __main__:trials:29 - Trial = 24527/30000 | Total reward = 37.81
2022-01-26 14:18:25.560 | DEBUG    | __main__:trials:24 - Trial = 24528/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.562 | DEBUG    | __main__:trials:29 - Trial = 24528/30000 | Total reward = 38.36
2022-01-26 14:18:25.566 | DEBUG    | __main__:trials:24 - Trial = 24529/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.567 | DEBUG    | __main__:trials:29 - Trial = 24529/30000 | Total reward = 38.06
2022-01-26 14:18:25.571 | DEBUG    | __main__:trials:24 - Trial = 24530/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.573 | DEBUG    | __main__:trials:29 - Trial = 24530/30000 | Total reward = 38.44
2022-01-26 14:18:25.576 | DEBUG    | __main__:trials:24 - Trial = 24531/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.578 | DEBUG    | __main__:trials:29 - Trial = 24531/30000 | Total reward = 38.82
2022-01-26 14:18:25.582 | DEBUG    | __main__:trials:24 - Trial = 24532/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.583 | DEBUG    | __main__:trials:29 - Trial = 24532/30000 | Total reward = 31.39
2022-01-26 14:18:25.587 | DEBUG    | __main__:trials:24 - Trial = 24533/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.588 | DEBUG    | __main__:trials:29 - Trial = 24533/30000 | Total reward = 54.66
2022-01-26 14:18:25.592 | DEBUG    | __main__:trials:24 - Trial = 24534/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.593 | DEBUG    | __main__:trials:29 - Trial = 24534/30000 | Total reward = 46.95
2022-01-26 14:18:25.597 | DEBUG    | __main__:trials:24 - Trial = 24535/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.598 | DEBUG    | __main__:trials:29 - Trial = 24535/30000 | Total reward = 28.62
2022-01-26 14:18:25.602 | DEBUG    | __main__:trials:24 - Trial = 24536/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.604 | DEBUG    | __main__:trials:29 - Trial = 24536/30000 | Total reward = 36.39
2022-01-26 14:18:25.608 | DEBUG    | __main__:trials:24 - Trial = 24537/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.609 | DEBUG    | __main__:trials:29 - Trial = 24537/30000 | Total reward = 38.02
2022-01-26 14:18:25.612 | DEBUG    | __main__:trials:24 - Trial = 24538/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.614 | DEBUG    | __main__:trials:29 - Trial = 24538/30000 | Total reward = 42.48
2022-01-26 14:18:25.618 | DEBUG    | __main__:trials:24 - Trial = 24539/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.620 | DEBUG    | __main__:trials:29 - Trial = 24539/30000 | Total reward = 38.23
2022-01-26 14:18:25.623 | DEBUG    | __main__:trials:24 - Trial = 24540/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.624 | DEBUG    | __main__:trials:29 - Trial = 24540/30000 | Total reward = 49.12
2022-01-26 14:18:25.627 | DEBUG    | __main__:trials:24 - Trial = 24541/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.628 | DEBUG    | __main__:trials:29 - Trial = 24541/30000 | Total reward = 37.64
2022-01-26 14:18:25.632 | DEBUG    | __main__:trials:24 - Trial = 24542/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.633 | DEBUG    | __main__:trials:29 - Trial = 24542/30000 | Total reward = 37.02
2022-01-26 14:18:25.637 | DEBUG    | __main__:trials:24 - Trial = 24543/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.638 | DEBUG    | __main__:trials:29 - Trial = 24543/30000 | Total reward = 36.47
2022-01-26 14:18:25.642 | DEBUG    | __main__:trials:24 - Trial = 24544/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.643 | DEBUG    | __main__:trials:29 - Trial = 24544/30000 | Total reward = 37.81
2022-01-26 14:18:25.647 | DEBUG    | __main__:trials:26 - Trial = 24545/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.649 | DEBUG    | __main__:trials:29 - Trial = 24545/30000 | Total reward = 21.73
2022-01-26 14:18:25.652 | DEBUG    | __main__:trials:24 - Trial = 24546/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.654 | DEBUG    | __main__:trials:29 - Trial = 24546/30000 | Total reward = 50.36
2022-01-26 14:18:25.658 | DEBUG    | __main__:trials:24 - Trial = 24547/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.659 | DEBUG    | __main__:trials:29 - Trial = 24547/30000 | Total reward = 36.85
2022-01-26 14:18:25.663 | DEBUG    | __main__:trials:24 - Trial = 24548/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.665 | DEBUG    | __main__:trials:29 - Trial = 24548/30000 | Total reward = 33.87
2022-01-26 14:18:25.667 | DEBUG    | __main__:trials:26 - Trial = 24549/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.668 | DEBUG    | __main__:trials:29 - Trial = 24549/30000 | Total reward = 7.96
2022-01-26 14:18:25.672 | DEBUG    | __main__:trials:24 - Trial = 24550/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.673 | DEBUG    | __main__:trials:29 - Trial = 24550/30000 | Total reward = 36.14
2022-01-26 14:18:25.677 | DEBUG    | __main__:trials:24 - Trial = 24551/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.679 | DEBUG    | __main__:trials:29 - Trial = 24551/30000 | Total reward = 33.76
2022-01-26 14:18:25.683 | DEBUG    | __main__:trials:24 - Trial = 24552/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.684 | DEBUG    | __main__:trials:29 - Trial = 24552/30000 | Total reward = 35.93
2022-01-26 14:18:25.688 | DEBUG    | __main__:trials:24 - Trial = 24553/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.689 | DEBUG    | __main__:trials:29 - Trial = 24553/30000 | Total reward = 30.05
2022-01-26 14:18:25.693 | DEBUG    | __main__:trials:24 - Trial = 24554/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.695 | DEBUG    | __main__:trials:29 - Trial = 24554/30000 | Total reward = 30.24
2022-01-26 14:18:25.698 | DEBUG    | __main__:trials:26 - Trial = 24555/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.700 | DEBUG    | __main__:trials:29 - Trial = 24555/30000 | Total reward = 21.38
2022-01-26 14:18:25.703 | DEBUG    | __main__:trials:24 - Trial = 24556/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.705 | DEBUG    | __main__:trials:29 - Trial = 24556/30000 | Total reward = 31.83
2022-01-26 14:18:25.708 | DEBUG    | __main__:trials:24 - Trial = 24557/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.710 | DEBUG    | __main__:trials:29 - Trial = 24557/30000 | Total reward = 36.84
2022-01-26 14:18:25.712 | DEBUG    | __main__:trials:26 - Trial = 24558/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.713 | DEBUG    | __main__:trials:29 - Trial = 24558/30000 | Total reward = 23.87
2022-01-26 14:18:25.717 | DEBUG    | __main__:trials:24 - Trial = 24559/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.719 | DEBUG    | __main__:trials:29 - Trial = 24559/30000 | Total reward = 41.10
2022-01-26 14:18:25.722 | DEBUG    | __main__:trials:24 - Trial = 24560/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.724 | DEBUG    | __main__:trials:29 - Trial = 24560/30000 | Total reward = 47.73
2022-01-26 14:18:25.727 | DEBUG    | __main__:trials:24 - Trial = 24561/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.729 | DEBUG    | __main__:trials:29 - Trial = 24561/30000 | Total reward = 37.00
2022-01-26 14:18:25.732 | DEBUG    | __main__:trials:24 - Trial = 24562/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.734 | DEBUG    | __main__:trials:29 - Trial = 24562/30000 | Total reward = 47.70
2022-01-26 14:18:25.737 | DEBUG    | __main__:trials:24 - Trial = 24563/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.738 | DEBUG    | __main__:trials:29 - Trial = 24563/30000 | Total reward = 37.87
2022-01-26 14:18:25.741 | DEBUG    | __main__:trials:24 - Trial = 24564/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.742 | DEBUG    | __main__:trials:29 - Trial = 24564/30000 | Total reward = 37.11
2022-01-26 14:18:25.746 | DEBUG    | __main__:trials:24 - Trial = 24565/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.747 | DEBUG    | __main__:trials:29 - Trial = 24565/30000 | Total reward = 43.69
2022-01-26 14:18:25.751 | DEBUG    | __main__:trials:24 - Trial = 24566/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.753 | DEBUG    | __main__:trials:29 - Trial = 24566/30000 | Total reward = 34.03
2022-01-26 14:18:25.756 | DEBUG    | __main__:trials:24 - Trial = 24567/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.758 | DEBUG    | __main__:trials:29 - Trial = 24567/30000 | Total reward = 29.40
2022-01-26 14:18:25.762 | DEBUG    | __main__:trials:24 - Trial = 24568/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.763 | DEBUG    | __main__:trials:29 - Trial = 24568/30000 | Total reward = 34.22
2022-01-26 14:18:25.766 | DEBUG    | __main__:trials:26 - Trial = 24569/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.768 | DEBUG    | __main__:trials:29 - Trial = 24569/30000 | Total reward = 16.74
2022-01-26 14:18:25.770 | DEBUG    | __main__:trials:26 - Trial = 24570/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.772 | DEBUG    | __main__:trials:29 - Trial = 24570/30000 | Total reward = 10.11
2022-01-26 14:18:25.775 | DEBUG    | __main__:trials:24 - Trial = 24571/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.777 | DEBUG    | __main__:trials:29 - Trial = 24571/30000 | Total reward = 39.14
2022-01-26 14:18:25.780 | DEBUG    | __main__:trials:24 - Trial = 24572/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.782 | DEBUG    | __main__:trials:29 - Trial = 24572/30000 | Total reward = 33.91
2022-01-26 14:18:25.786 | DEBUG    | __main__:trials:24 - Trial = 24573/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.787 | DEBUG    | __main__:trials:29 - Trial = 24573/30000 | Total reward = 40.18
2022-01-26 14:18:25.791 | DEBUG    | __main__:trials:24 - Trial = 24574/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.792 | DEBUG    | __main__:trials:29 - Trial = 24574/30000 | Total reward = 38.91
2022-01-26 14:18:25.796 | DEBUG    | __main__:trials:24 - Trial = 24575/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.797 | DEBUG    | __main__:trials:29 - Trial = 24575/30000 | Total reward = 25.55
2022-01-26 14:18:25.801 | DEBUG    | __main__:trials:24 - Trial = 24576/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.803 | DEBUG    | __main__:trials:29 - Trial = 24576/30000 | Total reward = 33.85
2022-01-26 14:18:25.806 | DEBUG    | __main__:trials:24 - Trial = 24577/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.807 | DEBUG    | __main__:trials:29 - Trial = 24577/30000 | Total reward = 38.13
2022-01-26 14:18:25.811 | DEBUG    | __main__:trials:24 - Trial = 24578/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.813 | DEBUG    | __main__:trials:29 - Trial = 24578/30000 | Total reward = 37.62
2022-01-26 14:18:25.817 | DEBUG    | __main__:trials:24 - Trial = 24579/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.818 | DEBUG    | __main__:trials:29 - Trial = 24579/30000 | Total reward = 35.36
2022-01-26 14:18:25.821 | DEBUG    | __main__:trials:24 - Trial = 24580/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.823 | DEBUG    | __main__:trials:29 - Trial = 24580/30000 | Total reward = 38.41
2022-01-26 14:18:25.826 | DEBUG    | __main__:trials:24 - Trial = 24581/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.827 | DEBUG    | __main__:trials:29 - Trial = 24581/30000 | Total reward = 38.38
2022-01-26 14:18:25.831 | DEBUG    | __main__:trials:24 - Trial = 24582/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.833 | DEBUG    | __main__:trials:29 - Trial = 24582/30000 | Total reward = 34.85
2022-01-26 14:18:25.836 | DEBUG    | __main__:trials:24 - Trial = 24583/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.838 | DEBUG    | __main__:trials:29 - Trial = 24583/30000 | Total reward = 30.68
2022-01-26 14:18:25.840 | DEBUG    | __main__:trials:24 - Trial = 24584/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.842 | DEBUG    | __main__:trials:29 - Trial = 24584/30000 | Total reward = 32.94
2022-01-26 14:18:25.846 | DEBUG    | __main__:trials:24 - Trial = 24585/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.848 | DEBUG    | __main__:trials:29 - Trial = 24585/30000 | Total reward = 28.13
2022-01-26 14:18:25.851 | DEBUG    | __main__:trials:24 - Trial = 24586/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.852 | DEBUG    | __main__:trials:29 - Trial = 24586/30000 | Total reward = 39.86
2022-01-26 14:18:25.856 | DEBUG    | __main__:trials:24 - Trial = 24587/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.857 | DEBUG    | __main__:trials:29 - Trial = 24587/30000 | Total reward = 41.76
2022-01-26 14:18:25.861 | DEBUG    | __main__:trials:26 - Trial = 24588/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.863 | DEBUG    | __main__:trials:29 - Trial = 24588/30000 | Total reward = 23.35
2022-01-26 14:18:25.867 | DEBUG    | __main__:trials:24 - Trial = 24589/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.867 | DEBUG    | __main__:trials:29 - Trial = 24589/30000 | Total reward = 35.40
2022-01-26 14:18:25.871 | DEBUG    | __main__:trials:24 - Trial = 24590/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.873 | DEBUG    | __main__:trials:29 - Trial = 24590/30000 | Total reward = 39.40
2022-01-26 14:18:25.876 | DEBUG    | __main__:trials:24 - Trial = 24591/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.878 | DEBUG    | __main__:trials:29 - Trial = 24591/30000 | Total reward = 37.91
2022-01-26 14:18:25.881 | DEBUG    | __main__:trials:24 - Trial = 24592/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.882 | DEBUG    | __main__:trials:29 - Trial = 24592/30000 | Total reward = 34.11
2022-01-26 14:18:25.886 | DEBUG    | __main__:trials:24 - Trial = 24593/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.887 | DEBUG    | __main__:trials:29 - Trial = 24593/30000 | Total reward = 31.52
2022-01-26 14:18:25.891 | DEBUG    | __main__:trials:24 - Trial = 24594/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.893 | DEBUG    | __main__:trials:29 - Trial = 24594/30000 | Total reward = 36.98
2022-01-26 14:18:25.897 | DEBUG    | __main__:trials:24 - Trial = 24595/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.898 | DEBUG    | __main__:trials:29 - Trial = 24595/30000 | Total reward = 31.16
2022-01-26 14:18:25.902 | DEBUG    | __main__:trials:24 - Trial = 24596/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.903 | DEBUG    | __main__:trials:29 - Trial = 24596/30000 | Total reward = 33.95
2022-01-26 14:18:25.907 | DEBUG    | __main__:trials:24 - Trial = 24597/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.909 | DEBUG    | __main__:trials:29 - Trial = 24597/30000 | Total reward = 37.55
2022-01-26 14:18:25.912 | DEBUG    | __main__:trials:24 - Trial = 24598/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.914 | DEBUG    | __main__:trials:29 - Trial = 24598/30000 | Total reward = 35.20
2022-01-26 14:18:25.917 | DEBUG    | __main__:trials:24 - Trial = 24599/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.919 | DEBUG    | __main__:trials:29 - Trial = 24599/30000 | Total reward = 37.31
2022-01-26 14:18:25.922 | DEBUG    | __main__:trials:24 - Trial = 24600/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.924 | DEBUG    | __main__:trials:29 - Trial = 24600/30000 | Total reward = 34.73
2022-01-26 14:18:25.927 | DEBUG    | __main__:trials:24 - Trial = 24601/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.928 | DEBUG    | __main__:trials:29 - Trial = 24601/30000 | Total reward = 48.56
2022-01-26 14:18:25.932 | DEBUG    | __main__:trials:24 - Trial = 24602/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.933 | DEBUG    | __main__:trials:29 - Trial = 24602/30000 | Total reward = 34.22
2022-01-26 14:18:25.937 | DEBUG    | __main__:trials:24 - Trial = 24603/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.939 | DEBUG    | __main__:trials:29 - Trial = 24603/30000 | Total reward = 28.01
2022-01-26 14:18:25.942 | DEBUG    | __main__:trials:24 - Trial = 24604/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.943 | DEBUG    | __main__:trials:29 - Trial = 24604/30000 | Total reward = 41.39
2022-01-26 14:18:25.947 | DEBUG    | __main__:trials:24 - Trial = 24605/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.949 | DEBUG    | __main__:trials:29 - Trial = 24605/30000 | Total reward = 46.40
2022-01-26 14:18:25.952 | DEBUG    | __main__:trials:24 - Trial = 24606/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.953 | DEBUG    | __main__:trials:29 - Trial = 24606/30000 | Total reward = 34.38
2022-01-26 14:18:25.957 | DEBUG    | __main__:trials:24 - Trial = 24607/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.959 | DEBUG    | __main__:trials:29 - Trial = 24607/30000 | Total reward = 40.34
2022-01-26 14:18:25.962 | DEBUG    | __main__:trials:24 - Trial = 24608/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.964 | DEBUG    | __main__:trials:29 - Trial = 24608/30000 | Total reward = 36.31
2022-01-26 14:18:25.967 | DEBUG    | __main__:trials:26 - Trial = 24609/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:25.967 | DEBUG    | __main__:trials:29 - Trial = 24609/30000 | Total reward = 12.41
2022-01-26 14:18:25.972 | DEBUG    | __main__:trials:24 - Trial = 24610/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.974 | DEBUG    | __main__:trials:29 - Trial = 24610/30000 | Total reward = 33.99
2022-01-26 14:18:25.977 | DEBUG    | __main__:trials:24 - Trial = 24611/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.979 | DEBUG    | __main__:trials:29 - Trial = 24611/30000 | Total reward = 33.59
2022-01-26 14:18:25.982 | DEBUG    | __main__:trials:24 - Trial = 24612/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.984 | DEBUG    | __main__:trials:29 - Trial = 24612/30000 | Total reward = 36.29
2022-01-26 14:18:25.987 | DEBUG    | __main__:trials:24 - Trial = 24613/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.989 | DEBUG    | __main__:trials:29 - Trial = 24613/30000 | Total reward = 33.70
2022-01-26 14:18:25.992 | DEBUG    | __main__:trials:24 - Trial = 24614/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.993 | DEBUG    | __main__:trials:29 - Trial = 24614/30000 | Total reward = 33.70
2022-01-26 14:18:25.997 | DEBUG    | __main__:trials:24 - Trial = 24615/30000 | Max number of steps (20) reached
2022-01-26 14:18:25.999 | DEBUG    | __main__:trials:29 - Trial = 24615/30000 | Total reward = 35.60
2022-01-26 14:18:26.003 | DEBUG    | __main__:trials:24 - Trial = 24616/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.003 | DEBUG    | __main__:trials:29 - Trial = 24616/30000 | Total reward = 31.76
2022-01-26 14:18:26.008 | DEBUG    | __main__:trials:24 - Trial = 24617/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.009 | DEBUG    | __main__:trials:29 - Trial = 24617/30000 | Total reward = 52.08
2022-01-26 14:18:26.012 | DEBUG    | __main__:trials:24 - Trial = 24618/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.014 | DEBUG    | __main__:trials:29 - Trial = 24618/30000 | Total reward = 33.96
2022-01-26 14:18:26.017 | DEBUG    | __main__:trials:24 - Trial = 24619/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.019 | DEBUG    | __main__:trials:29 - Trial = 24619/30000 | Total reward = 51.73
2022-01-26 14:18:26.023 | DEBUG    | __main__:trials:24 - Trial = 24620/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.024 | DEBUG    | __main__:trials:29 - Trial = 24620/30000 | Total reward = 36.54
2022-01-26 14:18:26.028 | DEBUG    | __main__:trials:24 - Trial = 24621/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.028 | DEBUG    | __main__:trials:29 - Trial = 24621/30000 | Total reward = 32.78
2022-01-26 14:18:26.033 | DEBUG    | __main__:trials:24 - Trial = 24622/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.034 | DEBUG    | __main__:trials:29 - Trial = 24622/30000 | Total reward = 34.38
2022-01-26 14:18:26.038 | DEBUG    | __main__:trials:24 - Trial = 24623/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.040 | DEBUG    | __main__:trials:29 - Trial = 24623/30000 | Total reward = 33.44
2022-01-26 14:18:26.044 | DEBUG    | __main__:trials:24 - Trial = 24624/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.045 | DEBUG    | __main__:trials:29 - Trial = 24624/30000 | Total reward = 34.68
2022-01-26 14:18:26.048 | DEBUG    | __main__:trials:24 - Trial = 24625/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.050 | DEBUG    | __main__:trials:29 - Trial = 24625/30000 | Total reward = 36.74
2022-01-26 14:18:26.054 | DEBUG    | __main__:trials:24 - Trial = 24626/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.055 | DEBUG    | __main__:trials:29 - Trial = 24626/30000 | Total reward = 39.47
2022-01-26 14:18:26.059 | DEBUG    | __main__:trials:24 - Trial = 24627/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.061 | DEBUG    | __main__:trials:29 - Trial = 24627/30000 | Total reward = 36.61
2022-01-26 14:18:26.065 | DEBUG    | __main__:trials:24 - Trial = 24628/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.065 | DEBUG    | __main__:trials:29 - Trial = 24628/30000 | Total reward = 37.28
2022-01-26 14:18:26.068 | DEBUG    | __main__:trials:24 - Trial = 24629/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.069 | DEBUG    | __main__:trials:29 - Trial = 24629/30000 | Total reward = 45.04
2022-01-26 14:18:26.073 | DEBUG    | __main__:trials:26 - Trial = 24630/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.074 | DEBUG    | __main__:trials:29 - Trial = 24630/30000 | Total reward = 20.87
2022-01-26 14:18:26.078 | DEBUG    | __main__:trials:26 - Trial = 24631/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.079 | DEBUG    | __main__:trials:29 - Trial = 24631/30000 | Total reward = 31.04
2022-01-26 14:18:26.082 | DEBUG    | __main__:trials:24 - Trial = 24632/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.083 | DEBUG    | __main__:trials:29 - Trial = 24632/30000 | Total reward = 34.84
2022-01-26 14:18:26.087 | DEBUG    | __main__:trials:24 - Trial = 24633/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.089 | DEBUG    | __main__:trials:29 - Trial = 24633/30000 | Total reward = 40.35
2022-01-26 14:18:26.092 | DEBUG    | __main__:trials:24 - Trial = 24634/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.093 | DEBUG    | __main__:trials:29 - Trial = 24634/30000 | Total reward = 33.57
2022-01-26 14:18:26.097 | DEBUG    | __main__:trials:24 - Trial = 24635/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.098 | DEBUG    | __main__:trials:29 - Trial = 24635/30000 | Total reward = 44.31
2022-01-26 14:18:26.102 | DEBUG    | __main__:trials:24 - Trial = 24636/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.102 | DEBUG    | __main__:trials:29 - Trial = 24636/30000 | Total reward = 43.70
2022-01-26 14:18:26.106 | DEBUG    | __main__:trials:24 - Trial = 24637/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.106 | DEBUG    | __main__:trials:29 - Trial = 24637/30000 | Total reward = 34.15
2022-01-26 14:18:26.110 | DEBUG    | __main__:trials:24 - Trial = 24638/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.112 | DEBUG    | __main__:trials:29 - Trial = 24638/30000 | Total reward = 34.45
2022-01-26 14:18:26.116 | DEBUG    | __main__:trials:24 - Trial = 24639/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.116 | DEBUG    | __main__:trials:29 - Trial = 24639/30000 | Total reward = 35.04
2022-01-26 14:18:26.120 | DEBUG    | __main__:trials:24 - Trial = 24640/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.121 | DEBUG    | __main__:trials:29 - Trial = 24640/30000 | Total reward = 34.26
2022-01-26 14:18:26.124 | DEBUG    | __main__:trials:26 - Trial = 24641/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.125 | DEBUG    | __main__:trials:29 - Trial = 24641/30000 | Total reward = 21.17
2022-01-26 14:18:26.128 | DEBUG    | __main__:trials:24 - Trial = 24642/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.130 | DEBUG    | __main__:trials:29 - Trial = 24642/30000 | Total reward = 31.04
2022-01-26 14:18:26.133 | DEBUG    | __main__:trials:24 - Trial = 24643/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.135 | DEBUG    | __main__:trials:29 - Trial = 24643/30000 | Total reward = 47.32
2022-01-26 14:18:26.138 | DEBUG    | __main__:trials:24 - Trial = 24644/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.139 | DEBUG    | __main__:trials:29 - Trial = 24644/30000 | Total reward = 37.12
2022-01-26 14:18:26.142 | DEBUG    | __main__:trials:24 - Trial = 24645/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.144 | DEBUG    | __main__:trials:29 - Trial = 24645/30000 | Total reward = 38.73
2022-01-26 14:18:26.147 | DEBUG    | __main__:trials:24 - Trial = 24646/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.150 | DEBUG    | __main__:trials:29 - Trial = 24646/30000 | Total reward = 39.08
2022-01-26 14:18:26.153 | DEBUG    | __main__:trials:24 - Trial = 24647/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.155 | DEBUG    | __main__:trials:29 - Trial = 24647/30000 | Total reward = 38.20
2022-01-26 14:18:26.159 | DEBUG    | __main__:trials:24 - Trial = 24648/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.160 | DEBUG    | __main__:trials:29 - Trial = 24648/30000 | Total reward = 36.42
2022-01-26 14:18:26.164 | DEBUG    | __main__:trials:24 - Trial = 24649/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.165 | DEBUG    | __main__:trials:29 - Trial = 24649/30000 | Total reward = 60.27
2022-01-26 14:18:26.169 | DEBUG    | __main__:trials:24 - Trial = 24650/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.170 | DEBUG    | __main__:trials:29 - Trial = 24650/30000 | Total reward = 36.93
2022-01-26 14:18:26.174 | DEBUG    | __main__:trials:24 - Trial = 24651/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.176 | DEBUG    | __main__:trials:29 - Trial = 24651/30000 | Total reward = 38.41
2022-01-26 14:18:26.180 | DEBUG    | __main__:trials:24 - Trial = 24652/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.182 | DEBUG    | __main__:trials:29 - Trial = 24652/30000 | Total reward = 42.22
2022-01-26 14:18:26.185 | DEBUG    | __main__:trials:24 - Trial = 24653/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.187 | DEBUG    | __main__:trials:29 - Trial = 24653/30000 | Total reward = 44.46
2022-01-26 14:18:26.191 | DEBUG    | __main__:trials:24 - Trial = 24654/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.192 | DEBUG    | __main__:trials:29 - Trial = 24654/30000 | Total reward = 20.72
2022-01-26 14:18:26.195 | DEBUG    | __main__:trials:24 - Trial = 24655/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.196 | DEBUG    | __main__:trials:29 - Trial = 24655/30000 | Total reward = 36.15
2022-01-26 14:18:26.199 | DEBUG    | __main__:trials:24 - Trial = 24656/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.201 | DEBUG    | __main__:trials:29 - Trial = 24656/30000 | Total reward = 48.95
2022-01-26 14:18:26.204 | DEBUG    | __main__:trials:24 - Trial = 24657/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.206 | DEBUG    | __main__:trials:29 - Trial = 24657/30000 | Total reward = 45.11
2022-01-26 14:18:26.210 | DEBUG    | __main__:trials:24 - Trial = 24658/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.211 | DEBUG    | __main__:trials:29 - Trial = 24658/30000 | Total reward = 41.24
2022-01-26 14:18:26.214 | DEBUG    | __main__:trials:24 - Trial = 24659/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.216 | DEBUG    | __main__:trials:29 - Trial = 24659/30000 | Total reward = 33.49
2022-01-26 14:18:26.219 | DEBUG    | __main__:trials:24 - Trial = 24660/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.220 | DEBUG    | __main__:trials:29 - Trial = 24660/30000 | Total reward = 35.42
2022-01-26 14:18:26.224 | DEBUG    | __main__:trials:24 - Trial = 24661/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.225 | DEBUG    | __main__:trials:29 - Trial = 24661/30000 | Total reward = 36.65
2022-01-26 14:18:26.229 | DEBUG    | __main__:trials:24 - Trial = 24662/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.231 | DEBUG    | __main__:trials:29 - Trial = 24662/30000 | Total reward = 33.47
2022-01-26 14:18:26.235 | DEBUG    | __main__:trials:24 - Trial = 24663/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.236 | DEBUG    | __main__:trials:29 - Trial = 24663/30000 | Total reward = 34.81
2022-01-26 14:18:26.240 | DEBUG    | __main__:trials:24 - Trial = 24664/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.241 | DEBUG    | __main__:trials:29 - Trial = 24664/30000 | Total reward = 44.17
2022-01-26 14:18:26.244 | DEBUG    | __main__:trials:26 - Trial = 24665/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.246 | DEBUG    | __main__:trials:29 - Trial = 24665/30000 | Total reward = 21.08
2022-01-26 14:18:26.249 | DEBUG    | __main__:trials:24 - Trial = 24666/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.250 | DEBUG    | __main__:trials:29 - Trial = 24666/30000 | Total reward = 36.95
2022-01-26 14:18:26.255 | DEBUG    | __main__:trials:24 - Trial = 24667/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.255 | DEBUG    | __main__:trials:29 - Trial = 24667/30000 | Total reward = 51.11
2022-01-26 14:18:26.260 | DEBUG    | __main__:trials:24 - Trial = 24668/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.261 | DEBUG    | __main__:trials:29 - Trial = 24668/30000 | Total reward = 32.93
2022-01-26 14:18:26.265 | DEBUG    | __main__:trials:24 - Trial = 24669/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.267 | DEBUG    | __main__:trials:29 - Trial = 24669/30000 | Total reward = 16.99
2022-01-26 14:18:26.270 | DEBUG    | __main__:trials:24 - Trial = 24670/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.272 | DEBUG    | __main__:trials:29 - Trial = 24670/30000 | Total reward = 38.25
2022-01-26 14:18:26.276 | DEBUG    | __main__:trials:24 - Trial = 24671/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.277 | DEBUG    | __main__:trials:29 - Trial = 24671/30000 | Total reward = 36.84
2022-01-26 14:18:26.281 | DEBUG    | __main__:trials:24 - Trial = 24672/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.282 | DEBUG    | __main__:trials:29 - Trial = 24672/30000 | Total reward = 39.16
2022-01-26 14:18:26.287 | DEBUG    | __main__:trials:24 - Trial = 24673/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.287 | DEBUG    | __main__:trials:29 - Trial = 24673/30000 | Total reward = 37.44
2022-01-26 14:18:26.292 | DEBUG    | __main__:trials:24 - Trial = 24674/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.293 | DEBUG    | __main__:trials:29 - Trial = 24674/30000 | Total reward = 37.57
2022-01-26 14:18:26.297 | DEBUG    | __main__:trials:24 - Trial = 24675/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.298 | DEBUG    | __main__:trials:29 - Trial = 24675/30000 | Total reward = 35.42
2022-01-26 14:18:26.302 | DEBUG    | __main__:trials:24 - Trial = 24676/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.304 | DEBUG    | __main__:trials:29 - Trial = 24676/30000 | Total reward = 36.19
2022-01-26 14:18:26.308 | DEBUG    | __main__:trials:24 - Trial = 24677/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.309 | DEBUG    | __main__:trials:29 - Trial = 24677/30000 | Total reward = 39.31
2022-01-26 14:18:26.313 | DEBUG    | __main__:trials:24 - Trial = 24678/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.314 | DEBUG    | __main__:trials:29 - Trial = 24678/30000 | Total reward = 35.59
2022-01-26 14:18:26.318 | DEBUG    | __main__:trials:24 - Trial = 24679/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.319 | DEBUG    | __main__:trials:29 - Trial = 24679/30000 | Total reward = 40.58
2022-01-26 14:18:26.323 | DEBUG    | __main__:trials:24 - Trial = 24680/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.325 | DEBUG    | __main__:trials:29 - Trial = 24680/30000 | Total reward = 35.77
2022-01-26 14:18:26.329 | DEBUG    | __main__:trials:24 - Trial = 24681/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.330 | DEBUG    | __main__:trials:29 - Trial = 24681/30000 | Total reward = 37.67
2022-01-26 14:18:26.333 | DEBUG    | __main__:trials:24 - Trial = 24682/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.334 | DEBUG    | __main__:trials:29 - Trial = 24682/30000 | Total reward = 35.91
2022-01-26 14:18:26.338 | DEBUG    | __main__:trials:24 - Trial = 24683/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.340 | DEBUG    | __main__:trials:29 - Trial = 24683/30000 | Total reward = 35.44
2022-01-26 14:18:26.343 | DEBUG    | __main__:trials:24 - Trial = 24684/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.344 | DEBUG    | __main__:trials:29 - Trial = 24684/30000 | Total reward = 40.62
2022-01-26 14:18:26.348 | DEBUG    | __main__:trials:24 - Trial = 24685/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.349 | DEBUG    | __main__:trials:29 - Trial = 24685/30000 | Total reward = 37.36
2022-01-26 14:18:26.353 | DEBUG    | __main__:trials:24 - Trial = 24686/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.354 | DEBUG    | __main__:trials:29 - Trial = 24686/30000 | Total reward = 59.87
2022-01-26 14:18:26.358 | DEBUG    | __main__:trials:24 - Trial = 24687/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.359 | DEBUG    | __main__:trials:29 - Trial = 24687/30000 | Total reward = 36.79
2022-01-26 14:18:26.363 | DEBUG    | __main__:trials:24 - Trial = 24688/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.364 | DEBUG    | __main__:trials:29 - Trial = 24688/30000 | Total reward = 29.67
2022-01-26 14:18:26.368 | DEBUG    | __main__:trials:24 - Trial = 24689/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.370 | DEBUG    | __main__:trials:29 - Trial = 24689/30000 | Total reward = 35.53
2022-01-26 14:18:26.374 | DEBUG    | __main__:trials:24 - Trial = 24690/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.375 | DEBUG    | __main__:trials:29 - Trial = 24690/30000 | Total reward = 37.50
2022-01-26 14:18:26.379 | DEBUG    | __main__:trials:24 - Trial = 24691/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.379 | DEBUG    | __main__:trials:29 - Trial = 24691/30000 | Total reward = 31.21
2022-01-26 14:18:26.384 | DEBUG    | __main__:trials:24 - Trial = 24692/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.385 | DEBUG    | __main__:trials:29 - Trial = 24692/30000 | Total reward = 38.78
2022-01-26 14:18:26.388 | DEBUG    | __main__:trials:24 - Trial = 24693/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.390 | DEBUG    | __main__:trials:29 - Trial = 24693/30000 | Total reward = 35.77
2022-01-26 14:18:26.393 | DEBUG    | __main__:trials:24 - Trial = 24694/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.395 | DEBUG    | __main__:trials:29 - Trial = 24694/30000 | Total reward = 33.21
2022-01-26 14:18:26.398 | DEBUG    | __main__:trials:24 - Trial = 24695/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.399 | DEBUG    | __main__:trials:29 - Trial = 24695/30000 | Total reward = 37.45
2022-01-26 14:18:26.403 | DEBUG    | __main__:trials:24 - Trial = 24696/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.403 | DEBUG    | __main__:trials:29 - Trial = 24696/30000 | Total reward = 39.21
2022-01-26 14:18:26.408 | DEBUG    | __main__:trials:24 - Trial = 24697/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.408 | DEBUG    | __main__:trials:29 - Trial = 24697/30000 | Total reward = 35.33
2022-01-26 14:18:26.413 | DEBUG    | __main__:trials:24 - Trial = 24698/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.414 | DEBUG    | __main__:trials:29 - Trial = 24698/30000 | Total reward = 47.69
2022-01-26 14:18:26.418 | DEBUG    | __main__:trials:24 - Trial = 24699/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.420 | DEBUG    | __main__:trials:29 - Trial = 24699/30000 | Total reward = 36.62
2022-01-26 14:18:26.423 | DEBUG    | __main__:trials:24 - Trial = 24700/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.425 | DEBUG    | __main__:trials:29 - Trial = 24700/30000 | Total reward = 38.20
2022-01-26 14:18:26.429 | DEBUG    | __main__:trials:24 - Trial = 24701/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.430 | DEBUG    | __main__:trials:29 - Trial = 24701/30000 | Total reward = 40.33
2022-01-26 14:18:26.434 | DEBUG    | __main__:trials:24 - Trial = 24702/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.435 | DEBUG    | __main__:trials:29 - Trial = 24702/30000 | Total reward = 36.07
2022-01-26 14:18:26.439 | DEBUG    | __main__:trials:24 - Trial = 24703/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.440 | DEBUG    | __main__:trials:29 - Trial = 24703/30000 | Total reward = 38.14
2022-01-26 14:18:26.444 | DEBUG    | __main__:trials:24 - Trial = 24704/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.445 | DEBUG    | __main__:trials:29 - Trial = 24704/30000 | Total reward = 39.35
2022-01-26 14:18:26.449 | DEBUG    | __main__:trials:24 - Trial = 24705/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.451 | DEBUG    | __main__:trials:29 - Trial = 24705/30000 | Total reward = 36.77
2022-01-26 14:18:26.455 | DEBUG    | __main__:trials:24 - Trial = 24706/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.456 | DEBUG    | __main__:trials:29 - Trial = 24706/30000 | Total reward = 38.52
2022-01-26 14:18:26.459 | DEBUG    | __main__:trials:24 - Trial = 24707/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.461 | DEBUG    | __main__:trials:29 - Trial = 24707/30000 | Total reward = 49.61
2022-01-26 14:18:26.465 | DEBUG    | __main__:trials:24 - Trial = 24708/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.466 | DEBUG    | __main__:trials:29 - Trial = 24708/30000 | Total reward = 34.42
2022-01-26 14:18:26.469 | DEBUG    | __main__:trials:24 - Trial = 24709/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.471 | DEBUG    | __main__:trials:29 - Trial = 24709/30000 | Total reward = 40.08
2022-01-26 14:18:26.475 | DEBUG    | __main__:trials:24 - Trial = 24710/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.476 | DEBUG    | __main__:trials:29 - Trial = 24710/30000 | Total reward = 43.14
2022-01-26 14:18:26.480 | DEBUG    | __main__:trials:24 - Trial = 24711/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.482 | DEBUG    | __main__:trials:29 - Trial = 24711/30000 | Total reward = 37.24
2022-01-26 14:18:26.485 | DEBUG    | __main__:trials:24 - Trial = 24712/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.487 | DEBUG    | __main__:trials:29 - Trial = 24712/30000 | Total reward = 38.36
2022-01-26 14:18:26.490 | DEBUG    | __main__:trials:24 - Trial = 24713/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.492 | DEBUG    | __main__:trials:29 - Trial = 24713/30000 | Total reward = 33.40
2022-01-26 14:18:26.495 | DEBUG    | __main__:trials:24 - Trial = 24714/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.497 | DEBUG    | __main__:trials:29 - Trial = 24714/30000 | Total reward = 38.06
2022-01-26 14:18:26.500 | DEBUG    | __main__:trials:24 - Trial = 24715/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.502 | DEBUG    | __main__:trials:29 - Trial = 24715/30000 | Total reward = 36.73
2022-01-26 14:18:26.505 | DEBUG    | __main__:trials:24 - Trial = 24716/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.506 | DEBUG    | __main__:trials:29 - Trial = 24716/30000 | Total reward = 35.74
2022-01-26 14:18:26.511 | DEBUG    | __main__:trials:24 - Trial = 24717/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.512 | DEBUG    | __main__:trials:29 - Trial = 24717/30000 | Total reward = 36.67
2022-01-26 14:18:26.516 | DEBUG    | __main__:trials:26 - Trial = 24718/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.517 | DEBUG    | __main__:trials:29 - Trial = 24718/30000 | Total reward = 26.17
2022-01-26 14:18:26.521 | DEBUG    | __main__:trials:24 - Trial = 24719/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.523 | DEBUG    | __main__:trials:29 - Trial = 24719/30000 | Total reward = 47.13
2022-01-26 14:18:26.527 | DEBUG    | __main__:trials:24 - Trial = 24720/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.527 | DEBUG    | __main__:trials:29 - Trial = 24720/30000 | Total reward = 51.70
2022-01-26 14:18:26.532 | DEBUG    | __main__:trials:24 - Trial = 24721/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.533 | DEBUG    | __main__:trials:29 - Trial = 24721/30000 | Total reward = 37.79
2022-01-26 14:18:26.537 | DEBUG    | __main__:trials:24 - Trial = 24722/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.538 | DEBUG    | __main__:trials:29 - Trial = 24722/30000 | Total reward = 37.93
2022-01-26 14:18:26.542 | DEBUG    | __main__:trials:26 - Trial = 24723/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.543 | DEBUG    | __main__:trials:29 - Trial = 24723/30000 | Total reward = 29.01
2022-01-26 14:18:26.547 | DEBUG    | __main__:trials:24 - Trial = 24724/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.549 | DEBUG    | __main__:trials:29 - Trial = 24724/30000 | Total reward = 38.36
2022-01-26 14:18:26.552 | DEBUG    | __main__:trials:24 - Trial = 24725/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.554 | DEBUG    | __main__:trials:29 - Trial = 24725/30000 | Total reward = 33.57
2022-01-26 14:18:26.558 | DEBUG    | __main__:trials:24 - Trial = 24726/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.559 | DEBUG    | __main__:trials:29 - Trial = 24726/30000 | Total reward = 40.21
2022-01-26 14:18:26.563 | DEBUG    | __main__:trials:24 - Trial = 24727/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.563 | DEBUG    | __main__:trials:29 - Trial = 24727/30000 | Total reward = 37.61
2022-01-26 14:18:26.568 | DEBUG    | __main__:trials:24 - Trial = 24728/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.568 | DEBUG    | __main__:trials:29 - Trial = 24728/30000 | Total reward = 42.65
2022-01-26 14:18:26.571 | DEBUG    | __main__:trials:26 - Trial = 24729/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.573 | DEBUG    | __main__:trials:29 - Trial = 24729/30000 | Total reward = 21.51
2022-01-26 14:18:26.577 | DEBUG    | __main__:trials:24 - Trial = 24730/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.578 | DEBUG    | __main__:trials:29 - Trial = 24730/30000 | Total reward = 37.67
2022-01-26 14:18:26.582 | DEBUG    | __main__:trials:26 - Trial = 24731/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.583 | DEBUG    | __main__:trials:29 - Trial = 24731/30000 | Total reward = 26.24
2022-01-26 14:18:26.587 | DEBUG    | __main__:trials:24 - Trial = 24732/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.588 | DEBUG    | __main__:trials:29 - Trial = 24732/30000 | Total reward = 38.66
2022-01-26 14:18:26.591 | DEBUG    | __main__:trials:24 - Trial = 24733/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.593 | DEBUG    | __main__:trials:29 - Trial = 24733/30000 | Total reward = 47.87
2022-01-26 14:18:26.596 | DEBUG    | __main__:trials:24 - Trial = 24734/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.598 | DEBUG    | __main__:trials:29 - Trial = 24734/30000 | Total reward = 31.28
2022-01-26 14:18:26.601 | DEBUG    | __main__:trials:24 - Trial = 24735/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.603 | DEBUG    | __main__:trials:29 - Trial = 24735/30000 | Total reward = 35.19
2022-01-26 14:18:26.607 | DEBUG    | __main__:trials:24 - Trial = 24736/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.607 | DEBUG    | __main__:trials:29 - Trial = 24736/30000 | Total reward = 39.19
2022-01-26 14:18:26.612 | DEBUG    | __main__:trials:24 - Trial = 24737/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.612 | DEBUG    | __main__:trials:29 - Trial = 24737/30000 | Total reward = 47.77
2022-01-26 14:18:26.617 | DEBUG    | __main__:trials:24 - Trial = 24738/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.618 | DEBUG    | __main__:trials:29 - Trial = 24738/30000 | Total reward = 42.87
2022-01-26 14:18:26.621 | DEBUG    | __main__:trials:24 - Trial = 24739/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.622 | DEBUG    | __main__:trials:29 - Trial = 24739/30000 | Total reward = 36.92
2022-01-26 14:18:26.625 | DEBUG    | __main__:trials:26 - Trial = 24740/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.626 | DEBUG    | __main__:trials:29 - Trial = 24740/30000 | Total reward = 24.35
2022-01-26 14:18:26.629 | DEBUG    | __main__:trials:24 - Trial = 24741/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.630 | DEBUG    | __main__:trials:29 - Trial = 24741/30000 | Total reward = 38.25
2022-01-26 14:18:26.633 | DEBUG    | __main__:trials:26 - Trial = 24742/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.634 | DEBUG    | __main__:trials:29 - Trial = 24742/30000 | Total reward = 24.99
2022-01-26 14:18:26.638 | DEBUG    | __main__:trials:24 - Trial = 24743/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.638 | DEBUG    | __main__:trials:29 - Trial = 24743/30000 | Total reward = 44.24
2022-01-26 14:18:26.642 | DEBUG    | __main__:trials:26 - Trial = 24744/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.643 | DEBUG    | __main__:trials:29 - Trial = 24744/30000 | Total reward = 27.67
2022-01-26 14:18:26.647 | DEBUG    | __main__:trials:24 - Trial = 24745/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.649 | DEBUG    | __main__:trials:29 - Trial = 24745/30000 | Total reward = 39.30
2022-01-26 14:18:26.652 | DEBUG    | __main__:trials:24 - Trial = 24746/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.654 | DEBUG    | __main__:trials:29 - Trial = 24746/30000 | Total reward = 37.38
2022-01-26 14:18:26.656 | DEBUG    | __main__:trials:26 - Trial = 24747/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.658 | DEBUG    | __main__:trials:29 - Trial = 24747/30000 | Total reward = 17.29
2022-01-26 14:18:26.662 | DEBUG    | __main__:trials:24 - Trial = 24748/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.662 | DEBUG    | __main__:trials:29 - Trial = 24748/30000 | Total reward = 33.58
2022-01-26 14:18:26.666 | DEBUG    | __main__:trials:26 - Trial = 24749/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.668 | DEBUG    | __main__:trials:29 - Trial = 24749/30000 | Total reward = 22.99
2022-01-26 14:18:26.672 | DEBUG    | __main__:trials:24 - Trial = 24750/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.673 | DEBUG    | __main__:trials:29 - Trial = 24750/30000 | Total reward = 37.23
2022-01-26 14:18:26.677 | DEBUG    | __main__:trials:24 - Trial = 24751/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.679 | DEBUG    | __main__:trials:29 - Trial = 24751/30000 | Total reward = 38.20
2022-01-26 14:18:26.683 | DEBUG    | __main__:trials:26 - Trial = 24752/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.683 | DEBUG    | __main__:trials:29 - Trial = 24752/30000 | Total reward = 27.88
2022-01-26 14:18:26.688 | DEBUG    | __main__:trials:24 - Trial = 24753/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.689 | DEBUG    | __main__:trials:29 - Trial = 24753/30000 | Total reward = 46.63
2022-01-26 14:18:26.692 | DEBUG    | __main__:trials:24 - Trial = 24754/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.694 | DEBUG    | __main__:trials:29 - Trial = 24754/30000 | Total reward = 38.41
2022-01-26 14:18:26.697 | DEBUG    | __main__:trials:26 - Trial = 24755/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.698 | DEBUG    | __main__:trials:29 - Trial = 24755/30000 | Total reward = 26.80
2022-01-26 14:18:26.702 | DEBUG    | __main__:trials:24 - Trial = 24756/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.704 | DEBUG    | __main__:trials:29 - Trial = 24756/30000 | Total reward = 39.09
2022-01-26 14:18:26.708 | DEBUG    | __main__:trials:24 - Trial = 24757/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.709 | DEBUG    | __main__:trials:29 - Trial = 24757/30000 | Total reward = 40.40
2022-01-26 14:18:26.713 | DEBUG    | __main__:trials:26 - Trial = 24758/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.714 | DEBUG    | __main__:trials:29 - Trial = 24758/30000 | Total reward = 19.00
2022-01-26 14:18:26.718 | DEBUG    | __main__:trials:24 - Trial = 24759/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.719 | DEBUG    | __main__:trials:29 - Trial = 24759/30000 | Total reward = 51.30
2022-01-26 14:18:26.723 | DEBUG    | __main__:trials:26 - Trial = 24760/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.725 | DEBUG    | __main__:trials:29 - Trial = 24760/30000 | Total reward = 24.87
2022-01-26 14:18:26.728 | DEBUG    | __main__:trials:26 - Trial = 24761/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.729 | DEBUG    | __main__:trials:29 - Trial = 24761/30000 | Total reward = 19.01
2022-01-26 14:18:26.732 | DEBUG    | __main__:trials:24 - Trial = 24762/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.733 | DEBUG    | __main__:trials:29 - Trial = 24762/30000 | Total reward = 38.36
2022-01-26 14:18:26.736 | DEBUG    | __main__:trials:26 - Trial = 24763/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.737 | DEBUG    | __main__:trials:29 - Trial = 24763/30000 | Total reward = 26.86
2022-01-26 14:18:26.740 | DEBUG    | __main__:trials:24 - Trial = 24764/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.742 | DEBUG    | __main__:trials:29 - Trial = 24764/30000 | Total reward = 21.86
2022-01-26 14:18:26.745 | DEBUG    | __main__:trials:24 - Trial = 24765/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.746 | DEBUG    | __main__:trials:29 - Trial = 24765/30000 | Total reward = 39.13
2022-01-26 14:18:26.751 | DEBUG    | __main__:trials:24 - Trial = 24766/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.751 | DEBUG    | __main__:trials:29 - Trial = 24766/30000 | Total reward = 36.62
2022-01-26 14:18:26.755 | DEBUG    | __main__:trials:24 - Trial = 24767/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.757 | DEBUG    | __main__:trials:29 - Trial = 24767/30000 | Total reward = 38.72
2022-01-26 14:18:26.760 | DEBUG    | __main__:trials:24 - Trial = 24768/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.762 | DEBUG    | __main__:trials:29 - Trial = 24768/30000 | Total reward = 43.19
2022-01-26 14:18:26.766 | DEBUG    | __main__:trials:24 - Trial = 24769/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.767 | DEBUG    | __main__:trials:29 - Trial = 24769/30000 | Total reward = 49.62
2022-01-26 14:18:26.770 | DEBUG    | __main__:trials:24 - Trial = 24770/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.772 | DEBUG    | __main__:trials:29 - Trial = 24770/30000 | Total reward = 39.70
2022-01-26 14:18:26.776 | DEBUG    | __main__:trials:24 - Trial = 24771/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.777 | DEBUG    | __main__:trials:29 - Trial = 24771/30000 | Total reward = 31.78
2022-01-26 14:18:26.780 | DEBUG    | __main__:trials:24 - Trial = 24772/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.782 | DEBUG    | __main__:trials:29 - Trial = 24772/30000 | Total reward = 37.79
2022-01-26 14:18:26.785 | DEBUG    | __main__:trials:24 - Trial = 24773/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.786 | DEBUG    | __main__:trials:29 - Trial = 24773/30000 | Total reward = 22.29
2022-01-26 14:18:26.789 | DEBUG    | __main__:trials:24 - Trial = 24774/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.791 | DEBUG    | __main__:trials:29 - Trial = 24774/30000 | Total reward = 34.39
2022-01-26 14:18:26.794 | DEBUG    | __main__:trials:24 - Trial = 24775/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.796 | DEBUG    | __main__:trials:29 - Trial = 24775/30000 | Total reward = 39.24
2022-01-26 14:18:26.800 | DEBUG    | __main__:trials:24 - Trial = 24776/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.801 | DEBUG    | __main__:trials:29 - Trial = 24776/30000 | Total reward = 40.39
2022-01-26 14:18:26.804 | DEBUG    | __main__:trials:24 - Trial = 24777/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.806 | DEBUG    | __main__:trials:29 - Trial = 24777/30000 | Total reward = 25.31
2022-01-26 14:18:26.810 | DEBUG    | __main__:trials:24 - Trial = 24778/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.810 | DEBUG    | __main__:trials:29 - Trial = 24778/30000 | Total reward = 50.19
2022-01-26 14:18:26.814 | DEBUG    | __main__:trials:24 - Trial = 24779/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.816 | DEBUG    | __main__:trials:29 - Trial = 24779/30000 | Total reward = 36.89
2022-01-26 14:18:26.819 | DEBUG    | __main__:trials:24 - Trial = 24780/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.820 | DEBUG    | __main__:trials:29 - Trial = 24780/30000 | Total reward = 42.93
2022-01-26 14:18:26.824 | DEBUG    | __main__:trials:24 - Trial = 24781/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.826 | DEBUG    | __main__:trials:29 - Trial = 24781/30000 | Total reward = 39.45
2022-01-26 14:18:26.830 | DEBUG    | __main__:trials:24 - Trial = 24782/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.831 | DEBUG    | __main__:trials:29 - Trial = 24782/30000 | Total reward = 39.92
2022-01-26 14:18:26.835 | DEBUG    | __main__:trials:24 - Trial = 24783/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.837 | DEBUG    | __main__:trials:29 - Trial = 24783/30000 | Total reward = 35.41
2022-01-26 14:18:26.840 | DEBUG    | __main__:trials:24 - Trial = 24784/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.842 | DEBUG    | __main__:trials:29 - Trial = 24784/30000 | Total reward = 38.39
2022-01-26 14:18:26.846 | DEBUG    | __main__:trials:24 - Trial = 24785/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.848 | DEBUG    | __main__:trials:29 - Trial = 24785/30000 | Total reward = 23.00
2022-01-26 14:18:26.850 | DEBUG    | __main__:trials:24 - Trial = 24786/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.851 | DEBUG    | __main__:trials:29 - Trial = 24786/30000 | Total reward = 43.76
2022-01-26 14:18:26.854 | DEBUG    | __main__:trials:24 - Trial = 24787/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.855 | DEBUG    | __main__:trials:29 - Trial = 24787/30000 | Total reward = 37.15
2022-01-26 14:18:26.859 | DEBUG    | __main__:trials:24 - Trial = 24788/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.861 | DEBUG    | __main__:trials:29 - Trial = 24788/30000 | Total reward = 50.38
2022-01-26 14:18:26.864 | DEBUG    | __main__:trials:24 - Trial = 24789/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.866 | DEBUG    | __main__:trials:29 - Trial = 24789/30000 | Total reward = 40.61
2022-01-26 14:18:26.870 | DEBUG    | __main__:trials:24 - Trial = 24790/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.871 | DEBUG    | __main__:trials:29 - Trial = 24790/30000 | Total reward = 36.30
2022-01-26 14:18:26.875 | DEBUG    | __main__:trials:24 - Trial = 24791/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.877 | DEBUG    | __main__:trials:29 - Trial = 24791/30000 | Total reward = 36.15
2022-01-26 14:18:26.880 | DEBUG    | __main__:trials:24 - Trial = 24792/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.882 | DEBUG    | __main__:trials:29 - Trial = 24792/30000 | Total reward = 51.26
2022-01-26 14:18:26.886 | DEBUG    | __main__:trials:24 - Trial = 24793/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.887 | DEBUG    | __main__:trials:29 - Trial = 24793/30000 | Total reward = 51.07
2022-01-26 14:18:26.890 | DEBUG    | __main__:trials:26 - Trial = 24794/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.892 | DEBUG    | __main__:trials:29 - Trial = 24794/30000 | Total reward = 13.50
2022-01-26 14:18:26.895 | DEBUG    | __main__:trials:24 - Trial = 24795/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.897 | DEBUG    | __main__:trials:29 - Trial = 24795/30000 | Total reward = 39.92
2022-01-26 14:18:26.900 | DEBUG    | __main__:trials:24 - Trial = 24796/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.902 | DEBUG    | __main__:trials:29 - Trial = 24796/30000 | Total reward = 20.86
2022-01-26 14:18:26.905 | DEBUG    | __main__:trials:24 - Trial = 24797/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.906 | DEBUG    | __main__:trials:29 - Trial = 24797/30000 | Total reward = 34.72
2022-01-26 14:18:26.910 | DEBUG    | __main__:trials:24 - Trial = 24798/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.912 | DEBUG    | __main__:trials:29 - Trial = 24798/30000 | Total reward = 36.24
2022-01-26 14:18:26.915 | DEBUG    | __main__:trials:24 - Trial = 24799/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.916 | DEBUG    | __main__:trials:29 - Trial = 24799/30000 | Total reward = 48.95
2022-01-26 14:18:26.919 | DEBUG    | __main__:trials:24 - Trial = 24800/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.920 | DEBUG    | __main__:trials:29 - Trial = 24800/30000 | Total reward = 35.04
2022-01-26 14:18:26.923 | DEBUG    | __main__:trials:26 - Trial = 24801/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.925 | DEBUG    | __main__:trials:29 - Trial = 24801/30000 | Total reward = 9.43
2022-01-26 14:18:26.928 | DEBUG    | __main__:trials:24 - Trial = 24802/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.929 | DEBUG    | __main__:trials:29 - Trial = 24802/30000 | Total reward = 31.36
2022-01-26 14:18:26.932 | DEBUG    | __main__:trials:24 - Trial = 24803/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.933 | DEBUG    | __main__:trials:29 - Trial = 24803/30000 | Total reward = 35.53
2022-01-26 14:18:26.937 | DEBUG    | __main__:trials:24 - Trial = 24804/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.938 | DEBUG    | __main__:trials:29 - Trial = 24804/30000 | Total reward = 32.76
2022-01-26 14:18:26.942 | DEBUG    | __main__:trials:26 - Trial = 24805/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:26.942 | DEBUG    | __main__:trials:29 - Trial = 24805/30000 | Total reward = 20.29
2022-01-26 14:18:26.946 | DEBUG    | __main__:trials:24 - Trial = 24806/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.948 | DEBUG    | __main__:trials:29 - Trial = 24806/30000 | Total reward = 41.65
2022-01-26 14:18:26.951 | DEBUG    | __main__:trials:24 - Trial = 24807/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.952 | DEBUG    | __main__:trials:29 - Trial = 24807/30000 | Total reward = 34.95
2022-01-26 14:18:26.957 | DEBUG    | __main__:trials:24 - Trial = 24808/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.957 | DEBUG    | __main__:trials:29 - Trial = 24808/30000 | Total reward = 33.45
2022-01-26 14:18:26.961 | DEBUG    | __main__:trials:24 - Trial = 24809/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.961 | DEBUG    | __main__:trials:29 - Trial = 24809/30000 | Total reward = 35.04
2022-01-26 14:18:26.966 | DEBUG    | __main__:trials:24 - Trial = 24810/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.968 | DEBUG    | __main__:trials:29 - Trial = 24810/30000 | Total reward = 35.04
2022-01-26 14:18:26.971 | DEBUG    | __main__:trials:24 - Trial = 24811/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.973 | DEBUG    | __main__:trials:29 - Trial = 24811/30000 | Total reward = 43.02
2022-01-26 14:18:26.976 | DEBUG    | __main__:trials:24 - Trial = 24812/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.978 | DEBUG    | __main__:trials:29 - Trial = 24812/30000 | Total reward = 38.03
2022-01-26 14:18:26.981 | DEBUG    | __main__:trials:24 - Trial = 24813/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.983 | DEBUG    | __main__:trials:29 - Trial = 24813/30000 | Total reward = 38.92
2022-01-26 14:18:26.986 | DEBUG    | __main__:trials:24 - Trial = 24814/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.988 | DEBUG    | __main__:trials:29 - Trial = 24814/30000 | Total reward = 41.11
2022-01-26 14:18:26.991 | DEBUG    | __main__:trials:24 - Trial = 24815/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.993 | DEBUG    | __main__:trials:29 - Trial = 24815/30000 | Total reward = 32.07
2022-01-26 14:18:26.996 | DEBUG    | __main__:trials:24 - Trial = 24816/30000 | Max number of steps (20) reached
2022-01-26 14:18:26.997 | DEBUG    | __main__:trials:29 - Trial = 24816/30000 | Total reward = 45.72
2022-01-26 14:18:27.001 | DEBUG    | __main__:trials:24 - Trial = 24817/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.003 | DEBUG    | __main__:trials:29 - Trial = 24817/30000 | Total reward = 43.09
2022-01-26 14:18:27.006 | DEBUG    | __main__:trials:24 - Trial = 24818/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.008 | DEBUG    | __main__:trials:29 - Trial = 24818/30000 | Total reward = 31.97
2022-01-26 14:18:27.010 | DEBUG    | __main__:trials:26 - Trial = 24819/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.012 | DEBUG    | __main__:trials:29 - Trial = 24819/30000 | Total reward = 10.89
2022-01-26 14:18:27.014 | DEBUG    | __main__:trials:26 - Trial = 24820/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.016 | DEBUG    | __main__:trials:29 - Trial = 24820/30000 | Total reward = 10.89
2022-01-26 14:18:27.019 | DEBUG    | __main__:trials:24 - Trial = 24821/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.020 | DEBUG    | __main__:trials:29 - Trial = 24821/30000 | Total reward = 25.33
2022-01-26 14:18:27.024 | DEBUG    | __main__:trials:24 - Trial = 24822/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.025 | DEBUG    | __main__:trials:29 - Trial = 24822/30000 | Total reward = 35.23
2022-01-26 14:18:27.029 | DEBUG    | __main__:trials:24 - Trial = 24823/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.030 | DEBUG    | __main__:trials:29 - Trial = 24823/30000 | Total reward = 32.66
2022-01-26 14:18:27.034 | DEBUG    | __main__:trials:24 - Trial = 24824/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.035 | DEBUG    | __main__:trials:29 - Trial = 24824/30000 | Total reward = 33.89
2022-01-26 14:18:27.039 | DEBUG    | __main__:trials:24 - Trial = 24825/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.040 | DEBUG    | __main__:trials:29 - Trial = 24825/30000 | Total reward = 30.01
2022-01-26 14:18:27.044 | DEBUG    | __main__:trials:24 - Trial = 24826/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.045 | DEBUG    | __main__:trials:29 - Trial = 24826/30000 | Total reward = 43.80
2022-01-26 14:18:27.048 | DEBUG    | __main__:trials:24 - Trial = 24827/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.050 | DEBUG    | __main__:trials:29 - Trial = 24827/30000 | Total reward = 35.44
2022-01-26 14:18:27.054 | DEBUG    | __main__:trials:24 - Trial = 24828/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.055 | DEBUG    | __main__:trials:29 - Trial = 24828/30000 | Total reward = 35.01
2022-01-26 14:18:27.059 | DEBUG    | __main__:trials:24 - Trial = 24829/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.059 | DEBUG    | __main__:trials:29 - Trial = 24829/30000 | Total reward = 32.48
2022-01-26 14:18:27.064 | DEBUG    | __main__:trials:24 - Trial = 24830/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.064 | DEBUG    | __main__:trials:29 - Trial = 24830/30000 | Total reward = 45.12
2022-01-26 14:18:27.069 | DEBUG    | __main__:trials:24 - Trial = 24831/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.070 | DEBUG    | __main__:trials:29 - Trial = 24831/30000 | Total reward = 31.11
2022-01-26 14:18:27.075 | DEBUG    | __main__:trials:24 - Trial = 24832/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.075 | DEBUG    | __main__:trials:29 - Trial = 24832/30000 | Total reward = 30.87
2022-01-26 14:18:27.080 | DEBUG    | __main__:trials:24 - Trial = 24833/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.081 | DEBUG    | __main__:trials:29 - Trial = 24833/30000 | Total reward = 21.72
2022-01-26 14:18:27.084 | DEBUG    | __main__:trials:24 - Trial = 24834/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.085 | DEBUG    | __main__:trials:29 - Trial = 24834/30000 | Total reward = 55.53
2022-01-26 14:18:27.088 | DEBUG    | __main__:trials:24 - Trial = 24835/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.089 | DEBUG    | __main__:trials:29 - Trial = 24835/30000 | Total reward = 47.87
2022-01-26 14:18:27.092 | DEBUG    | __main__:trials:24 - Trial = 24836/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.093 | DEBUG    | __main__:trials:29 - Trial = 24836/30000 | Total reward = 36.45
2022-01-26 14:18:27.098 | DEBUG    | __main__:trials:24 - Trial = 24837/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.098 | DEBUG    | __main__:trials:29 - Trial = 24837/30000 | Total reward = 46.16
2022-01-26 14:18:27.103 | DEBUG    | __main__:trials:24 - Trial = 24838/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.104 | DEBUG    | __main__:trials:29 - Trial = 24838/30000 | Total reward = 30.64
2022-01-26 14:18:27.108 | DEBUG    | __main__:trials:24 - Trial = 24839/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.109 | DEBUG    | __main__:trials:29 - Trial = 24839/30000 | Total reward = 37.28
2022-01-26 14:18:27.112 | DEBUG    | __main__:trials:24 - Trial = 24840/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.114 | DEBUG    | __main__:trials:29 - Trial = 24840/30000 | Total reward = 37.45
2022-01-26 14:18:27.118 | DEBUG    | __main__:trials:24 - Trial = 24841/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.119 | DEBUG    | __main__:trials:29 - Trial = 24841/30000 | Total reward = 33.78
2022-01-26 14:18:27.123 | DEBUG    | __main__:trials:24 - Trial = 24842/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.124 | DEBUG    | __main__:trials:29 - Trial = 24842/30000 | Total reward = 37.53
2022-01-26 14:18:27.127 | DEBUG    | __main__:trials:24 - Trial = 24843/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.129 | DEBUG    | __main__:trials:29 - Trial = 24843/30000 | Total reward = 34.50
2022-01-26 14:18:27.132 | DEBUG    | __main__:trials:24 - Trial = 24844/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.134 | DEBUG    | __main__:trials:29 - Trial = 24844/30000 | Total reward = 34.12
2022-01-26 14:18:27.138 | DEBUG    | __main__:trials:24 - Trial = 24845/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.139 | DEBUG    | __main__:trials:29 - Trial = 24845/30000 | Total reward = 48.82
2022-01-26 14:18:27.143 | DEBUG    | __main__:trials:24 - Trial = 24846/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.144 | DEBUG    | __main__:trials:29 - Trial = 24846/30000 | Total reward = 52.53
2022-01-26 14:18:27.147 | DEBUG    | __main__:trials:24 - Trial = 24847/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.149 | DEBUG    | __main__:trials:29 - Trial = 24847/30000 | Total reward = 40.16
2022-01-26 14:18:27.153 | DEBUG    | __main__:trials:24 - Trial = 24848/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.154 | DEBUG    | __main__:trials:29 - Trial = 24848/30000 | Total reward = 34.35
2022-01-26 14:18:27.158 | DEBUG    | __main__:trials:24 - Trial = 24849/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.159 | DEBUG    | __main__:trials:29 - Trial = 24849/30000 | Total reward = 32.42
2022-01-26 14:18:27.163 | DEBUG    | __main__:trials:24 - Trial = 24850/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.165 | DEBUG    | __main__:trials:29 - Trial = 24850/30000 | Total reward = 37.47
2022-01-26 14:18:27.168 | DEBUG    | __main__:trials:24 - Trial = 24851/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.170 | DEBUG    | __main__:trials:29 - Trial = 24851/30000 | Total reward = 32.08
2022-01-26 14:18:27.173 | DEBUG    | __main__:trials:24 - Trial = 24852/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.175 | DEBUG    | __main__:trials:29 - Trial = 24852/30000 | Total reward = 43.40
2022-01-26 14:18:27.179 | DEBUG    | __main__:trials:24 - Trial = 24853/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.180 | DEBUG    | __main__:trials:29 - Trial = 24853/30000 | Total reward = 40.09
2022-01-26 14:18:27.183 | DEBUG    | __main__:trials:24 - Trial = 24854/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.185 | DEBUG    | __main__:trials:29 - Trial = 24854/30000 | Total reward = 42.30
2022-01-26 14:18:27.188 | DEBUG    | __main__:trials:26 - Trial = 24855/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.189 | DEBUG    | __main__:trials:29 - Trial = 24855/30000 | Total reward = 15.71
2022-01-26 14:18:27.192 | DEBUG    | __main__:trials:26 - Trial = 24856/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.193 | DEBUG    | __main__:trials:29 - Trial = 24856/30000 | Total reward = 14.43
2022-01-26 14:18:27.198 | DEBUG    | __main__:trials:24 - Trial = 24857/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.199 | DEBUG    | __main__:trials:29 - Trial = 24857/30000 | Total reward = 43.97
2022-01-26 14:18:27.202 | DEBUG    | __main__:trials:26 - Trial = 24858/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.204 | DEBUG    | __main__:trials:29 - Trial = 24858/30000 | Total reward = 22.79
2022-01-26 14:18:27.207 | DEBUG    | __main__:trials:26 - Trial = 24859/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.208 | DEBUG    | __main__:trials:29 - Trial = 24859/30000 | Total reward = 27.03
2022-01-26 14:18:27.211 | DEBUG    | __main__:trials:24 - Trial = 24860/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.213 | DEBUG    | __main__:trials:29 - Trial = 24860/30000 | Total reward = 59.52
2022-01-26 14:18:27.216 | DEBUG    | __main__:trials:26 - Trial = 24861/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.218 | DEBUG    | __main__:trials:29 - Trial = 24861/30000 | Total reward = 24.50
2022-01-26 14:18:27.221 | DEBUG    | __main__:trials:24 - Trial = 24862/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.223 | DEBUG    | __main__:trials:29 - Trial = 24862/30000 | Total reward = 50.42
2022-01-26 14:18:27.227 | DEBUG    | __main__:trials:24 - Trial = 24863/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.228 | DEBUG    | __main__:trials:29 - Trial = 24863/30000 | Total reward = 21.53
2022-01-26 14:18:27.231 | DEBUG    | __main__:trials:24 - Trial = 24864/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.233 | DEBUG    | __main__:trials:29 - Trial = 24864/30000 | Total reward = 40.59
2022-01-26 14:18:27.237 | DEBUG    | __main__:trials:24 - Trial = 24865/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.238 | DEBUG    | __main__:trials:29 - Trial = 24865/30000 | Total reward = 39.85
2022-01-26 14:18:27.242 | DEBUG    | __main__:trials:24 - Trial = 24866/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.243 | DEBUG    | __main__:trials:29 - Trial = 24866/30000 | Total reward = 38.36
2022-01-26 14:18:27.248 | DEBUG    | __main__:trials:24 - Trial = 24867/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.250 | DEBUG    | __main__:trials:29 - Trial = 24867/30000 | Total reward = 39.89
2022-01-26 14:18:27.253 | DEBUG    | __main__:trials:24 - Trial = 24868/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.254 | DEBUG    | __main__:trials:29 - Trial = 24868/30000 | Total reward = 37.76
2022-01-26 14:18:27.257 | DEBUG    | __main__:trials:26 - Trial = 24869/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.258 | DEBUG    | __main__:trials:29 - Trial = 24869/30000 | Total reward = 26.58
2022-01-26 14:18:27.262 | DEBUG    | __main__:trials:26 - Trial = 24870/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.263 | DEBUG    | __main__:trials:29 - Trial = 24870/30000 | Total reward = 17.74
2022-01-26 14:18:27.267 | DEBUG    | __main__:trials:24 - Trial = 24871/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.268 | DEBUG    | __main__:trials:29 - Trial = 24871/30000 | Total reward = 47.87
2022-01-26 14:18:27.272 | DEBUG    | __main__:trials:24 - Trial = 24872/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.273 | DEBUG    | __main__:trials:29 - Trial = 24872/30000 | Total reward = 26.87
2022-01-26 14:18:27.275 | DEBUG    | __main__:trials:26 - Trial = 24873/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.277 | DEBUG    | __main__:trials:29 - Trial = 24873/30000 | Total reward = 12.80
2022-01-26 14:18:27.280 | DEBUG    | __main__:trials:24 - Trial = 24874/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.281 | DEBUG    | __main__:trials:29 - Trial = 24874/30000 | Total reward = 38.36
2022-01-26 14:18:27.284 | DEBUG    | __main__:trials:26 - Trial = 24875/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.286 | DEBUG    | __main__:trials:29 - Trial = 24875/30000 | Total reward = 24.20
2022-01-26 14:18:27.290 | DEBUG    | __main__:trials:24 - Trial = 24876/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.291 | DEBUG    | __main__:trials:29 - Trial = 24876/30000 | Total reward = 28.33
2022-01-26 14:18:27.294 | DEBUG    | __main__:trials:24 - Trial = 24877/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.296 | DEBUG    | __main__:trials:29 - Trial = 24877/30000 | Total reward = 44.42
2022-01-26 14:18:27.299 | DEBUG    | __main__:trials:24 - Trial = 24878/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.300 | DEBUG    | __main__:trials:29 - Trial = 24878/30000 | Total reward = 43.14
2022-01-26 14:18:27.303 | DEBUG    | __main__:trials:24 - Trial = 24879/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.305 | DEBUG    | __main__:trials:29 - Trial = 24879/30000 | Total reward = 37.59
2022-01-26 14:18:27.308 | DEBUG    | __main__:trials:24 - Trial = 24880/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.310 | DEBUG    | __main__:trials:29 - Trial = 24880/30000 | Total reward = 42.14
2022-01-26 14:18:27.313 | DEBUG    | __main__:trials:24 - Trial = 24881/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.314 | DEBUG    | __main__:trials:29 - Trial = 24881/30000 | Total reward = 27.70
2022-01-26 14:18:27.317 | DEBUG    | __main__:trials:26 - Trial = 24882/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.319 | DEBUG    | __main__:trials:29 - Trial = 24882/30000 | Total reward = 18.83
2022-01-26 14:18:27.323 | DEBUG    | __main__:trials:24 - Trial = 24883/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.324 | DEBUG    | __main__:trials:29 - Trial = 24883/30000 | Total reward = 28.99
2022-01-26 14:18:27.328 | DEBUG    | __main__:trials:24 - Trial = 24884/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.330 | DEBUG    | __main__:trials:29 - Trial = 24884/30000 | Total reward = 47.73
2022-01-26 14:18:27.333 | DEBUG    | __main__:trials:24 - Trial = 24885/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.334 | DEBUG    | __main__:trials:29 - Trial = 24885/30000 | Total reward = 42.16
2022-01-26 14:18:27.338 | DEBUG    | __main__:trials:24 - Trial = 24886/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.338 | DEBUG    | __main__:trials:29 - Trial = 24886/30000 | Total reward = 48.75
2022-01-26 14:18:27.343 | DEBUG    | __main__:trials:24 - Trial = 24887/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.343 | DEBUG    | __main__:trials:29 - Trial = 24887/30000 | Total reward = 41.11
2022-01-26 14:18:27.348 | DEBUG    | __main__:trials:24 - Trial = 24888/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.349 | DEBUG    | __main__:trials:29 - Trial = 24888/30000 | Total reward = 40.08
2022-01-26 14:18:27.353 | DEBUG    | __main__:trials:26 - Trial = 24889/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.353 | DEBUG    | __main__:trials:29 - Trial = 24889/30000 | Total reward = 23.57
2022-01-26 14:18:27.356 | DEBUG    | __main__:trials:26 - Trial = 24890/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.358 | DEBUG    | __main__:trials:29 - Trial = 24890/30000 | Total reward = 23.57
2022-01-26 14:18:27.361 | DEBUG    | __main__:trials:24 - Trial = 24891/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.361 | DEBUG    | __main__:trials:29 - Trial = 24891/30000 | Total reward = 48.51
2022-01-26 14:18:27.364 | DEBUG    | __main__:trials:26 - Trial = 24892/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.366 | DEBUG    | __main__:trials:29 - Trial = 24892/30000 | Total reward = 19.27
2022-01-26 14:18:27.370 | DEBUG    | __main__:trials:24 - Trial = 24893/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.371 | DEBUG    | __main__:trials:29 - Trial = 24893/30000 | Total reward = 37.69
2022-01-26 14:18:27.374 | DEBUG    | __main__:trials:26 - Trial = 24894/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.376 | DEBUG    | __main__:trials:29 - Trial = 24894/30000 | Total reward = 27.74
2022-01-26 14:18:27.379 | DEBUG    | __main__:trials:24 - Trial = 24895/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.381 | DEBUG    | __main__:trials:29 - Trial = 24895/30000 | Total reward = 29.42
2022-01-26 14:18:27.384 | DEBUG    | __main__:trials:24 - Trial = 24896/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.386 | DEBUG    | __main__:trials:29 - Trial = 24896/30000 | Total reward = 38.70
2022-01-26 14:18:27.389 | DEBUG    | __main__:trials:26 - Trial = 24897/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.390 | DEBUG    | __main__:trials:29 - Trial = 24897/30000 | Total reward = 25.62
2022-01-26 14:18:27.394 | DEBUG    | __main__:trials:24 - Trial = 24898/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.396 | DEBUG    | __main__:trials:29 - Trial = 24898/30000 | Total reward = 42.78
2022-01-26 14:18:27.399 | DEBUG    | __main__:trials:24 - Trial = 24899/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.401 | DEBUG    | __main__:trials:29 - Trial = 24899/30000 | Total reward = 37.80
2022-01-26 14:18:27.404 | DEBUG    | __main__:trials:24 - Trial = 24900/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.406 | DEBUG    | __main__:trials:29 - Trial = 24900/30000 | Total reward = 53.63
2022-01-26 14:18:27.410 | DEBUG    | __main__:trials:24 - Trial = 24901/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.411 | DEBUG    | __main__:trials:29 - Trial = 24901/30000 | Total reward = 41.45
2022-01-26 14:18:27.415 | DEBUG    | __main__:trials:24 - Trial = 24902/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.416 | DEBUG    | __main__:trials:29 - Trial = 24902/30000 | Total reward = 46.16
2022-01-26 14:18:27.420 | DEBUG    | __main__:trials:26 - Trial = 24903/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.421 | DEBUG    | __main__:trials:29 - Trial = 24903/30000 | Total reward = 20.75
2022-01-26 14:18:27.425 | DEBUG    | __main__:trials:24 - Trial = 24904/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.426 | DEBUG    | __main__:trials:29 - Trial = 24904/30000 | Total reward = 37.61
2022-01-26 14:18:27.431 | DEBUG    | __main__:trials:24 - Trial = 24905/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.431 | DEBUG    | __main__:trials:29 - Trial = 24905/30000 | Total reward = 36.51
2022-01-26 14:18:27.436 | DEBUG    | __main__:trials:24 - Trial = 24906/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.437 | DEBUG    | __main__:trials:29 - Trial = 24906/30000 | Total reward = 37.32
2022-01-26 14:18:27.440 | DEBUG    | __main__:trials:24 - Trial = 24907/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.442 | DEBUG    | __main__:trials:29 - Trial = 24907/30000 | Total reward = 38.76
2022-01-26 14:18:27.445 | DEBUG    | __main__:trials:26 - Trial = 24908/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.446 | DEBUG    | __main__:trials:29 - Trial = 24908/30000 | Total reward = 16.39
2022-01-26 14:18:27.449 | DEBUG    | __main__:trials:24 - Trial = 24909/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.451 | DEBUG    | __main__:trials:29 - Trial = 24909/30000 | Total reward = 39.19
2022-01-26 14:18:27.455 | DEBUG    | __main__:trials:24 - Trial = 24910/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.455 | DEBUG    | __main__:trials:29 - Trial = 24910/30000 | Total reward = 39.90
2022-01-26 14:18:27.460 | DEBUG    | __main__:trials:24 - Trial = 24911/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.460 | DEBUG    | __main__:trials:29 - Trial = 24911/30000 | Total reward = 29.16
2022-01-26 14:18:27.465 | DEBUG    | __main__:trials:24 - Trial = 24912/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.465 | DEBUG    | __main__:trials:29 - Trial = 24912/30000 | Total reward = 35.84
2022-01-26 14:18:27.470 | DEBUG    | __main__:trials:24 - Trial = 24913/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.472 | DEBUG    | __main__:trials:29 - Trial = 24913/30000 | Total reward = 40.63
2022-01-26 14:18:27.476 | DEBUG    | __main__:trials:24 - Trial = 24914/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.477 | DEBUG    | __main__:trials:29 - Trial = 24914/30000 | Total reward = 41.75
2022-01-26 14:18:27.481 | DEBUG    | __main__:trials:24 - Trial = 24915/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.483 | DEBUG    | __main__:trials:29 - Trial = 24915/30000 | Total reward = 23.11
2022-01-26 14:18:27.486 | DEBUG    | __main__:trials:24 - Trial = 24916/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.487 | DEBUG    | __main__:trials:29 - Trial = 24916/30000 | Total reward = 34.83
2022-01-26 14:18:27.491 | DEBUG    | __main__:trials:24 - Trial = 24917/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.492 | DEBUG    | __main__:trials:29 - Trial = 24917/30000 | Total reward = 40.61
2022-01-26 14:18:27.496 | DEBUG    | __main__:trials:24 - Trial = 24918/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.497 | DEBUG    | __main__:trials:29 - Trial = 24918/30000 | Total reward = 41.34
2022-01-26 14:18:27.500 | DEBUG    | __main__:trials:26 - Trial = 24919/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.501 | DEBUG    | __main__:trials:29 - Trial = 24919/30000 | Total reward = 26.35
2022-01-26 14:18:27.504 | DEBUG    | __main__:trials:24 - Trial = 24920/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.506 | DEBUG    | __main__:trials:29 - Trial = 24920/30000 | Total reward = 17.94
2022-01-26 14:18:27.509 | DEBUG    | __main__:trials:24 - Trial = 24921/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.511 | DEBUG    | __main__:trials:29 - Trial = 24921/30000 | Total reward = 38.15
2022-01-26 14:18:27.514 | DEBUG    | __main__:trials:24 - Trial = 24922/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.515 | DEBUG    | __main__:trials:29 - Trial = 24922/30000 | Total reward = 44.45
2022-01-26 14:18:27.520 | DEBUG    | __main__:trials:24 - Trial = 24923/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.521 | DEBUG    | __main__:trials:29 - Trial = 24923/30000 | Total reward = 34.12
2022-01-26 14:18:27.525 | DEBUG    | __main__:trials:24 - Trial = 24924/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.526 | DEBUG    | __main__:trials:29 - Trial = 24924/30000 | Total reward = 35.61
2022-01-26 14:18:27.530 | DEBUG    | __main__:trials:24 - Trial = 24925/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.532 | DEBUG    | __main__:trials:29 - Trial = 24925/30000 | Total reward = 21.04
2022-01-26 14:18:27.535 | DEBUG    | __main__:trials:24 - Trial = 24926/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.537 | DEBUG    | __main__:trials:29 - Trial = 24926/30000 | Total reward = 37.37
2022-01-26 14:18:27.539 | DEBUG    | __main__:trials:24 - Trial = 24927/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.541 | DEBUG    | __main__:trials:29 - Trial = 24927/30000 | Total reward = 30.30
2022-01-26 14:18:27.545 | DEBUG    | __main__:trials:24 - Trial = 24928/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.546 | DEBUG    | __main__:trials:29 - Trial = 24928/30000 | Total reward = 31.79
2022-01-26 14:18:27.550 | DEBUG    | __main__:trials:24 - Trial = 24929/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.551 | DEBUG    | __main__:trials:29 - Trial = 24929/30000 | Total reward = 45.10
2022-01-26 14:18:27.554 | DEBUG    | __main__:trials:24 - Trial = 24930/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.556 | DEBUG    | __main__:trials:29 - Trial = 24930/30000 | Total reward = 38.85
2022-01-26 14:18:27.559 | DEBUG    | __main__:trials:24 - Trial = 24931/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.560 | DEBUG    | __main__:trials:29 - Trial = 24931/30000 | Total reward = 37.23
2022-01-26 14:18:27.564 | DEBUG    | __main__:trials:24 - Trial = 24932/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.566 | DEBUG    | __main__:trials:29 - Trial = 24932/30000 | Total reward = 36.03
2022-01-26 14:18:27.569 | DEBUG    | __main__:trials:24 - Trial = 24933/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.570 | DEBUG    | __main__:trials:29 - Trial = 24933/30000 | Total reward = 54.60
2022-01-26 14:18:27.574 | DEBUG    | __main__:trials:24 - Trial = 24934/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.575 | DEBUG    | __main__:trials:29 - Trial = 24934/30000 | Total reward = 37.32
2022-01-26 14:18:27.579 | DEBUG    | __main__:trials:24 - Trial = 24935/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.580 | DEBUG    | __main__:trials:29 - Trial = 24935/30000 | Total reward = 37.85
2022-01-26 14:18:27.584 | DEBUG    | __main__:trials:24 - Trial = 24936/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.585 | DEBUG    | __main__:trials:29 - Trial = 24936/30000 | Total reward = 37.52
2022-01-26 14:18:27.590 | DEBUG    | __main__:trials:24 - Trial = 24937/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.591 | DEBUG    | __main__:trials:29 - Trial = 24937/30000 | Total reward = 45.32
2022-01-26 14:18:27.594 | DEBUG    | __main__:trials:24 - Trial = 24938/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.596 | DEBUG    | __main__:trials:29 - Trial = 24938/30000 | Total reward = 47.14
2022-01-26 14:18:27.599 | DEBUG    | __main__:trials:24 - Trial = 24939/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.601 | DEBUG    | __main__:trials:29 - Trial = 24939/30000 | Total reward = 50.44
2022-01-26 14:18:27.604 | DEBUG    | __main__:trials:24 - Trial = 24940/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.605 | DEBUG    | __main__:trials:29 - Trial = 24940/30000 | Total reward = 38.23
2022-01-26 14:18:27.609 | DEBUG    | __main__:trials:24 - Trial = 24941/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.611 | DEBUG    | __main__:trials:29 - Trial = 24941/30000 | Total reward = 45.03
2022-01-26 14:18:27.615 | DEBUG    | __main__:trials:24 - Trial = 24942/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.616 | DEBUG    | __main__:trials:29 - Trial = 24942/30000 | Total reward = 33.78
2022-01-26 14:18:27.620 | DEBUG    | __main__:trials:24 - Trial = 24943/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.621 | DEBUG    | __main__:trials:29 - Trial = 24943/30000 | Total reward = 45.58
2022-01-26 14:18:27.624 | DEBUG    | __main__:trials:26 - Trial = 24944/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.625 | DEBUG    | __main__:trials:29 - Trial = 24944/30000 | Total reward = 16.52
2022-01-26 14:18:27.629 | DEBUG    | __main__:trials:24 - Trial = 24945/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.631 | DEBUG    | __main__:trials:29 - Trial = 24945/30000 | Total reward = 28.73
2022-01-26 14:18:27.634 | DEBUG    | __main__:trials:24 - Trial = 24946/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.636 | DEBUG    | __main__:trials:29 - Trial = 24946/30000 | Total reward = 29.76
2022-01-26 14:18:27.639 | DEBUG    | __main__:trials:24 - Trial = 24947/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.641 | DEBUG    | __main__:trials:29 - Trial = 24947/30000 | Total reward = 37.23
2022-01-26 14:18:27.645 | DEBUG    | __main__:trials:24 - Trial = 24948/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.646 | DEBUG    | __main__:trials:29 - Trial = 24948/30000 | Total reward = 38.57
2022-01-26 14:18:27.650 | DEBUG    | __main__:trials:24 - Trial = 24949/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.651 | DEBUG    | __main__:trials:29 - Trial = 24949/30000 | Total reward = 34.12
2022-01-26 14:18:27.655 | DEBUG    | __main__:trials:24 - Trial = 24950/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.657 | DEBUG    | __main__:trials:29 - Trial = 24950/30000 | Total reward = 33.52
2022-01-26 14:18:27.659 | DEBUG    | __main__:trials:26 - Trial = 24951/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.661 | DEBUG    | __main__:trials:29 - Trial = 24951/30000 | Total reward = 26.79
2022-01-26 14:18:27.665 | DEBUG    | __main__:trials:24 - Trial = 24952/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.665 | DEBUG    | __main__:trials:29 - Trial = 24952/30000 | Total reward = 25.20
2022-01-26 14:18:27.670 | DEBUG    | __main__:trials:24 - Trial = 24953/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.671 | DEBUG    | __main__:trials:29 - Trial = 24953/30000 | Total reward = 39.77
2022-01-26 14:18:27.674 | DEBUG    | __main__:trials:24 - Trial = 24954/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.676 | DEBUG    | __main__:trials:29 - Trial = 24954/30000 | Total reward = 31.72
2022-01-26 14:18:27.680 | DEBUG    | __main__:trials:24 - Trial = 24955/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.681 | DEBUG    | __main__:trials:29 - Trial = 24955/30000 | Total reward = 38.05
2022-01-26 14:18:27.685 | DEBUG    | __main__:trials:24 - Trial = 24956/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.686 | DEBUG    | __main__:trials:29 - Trial = 24956/30000 | Total reward = 36.22
2022-01-26 14:18:27.690 | DEBUG    | __main__:trials:24 - Trial = 24957/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.691 | DEBUG    | __main__:trials:29 - Trial = 24957/30000 | Total reward = 37.93
2022-01-26 14:18:27.695 | DEBUG    | __main__:trials:24 - Trial = 24958/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.697 | DEBUG    | __main__:trials:29 - Trial = 24958/30000 | Total reward = 48.94
2022-01-26 14:18:27.700 | DEBUG    | __main__:trials:24 - Trial = 24959/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.702 | DEBUG    | __main__:trials:29 - Trial = 24959/30000 | Total reward = 38.89
2022-01-26 14:18:27.706 | DEBUG    | __main__:trials:24 - Trial = 24960/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.707 | DEBUG    | __main__:trials:29 - Trial = 24960/30000 | Total reward = 37.41
2022-01-26 14:18:27.711 | DEBUG    | __main__:trials:24 - Trial = 24961/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.712 | DEBUG    | __main__:trials:29 - Trial = 24961/30000 | Total reward = 48.01
2022-01-26 14:18:27.715 | DEBUG    | __main__:trials:24 - Trial = 24962/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.717 | DEBUG    | __main__:trials:29 - Trial = 24962/30000 | Total reward = 23.28
2022-01-26 14:18:27.720 | DEBUG    | __main__:trials:24 - Trial = 24963/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.721 | DEBUG    | __main__:trials:29 - Trial = 24963/30000 | Total reward = 51.08
2022-01-26 14:18:27.725 | DEBUG    | __main__:trials:24 - Trial = 24964/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.725 | DEBUG    | __main__:trials:29 - Trial = 24964/30000 | Total reward = 37.39
2022-01-26 14:18:27.728 | DEBUG    | __main__:trials:24 - Trial = 24965/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.729 | DEBUG    | __main__:trials:29 - Trial = 24965/30000 | Total reward = 33.64
2022-01-26 14:18:27.733 | DEBUG    | __main__:trials:24 - Trial = 24966/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.734 | DEBUG    | __main__:trials:29 - Trial = 24966/30000 | Total reward = 41.13
2022-01-26 14:18:27.738 | DEBUG    | __main__:trials:24 - Trial = 24967/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.739 | DEBUG    | __main__:trials:29 - Trial = 24967/30000 | Total reward = 49.33
2022-01-26 14:18:27.742 | DEBUG    | __main__:trials:24 - Trial = 24968/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.744 | DEBUG    | __main__:trials:29 - Trial = 24968/30000 | Total reward = 35.82
2022-01-26 14:18:27.747 | DEBUG    | __main__:trials:24 - Trial = 24969/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.749 | DEBUG    | __main__:trials:29 - Trial = 24969/30000 | Total reward = 35.10
2022-01-26 14:18:27.752 | DEBUG    | __main__:trials:24 - Trial = 24970/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.754 | DEBUG    | __main__:trials:29 - Trial = 24970/30000 | Total reward = 31.44
2022-01-26 14:18:27.758 | DEBUG    | __main__:trials:24 - Trial = 24971/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.759 | DEBUG    | __main__:trials:29 - Trial = 24971/30000 | Total reward = 47.37
2022-01-26 14:18:27.762 | DEBUG    | __main__:trials:24 - Trial = 24972/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.764 | DEBUG    | __main__:trials:29 - Trial = 24972/30000 | Total reward = 46.70
2022-01-26 14:18:27.768 | DEBUG    | __main__:trials:24 - Trial = 24973/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.769 | DEBUG    | __main__:trials:29 - Trial = 24973/30000 | Total reward = 37.23
2022-01-26 14:18:27.773 | DEBUG    | __main__:trials:24 - Trial = 24974/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.774 | DEBUG    | __main__:trials:29 - Trial = 24974/30000 | Total reward = 23.34
2022-01-26 14:18:27.778 | DEBUG    | __main__:trials:26 - Trial = 24975/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.779 | DEBUG    | __main__:trials:29 - Trial = 24975/30000 | Total reward = 16.48
2022-01-26 14:18:27.782 | DEBUG    | __main__:trials:26 - Trial = 24976/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.784 | DEBUG    | __main__:trials:29 - Trial = 24976/30000 | Total reward = 12.63
2022-01-26 14:18:27.788 | DEBUG    | __main__:trials:24 - Trial = 24977/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.789 | DEBUG    | __main__:trials:29 - Trial = 24977/30000 | Total reward = 40.41
2022-01-26 14:18:27.792 | DEBUG    | __main__:trials:26 - Trial = 24978/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.793 | DEBUG    | __main__:trials:29 - Trial = 24978/30000 | Total reward = 6.44
2022-01-26 14:18:27.797 | DEBUG    | __main__:trials:24 - Trial = 24979/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.798 | DEBUG    | __main__:trials:29 - Trial = 24979/30000 | Total reward = 37.17
2022-01-26 14:18:27.800 | DEBUG    | __main__:trials:26 - Trial = 24980/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.801 | DEBUG    | __main__:trials:29 - Trial = 24980/30000 | Total reward = 6.44
2022-01-26 14:18:27.804 | DEBUG    | __main__:trials:24 - Trial = 24981/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.805 | DEBUG    | __main__:trials:29 - Trial = 24981/30000 | Total reward = 46.68
2022-01-26 14:18:27.808 | DEBUG    | __main__:trials:24 - Trial = 24982/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.810 | DEBUG    | __main__:trials:29 - Trial = 24982/30000 | Total reward = 46.86
2022-01-26 14:18:27.813 | DEBUG    | __main__:trials:24 - Trial = 24983/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.814 | DEBUG    | __main__:trials:29 - Trial = 24983/30000 | Total reward = 34.17
2022-01-26 14:18:27.819 | DEBUG    | __main__:trials:24 - Trial = 24984/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.820 | DEBUG    | __main__:trials:29 - Trial = 24984/30000 | Total reward = 34.99
2022-01-26 14:18:27.823 | DEBUG    | __main__:trials:26 - Trial = 24985/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.825 | DEBUG    | __main__:trials:29 - Trial = 24985/30000 | Total reward = 25.52
2022-01-26 14:18:27.828 | DEBUG    | __main__:trials:24 - Trial = 24986/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.830 | DEBUG    | __main__:trials:29 - Trial = 24986/30000 | Total reward = 35.44
2022-01-26 14:18:27.833 | DEBUG    | __main__:trials:26 - Trial = 24987/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.835 | DEBUG    | __main__:trials:29 - Trial = 24987/30000 | Total reward = 26.23
2022-01-26 14:18:27.839 | DEBUG    | __main__:trials:24 - Trial = 24988/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.840 | DEBUG    | __main__:trials:29 - Trial = 24988/30000 | Total reward = 32.76
2022-01-26 14:18:27.844 | DEBUG    | __main__:trials:24 - Trial = 24989/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.844 | DEBUG    | __main__:trials:29 - Trial = 24989/30000 | Total reward = 36.38
2022-01-26 14:18:27.849 | DEBUG    | __main__:trials:24 - Trial = 24990/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.849 | DEBUG    | __main__:trials:29 - Trial = 24990/30000 | Total reward = 39.34
2022-01-26 14:18:27.853 | DEBUG    | __main__:trials:24 - Trial = 24991/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.854 | DEBUG    | __main__:trials:29 - Trial = 24991/30000 | Total reward = 35.42
2022-01-26 14:18:27.859 | DEBUG    | __main__:trials:24 - Trial = 24992/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.859 | DEBUG    | __main__:trials:29 - Trial = 24992/30000 | Total reward = 28.17
2022-01-26 14:18:27.863 | DEBUG    | __main__:trials:24 - Trial = 24993/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.865 | DEBUG    | __main__:trials:29 - Trial = 24993/30000 | Total reward = 33.38
2022-01-26 14:18:27.868 | DEBUG    | __main__:trials:24 - Trial = 24994/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.869 | DEBUG    | __main__:trials:29 - Trial = 24994/30000 | Total reward = 26.14
2022-01-26 14:18:27.873 | DEBUG    | __main__:trials:24 - Trial = 24995/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.874 | DEBUG    | __main__:trials:29 - Trial = 24995/30000 | Total reward = 36.84
2022-01-26 14:18:27.877 | DEBUG    | __main__:trials:26 - Trial = 24996/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.878 | DEBUG    | __main__:trials:29 - Trial = 24996/30000 | Total reward = 24.91
2022-01-26 14:18:27.882 | DEBUG    | __main__:trials:24 - Trial = 24997/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.884 | DEBUG    | __main__:trials:29 - Trial = 24997/30000 | Total reward = 41.32
2022-01-26 14:18:27.887 | DEBUG    | __main__:trials:24 - Trial = 24998/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.889 | DEBUG    | __main__:trials:29 - Trial = 24998/30000 | Total reward = 33.72
2022-01-26 14:18:27.892 | DEBUG    | __main__:trials:24 - Trial = 24999/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.893 | DEBUG    | __main__:trials:29 - Trial = 24999/30000 | Total reward = 38.82
2022-01-26 14:18:27.897 | DEBUG    | __main__:trials:24 - Trial = 25000/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.898 | DEBUG    | __main__:trials:29 - Trial = 25000/30000 | Total reward = 45.88
2022-01-26 14:18:27.900 | DEBUG    | __main__:trials:26 - Trial = 25001/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.901 | DEBUG    | __main__:trials:29 - Trial = 25001/30000 | Total reward = 11.60
2022-01-26 14:18:27.904 | DEBUG    | __main__:trials:24 - Trial = 25002/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.905 | DEBUG    | __main__:trials:29 - Trial = 25002/30000 | Total reward = 38.89
2022-01-26 14:18:27.908 | DEBUG    | __main__:trials:24 - Trial = 25003/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.909 | DEBUG    | __main__:trials:29 - Trial = 25003/30000 | Total reward = 34.32
2022-01-26 14:18:27.912 | DEBUG    | __main__:trials:24 - Trial = 25004/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.914 | DEBUG    | __main__:trials:29 - Trial = 25004/30000 | Total reward = 32.42
2022-01-26 14:18:27.917 | DEBUG    | __main__:trials:24 - Trial = 25005/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.919 | DEBUG    | __main__:trials:29 - Trial = 25005/30000 | Total reward = 48.58
2022-01-26 14:18:27.923 | DEBUG    | __main__:trials:24 - Trial = 25006/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.924 | DEBUG    | __main__:trials:29 - Trial = 25006/30000 | Total reward = 31.85
2022-01-26 14:18:27.928 | DEBUG    | __main__:trials:24 - Trial = 25007/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.929 | DEBUG    | __main__:trials:29 - Trial = 25007/30000 | Total reward = 32.98
2022-01-26 14:18:27.933 | DEBUG    | __main__:trials:24 - Trial = 25008/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.934 | DEBUG    | __main__:trials:29 - Trial = 25008/30000 | Total reward = 35.12
2022-01-26 14:18:27.937 | DEBUG    | __main__:trials:24 - Trial = 25009/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.938 | DEBUG    | __main__:trials:29 - Trial = 25009/30000 | Total reward = 37.54
2022-01-26 14:18:27.942 | DEBUG    | __main__:trials:24 - Trial = 25010/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.943 | DEBUG    | __main__:trials:29 - Trial = 25010/30000 | Total reward = 46.76
2022-01-26 14:18:27.948 | DEBUG    | __main__:trials:24 - Trial = 25011/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.949 | DEBUG    | __main__:trials:29 - Trial = 25011/30000 | Total reward = 49.90
2022-01-26 14:18:27.952 | DEBUG    | __main__:trials:24 - Trial = 25012/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.953 | DEBUG    | __main__:trials:29 - Trial = 25012/30000 | Total reward = 45.06
2022-01-26 14:18:27.956 | DEBUG    | __main__:trials:24 - Trial = 25013/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.958 | DEBUG    | __main__:trials:29 - Trial = 25013/30000 | Total reward = 36.83
2022-01-26 14:18:27.962 | DEBUG    | __main__:trials:24 - Trial = 25014/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.963 | DEBUG    | __main__:trials:29 - Trial = 25014/30000 | Total reward = 37.39
2022-01-26 14:18:27.967 | DEBUG    | __main__:trials:24 - Trial = 25015/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.967 | DEBUG    | __main__:trials:29 - Trial = 25015/30000 | Total reward = 36.90
2022-01-26 14:18:27.971 | DEBUG    | __main__:trials:24 - Trial = 25016/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.973 | DEBUG    | __main__:trials:29 - Trial = 25016/30000 | Total reward = 38.10
2022-01-26 14:18:27.976 | DEBUG    | __main__:trials:24 - Trial = 25017/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.978 | DEBUG    | __main__:trials:29 - Trial = 25017/30000 | Total reward = 53.12
2022-01-26 14:18:27.981 | DEBUG    | __main__:trials:24 - Trial = 25018/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.983 | DEBUG    | __main__:trials:29 - Trial = 25018/30000 | Total reward = 29.81
2022-01-26 14:18:27.987 | DEBUG    | __main__:trials:24 - Trial = 25019/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.987 | DEBUG    | __main__:trials:29 - Trial = 25019/30000 | Total reward = 48.26
2022-01-26 14:18:27.992 | DEBUG    | __main__:trials:24 - Trial = 25020/30000 | Max number of steps (20) reached
2022-01-26 14:18:27.993 | DEBUG    | __main__:trials:29 - Trial = 25020/30000 | Total reward = 48.34
2022-01-26 14:18:27.997 | DEBUG    | __main__:trials:26 - Trial = 25021/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:27.998 | DEBUG    | __main__:trials:29 - Trial = 25021/30000 | Total reward = 19.71
2022-01-26 14:18:28.002 | DEBUG    | __main__:trials:24 - Trial = 25022/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.002 | DEBUG    | __main__:trials:29 - Trial = 25022/30000 | Total reward = 38.62
2022-01-26 14:18:28.007 | DEBUG    | __main__:trials:24 - Trial = 25023/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.007 | DEBUG    | __main__:trials:29 - Trial = 25023/30000 | Total reward = 40.67
2022-01-26 14:18:28.012 | DEBUG    | __main__:trials:24 - Trial = 25024/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.012 | DEBUG    | __main__:trials:29 - Trial = 25024/30000 | Total reward = 38.59
2022-01-26 14:18:28.016 | DEBUG    | __main__:trials:24 - Trial = 25025/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.018 | DEBUG    | __main__:trials:29 - Trial = 25025/30000 | Total reward = 37.51
2022-01-26 14:18:28.021 | DEBUG    | __main__:trials:24 - Trial = 25026/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.023 | DEBUG    | __main__:trials:29 - Trial = 25026/30000 | Total reward = 47.59
2022-01-26 14:18:28.026 | DEBUG    | __main__:trials:26 - Trial = 25027/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.028 | DEBUG    | __main__:trials:29 - Trial = 25027/30000 | Total reward = 22.51
2022-01-26 14:18:28.031 | DEBUG    | __main__:trials:24 - Trial = 25028/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.032 | DEBUG    | __main__:trials:29 - Trial = 25028/30000 | Total reward = 35.84
2022-01-26 14:18:28.036 | DEBUG    | __main__:trials:24 - Trial = 25029/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.037 | DEBUG    | __main__:trials:29 - Trial = 25029/30000 | Total reward = 33.51
2022-01-26 14:18:28.040 | DEBUG    | __main__:trials:24 - Trial = 25030/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.041 | DEBUG    | __main__:trials:29 - Trial = 25030/30000 | Total reward = 33.42
2022-01-26 14:18:28.045 | DEBUG    | __main__:trials:24 - Trial = 25031/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.045 | DEBUG    | __main__:trials:29 - Trial = 25031/30000 | Total reward = 43.63
2022-01-26 14:18:28.049 | DEBUG    | __main__:trials:24 - Trial = 25032/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.051 | DEBUG    | __main__:trials:29 - Trial = 25032/30000 | Total reward = 36.45
2022-01-26 14:18:28.054 | DEBUG    | __main__:trials:24 - Trial = 25033/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.054 | DEBUG    | __main__:trials:29 - Trial = 25033/30000 | Total reward = 51.90
2022-01-26 14:18:28.058 | DEBUG    | __main__:trials:24 - Trial = 25034/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.060 | DEBUG    | __main__:trials:29 - Trial = 25034/30000 | Total reward = 36.02
2022-01-26 14:18:28.063 | DEBUG    | __main__:trials:24 - Trial = 25035/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.064 | DEBUG    | __main__:trials:29 - Trial = 25035/30000 | Total reward = 38.31
2022-01-26 14:18:28.068 | DEBUG    | __main__:trials:24 - Trial = 25036/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.069 | DEBUG    | __main__:trials:29 - Trial = 25036/30000 | Total reward = 36.97
2022-01-26 14:18:28.073 | DEBUG    | __main__:trials:24 - Trial = 25037/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.075 | DEBUG    | __main__:trials:29 - Trial = 25037/30000 | Total reward = 26.57
2022-01-26 14:18:28.077 | DEBUG    | __main__:trials:24 - Trial = 25038/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.079 | DEBUG    | __main__:trials:29 - Trial = 25038/30000 | Total reward = 36.26
2022-01-26 14:18:28.082 | DEBUG    | __main__:trials:24 - Trial = 25039/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.084 | DEBUG    | __main__:trials:29 - Trial = 25039/30000 | Total reward = 38.89
2022-01-26 14:18:28.087 | DEBUG    | __main__:trials:24 - Trial = 25040/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.088 | DEBUG    | __main__:trials:29 - Trial = 25040/30000 | Total reward = 51.15
2022-01-26 14:18:28.092 | DEBUG    | __main__:trials:24 - Trial = 25041/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.092 | DEBUG    | __main__:trials:29 - Trial = 25041/30000 | Total reward = 33.06
2022-01-26 14:18:28.097 | DEBUG    | __main__:trials:24 - Trial = 25042/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.097 | DEBUG    | __main__:trials:29 - Trial = 25042/30000 | Total reward = 33.08
2022-01-26 14:18:28.101 | DEBUG    | __main__:trials:24 - Trial = 25043/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.102 | DEBUG    | __main__:trials:29 - Trial = 25043/30000 | Total reward = 36.89
2022-01-26 14:18:28.107 | DEBUG    | __main__:trials:24 - Trial = 25044/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.108 | DEBUG    | __main__:trials:29 - Trial = 25044/30000 | Total reward = 50.79
2022-01-26 14:18:28.111 | DEBUG    | __main__:trials:24 - Trial = 25045/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.113 | DEBUG    | __main__:trials:29 - Trial = 25045/30000 | Total reward = 35.58
2022-01-26 14:18:28.116 | DEBUG    | __main__:trials:24 - Trial = 25046/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.117 | DEBUG    | __main__:trials:29 - Trial = 25046/30000 | Total reward = 35.04
2022-01-26 14:18:28.120 | DEBUG    | __main__:trials:24 - Trial = 25047/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.122 | DEBUG    | __main__:trials:29 - Trial = 25047/30000 | Total reward = 40.79
2022-01-26 14:18:28.125 | DEBUG    | __main__:trials:24 - Trial = 25048/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.126 | DEBUG    | __main__:trials:29 - Trial = 25048/30000 | Total reward = 29.48
2022-01-26 14:18:28.130 | DEBUG    | __main__:trials:24 - Trial = 25049/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.131 | DEBUG    | __main__:trials:29 - Trial = 25049/30000 | Total reward = 36.87
2022-01-26 14:18:28.134 | DEBUG    | __main__:trials:24 - Trial = 25050/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.135 | DEBUG    | __main__:trials:29 - Trial = 25050/30000 | Total reward = 37.45
2022-01-26 14:18:28.139 | DEBUG    | __main__:trials:24 - Trial = 25051/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.140 | DEBUG    | __main__:trials:29 - Trial = 25051/30000 | Total reward = 33.42
2022-01-26 14:18:28.144 | DEBUG    | __main__:trials:24 - Trial = 25052/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.146 | DEBUG    | __main__:trials:29 - Trial = 25052/30000 | Total reward = 62.23
2022-01-26 14:18:28.149 | DEBUG    | __main__:trials:26 - Trial = 25053/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.152 | DEBUG    | __main__:trials:29 - Trial = 25053/30000 | Total reward = 29.23
2022-01-26 14:18:28.155 | DEBUG    | __main__:trials:24 - Trial = 25054/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.156 | DEBUG    | __main__:trials:29 - Trial = 25054/30000 | Total reward = 45.07
2022-01-26 14:18:28.160 | DEBUG    | __main__:trials:24 - Trial = 25055/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.161 | DEBUG    | __main__:trials:29 - Trial = 25055/30000 | Total reward = 43.34
2022-01-26 14:18:28.165 | DEBUG    | __main__:trials:24 - Trial = 25056/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.167 | DEBUG    | __main__:trials:29 - Trial = 25056/30000 | Total reward = 37.23
2022-01-26 14:18:28.169 | DEBUG    | __main__:trials:24 - Trial = 25057/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.171 | DEBUG    | __main__:trials:29 - Trial = 25057/30000 | Total reward = 46.21
2022-01-26 14:18:28.175 | DEBUG    | __main__:trials:24 - Trial = 25058/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.177 | DEBUG    | __main__:trials:29 - Trial = 25058/30000 | Total reward = 40.31
2022-01-26 14:18:28.180 | DEBUG    | __main__:trials:24 - Trial = 25059/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.182 | DEBUG    | __main__:trials:29 - Trial = 25059/30000 | Total reward = 41.03
2022-01-26 14:18:28.185 | DEBUG    | __main__:trials:24 - Trial = 25060/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.187 | DEBUG    | __main__:trials:29 - Trial = 25060/30000 | Total reward = 47.40
2022-01-26 14:18:28.190 | DEBUG    | __main__:trials:24 - Trial = 25061/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.192 | DEBUG    | __main__:trials:29 - Trial = 25061/30000 | Total reward = 39.50
2022-01-26 14:18:28.194 | DEBUG    | __main__:trials:24 - Trial = 25062/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.196 | DEBUG    | __main__:trials:29 - Trial = 25062/30000 | Total reward = 34.85
2022-01-26 14:18:28.200 | DEBUG    | __main__:trials:24 - Trial = 25063/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.202 | DEBUG    | __main__:trials:29 - Trial = 25063/30000 | Total reward = 37.83
2022-01-26 14:18:28.206 | DEBUG    | __main__:trials:24 - Trial = 25064/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.207 | DEBUG    | __main__:trials:29 - Trial = 25064/30000 | Total reward = 42.06
2022-01-26 14:18:28.210 | DEBUG    | __main__:trials:24 - Trial = 25065/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.212 | DEBUG    | __main__:trials:29 - Trial = 25065/30000 | Total reward = 43.26
2022-01-26 14:18:28.215 | DEBUG    | __main__:trials:24 - Trial = 25066/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.217 | DEBUG    | __main__:trials:29 - Trial = 25066/30000 | Total reward = 34.88
2022-01-26 14:18:28.220 | DEBUG    | __main__:trials:24 - Trial = 25067/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.222 | DEBUG    | __main__:trials:29 - Trial = 25067/30000 | Total reward = 41.47
2022-01-26 14:18:28.225 | DEBUG    | __main__:trials:24 - Trial = 25068/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.226 | DEBUG    | __main__:trials:29 - Trial = 25068/30000 | Total reward = 36.51
2022-01-26 14:18:28.230 | DEBUG    | __main__:trials:24 - Trial = 25069/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.231 | DEBUG    | __main__:trials:29 - Trial = 25069/30000 | Total reward = 48.05
2022-01-26 14:18:28.235 | DEBUG    | __main__:trials:24 - Trial = 25070/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.236 | DEBUG    | __main__:trials:29 - Trial = 25070/30000 | Total reward = 33.61
2022-01-26 14:18:28.239 | DEBUG    | __main__:trials:26 - Trial = 25071/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.241 | DEBUG    | __main__:trials:29 - Trial = 25071/30000 | Total reward = 13.14
2022-01-26 14:18:28.244 | DEBUG    | __main__:trials:24 - Trial = 25072/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.246 | DEBUG    | __main__:trials:29 - Trial = 25072/30000 | Total reward = 40.87
2022-01-26 14:18:28.250 | DEBUG    | __main__:trials:24 - Trial = 25073/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.251 | DEBUG    | __main__:trials:29 - Trial = 25073/30000 | Total reward = 35.77
2022-01-26 14:18:28.255 | DEBUG    | __main__:trials:24 - Trial = 25074/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.255 | DEBUG    | __main__:trials:29 - Trial = 25074/30000 | Total reward = 38.84
2022-01-26 14:18:28.260 | DEBUG    | __main__:trials:24 - Trial = 25075/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.261 | DEBUG    | __main__:trials:29 - Trial = 25075/30000 | Total reward = 47.10
2022-01-26 14:18:28.266 | DEBUG    | __main__:trials:24 - Trial = 25076/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.267 | DEBUG    | __main__:trials:29 - Trial = 25076/30000 | Total reward = 38.49
2022-01-26 14:18:28.271 | DEBUG    | __main__:trials:24 - Trial = 25077/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.273 | DEBUG    | __main__:trials:29 - Trial = 25077/30000 | Total reward = 39.56
2022-01-26 14:18:28.278 | DEBUG    | __main__:trials:24 - Trial = 25078/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.278 | DEBUG    | __main__:trials:29 - Trial = 25078/30000 | Total reward = 31.55
2022-01-26 14:18:28.283 | DEBUG    | __main__:trials:24 - Trial = 25079/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.285 | DEBUG    | __main__:trials:29 - Trial = 25079/30000 | Total reward = 46.61
2022-01-26 14:18:28.289 | DEBUG    | __main__:trials:24 - Trial = 25080/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.289 | DEBUG    | __main__:trials:29 - Trial = 25080/30000 | Total reward = 42.83
2022-01-26 14:18:28.294 | DEBUG    | __main__:trials:24 - Trial = 25081/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.295 | DEBUG    | __main__:trials:29 - Trial = 25081/30000 | Total reward = 46.97
2022-01-26 14:18:28.299 | DEBUG    | __main__:trials:24 - Trial = 25082/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.301 | DEBUG    | __main__:trials:29 - Trial = 25082/30000 | Total reward = 34.00
2022-01-26 14:18:28.305 | DEBUG    | __main__:trials:24 - Trial = 25083/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.306 | DEBUG    | __main__:trials:29 - Trial = 25083/30000 | Total reward = 44.96
2022-01-26 14:18:28.310 | DEBUG    | __main__:trials:24 - Trial = 25084/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.312 | DEBUG    | __main__:trials:29 - Trial = 25084/30000 | Total reward = 46.18
2022-01-26 14:18:28.315 | DEBUG    | __main__:trials:24 - Trial = 25085/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.316 | DEBUG    | __main__:trials:29 - Trial = 25085/30000 | Total reward = 36.62
2022-01-26 14:18:28.320 | DEBUG    | __main__:trials:24 - Trial = 25086/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.322 | DEBUG    | __main__:trials:29 - Trial = 25086/30000 | Total reward = 20.98
2022-01-26 14:18:28.326 | DEBUG    | __main__:trials:24 - Trial = 25087/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.327 | DEBUG    | __main__:trials:29 - Trial = 25087/30000 | Total reward = 18.95
2022-01-26 14:18:28.331 | DEBUG    | __main__:trials:26 - Trial = 25088/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.331 | DEBUG    | __main__:trials:29 - Trial = 25088/30000 | Total reward = 24.02
2022-01-26 14:18:28.336 | DEBUG    | __main__:trials:24 - Trial = 25089/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.337 | DEBUG    | __main__:trials:29 - Trial = 25089/30000 | Total reward = 38.48
2022-01-26 14:18:28.341 | DEBUG    | __main__:trials:24 - Trial = 25090/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.342 | DEBUG    | __main__:trials:29 - Trial = 25090/30000 | Total reward = 40.26
2022-01-26 14:18:28.345 | DEBUG    | __main__:trials:24 - Trial = 25091/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.346 | DEBUG    | __main__:trials:29 - Trial = 25091/30000 | Total reward = 27.45
2022-01-26 14:18:28.350 | DEBUG    | __main__:trials:24 - Trial = 25092/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.351 | DEBUG    | __main__:trials:29 - Trial = 25092/30000 | Total reward = 26.81
2022-01-26 14:18:28.355 | DEBUG    | __main__:trials:24 - Trial = 25093/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.356 | DEBUG    | __main__:trials:29 - Trial = 25093/30000 | Total reward = 37.23
2022-01-26 14:18:28.360 | DEBUG    | __main__:trials:24 - Trial = 25094/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.361 | DEBUG    | __main__:trials:29 - Trial = 25094/30000 | Total reward = 28.93
2022-01-26 14:18:28.366 | DEBUG    | __main__:trials:24 - Trial = 25095/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.366 | DEBUG    | __main__:trials:29 - Trial = 25095/30000 | Total reward = 39.41
2022-01-26 14:18:28.371 | DEBUG    | __main__:trials:24 - Trial = 25096/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.371 | DEBUG    | __main__:trials:29 - Trial = 25096/30000 | Total reward = 37.23
2022-01-26 14:18:28.375 | DEBUG    | __main__:trials:26 - Trial = 25097/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.376 | DEBUG    | __main__:trials:29 - Trial = 25097/30000 | Total reward = 31.31
2022-01-26 14:18:28.380 | DEBUG    | __main__:trials:24 - Trial = 25098/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.382 | DEBUG    | __main__:trials:29 - Trial = 25098/30000 | Total reward = 38.29
2022-01-26 14:18:28.385 | DEBUG    | __main__:trials:24 - Trial = 25099/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.386 | DEBUG    | __main__:trials:29 - Trial = 25099/30000 | Total reward = 40.92
2022-01-26 14:18:28.390 | DEBUG    | __main__:trials:24 - Trial = 25100/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.391 | DEBUG    | __main__:trials:29 - Trial = 25100/30000 | Total reward = 45.27
2022-01-26 14:18:28.395 | DEBUG    | __main__:trials:24 - Trial = 25101/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.397 | DEBUG    | __main__:trials:29 - Trial = 25101/30000 | Total reward = 36.22
2022-01-26 14:18:28.400 | DEBUG    | __main__:trials:24 - Trial = 25102/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.402 | DEBUG    | __main__:trials:29 - Trial = 25102/30000 | Total reward = 37.83
2022-01-26 14:18:28.405 | DEBUG    | __main__:trials:24 - Trial = 25103/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.407 | DEBUG    | __main__:trials:29 - Trial = 25103/30000 | Total reward = 32.50
2022-01-26 14:18:28.410 | DEBUG    | __main__:trials:24 - Trial = 25104/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.412 | DEBUG    | __main__:trials:29 - Trial = 25104/30000 | Total reward = 36.40
2022-01-26 14:18:28.415 | DEBUG    | __main__:trials:24 - Trial = 25105/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.417 | DEBUG    | __main__:trials:29 - Trial = 25105/30000 | Total reward = 39.65
2022-01-26 14:18:28.420 | DEBUG    | __main__:trials:24 - Trial = 25106/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.421 | DEBUG    | __main__:trials:29 - Trial = 25106/30000 | Total reward = 47.28
2022-01-26 14:18:28.425 | DEBUG    | __main__:trials:24 - Trial = 25107/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.427 | DEBUG    | __main__:trials:29 - Trial = 25107/30000 | Total reward = 38.11
2022-01-26 14:18:28.430 | DEBUG    | __main__:trials:24 - Trial = 25108/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.431 | DEBUG    | __main__:trials:29 - Trial = 25108/30000 | Total reward = 37.77
2022-01-26 14:18:28.435 | DEBUG    | __main__:trials:24 - Trial = 25109/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.437 | DEBUG    | __main__:trials:29 - Trial = 25109/30000 | Total reward = 42.95
2022-01-26 14:18:28.440 | DEBUG    | __main__:trials:24 - Trial = 25110/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.441 | DEBUG    | __main__:trials:29 - Trial = 25110/30000 | Total reward = 34.95
2022-01-26 14:18:28.445 | DEBUG    | __main__:trials:24 - Trial = 25111/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.445 | DEBUG    | __main__:trials:29 - Trial = 25111/30000 | Total reward = 50.37
2022-01-26 14:18:28.449 | DEBUG    | __main__:trials:24 - Trial = 25112/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.450 | DEBUG    | __main__:trials:29 - Trial = 25112/30000 | Total reward = 30.98
2022-01-26 14:18:28.454 | DEBUG    | __main__:trials:24 - Trial = 25113/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.455 | DEBUG    | __main__:trials:29 - Trial = 25113/30000 | Total reward = 31.14
2022-01-26 14:18:28.459 | DEBUG    | __main__:trials:24 - Trial = 25114/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.460 | DEBUG    | __main__:trials:29 - Trial = 25114/30000 | Total reward = 36.15
2022-01-26 14:18:28.464 | DEBUG    | __main__:trials:24 - Trial = 25115/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.465 | DEBUG    | __main__:trials:29 - Trial = 25115/30000 | Total reward = 41.89
2022-01-26 14:18:28.469 | DEBUG    | __main__:trials:24 - Trial = 25116/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.470 | DEBUG    | __main__:trials:29 - Trial = 25116/30000 | Total reward = 38.12
2022-01-26 14:18:28.473 | DEBUG    | __main__:trials:24 - Trial = 25117/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.474 | DEBUG    | __main__:trials:29 - Trial = 25117/30000 | Total reward = 37.86
2022-01-26 14:18:28.479 | DEBUG    | __main__:trials:24 - Trial = 25118/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.481 | DEBUG    | __main__:trials:29 - Trial = 25118/30000 | Total reward = 35.37
2022-01-26 14:18:28.484 | DEBUG    | __main__:trials:24 - Trial = 25119/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.485 | DEBUG    | __main__:trials:29 - Trial = 25119/30000 | Total reward = 39.16
2022-01-26 14:18:28.488 | DEBUG    | __main__:trials:24 - Trial = 25120/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.490 | DEBUG    | __main__:trials:29 - Trial = 25120/30000 | Total reward = 38.31
2022-01-26 14:18:28.493 | DEBUG    | __main__:trials:24 - Trial = 25121/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.493 | DEBUG    | __main__:trials:29 - Trial = 25121/30000 | Total reward = 40.87
2022-01-26 14:18:28.497 | DEBUG    | __main__:trials:24 - Trial = 25122/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.498 | DEBUG    | __main__:trials:29 - Trial = 25122/30000 | Total reward = 11.36
2022-01-26 14:18:28.502 | DEBUG    | __main__:trials:24 - Trial = 25123/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.502 | DEBUG    | __main__:trials:29 - Trial = 25123/30000 | Total reward = 41.52
2022-01-26 14:18:28.507 | DEBUG    | __main__:trials:24 - Trial = 25124/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.508 | DEBUG    | __main__:trials:29 - Trial = 25124/30000 | Total reward = 35.45
2022-01-26 14:18:28.511 | DEBUG    | __main__:trials:24 - Trial = 25125/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.513 | DEBUG    | __main__:trials:29 - Trial = 25125/30000 | Total reward = 35.04
2022-01-26 14:18:28.516 | DEBUG    | __main__:trials:24 - Trial = 25126/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.518 | DEBUG    | __main__:trials:29 - Trial = 25126/30000 | Total reward = 53.61
2022-01-26 14:18:28.522 | DEBUG    | __main__:trials:24 - Trial = 25127/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.522 | DEBUG    | __main__:trials:29 - Trial = 25127/30000 | Total reward = 38.52
2022-01-26 14:18:28.527 | DEBUG    | __main__:trials:24 - Trial = 25128/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.529 | DEBUG    | __main__:trials:29 - Trial = 25128/30000 | Total reward = 33.48
2022-01-26 14:18:28.533 | DEBUG    | __main__:trials:24 - Trial = 25129/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.534 | DEBUG    | __main__:trials:29 - Trial = 25129/30000 | Total reward = 38.85
2022-01-26 14:18:28.538 | DEBUG    | __main__:trials:24 - Trial = 25130/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.539 | DEBUG    | __main__:trials:29 - Trial = 25130/30000 | Total reward = 48.36
2022-01-26 14:18:28.543 | DEBUG    | __main__:trials:24 - Trial = 25131/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.544 | DEBUG    | __main__:trials:29 - Trial = 25131/30000 | Total reward = 42.15
2022-01-26 14:18:28.549 | DEBUG    | __main__:trials:24 - Trial = 25132/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.549 | DEBUG    | __main__:trials:29 - Trial = 25132/30000 | Total reward = 41.99
2022-01-26 14:18:28.554 | DEBUG    | __main__:trials:24 - Trial = 25133/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.554 | DEBUG    | __main__:trials:29 - Trial = 25133/30000 | Total reward = 41.62
2022-01-26 14:18:28.558 | DEBUG    | __main__:trials:24 - Trial = 25134/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.560 | DEBUG    | __main__:trials:29 - Trial = 25134/30000 | Total reward = 29.96
2022-01-26 14:18:28.562 | DEBUG    | __main__:trials:24 - Trial = 25135/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.564 | DEBUG    | __main__:trials:29 - Trial = 25135/30000 | Total reward = 35.36
2022-01-26 14:18:28.568 | DEBUG    | __main__:trials:24 - Trial = 25136/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.569 | DEBUG    | __main__:trials:29 - Trial = 25136/30000 | Total reward = 34.58
2022-01-26 14:18:28.573 | DEBUG    | __main__:trials:24 - Trial = 25137/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.575 | DEBUG    | __main__:trials:29 - Trial = 25137/30000 | Total reward = 39.72
2022-01-26 14:18:28.578 | DEBUG    | __main__:trials:26 - Trial = 25138/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.578 | DEBUG    | __main__:trials:29 - Trial = 25138/30000 | Total reward = 19.91
2022-01-26 14:18:28.582 | DEBUG    | __main__:trials:24 - Trial = 25139/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.584 | DEBUG    | __main__:trials:29 - Trial = 25139/30000 | Total reward = 34.08
2022-01-26 14:18:28.588 | DEBUG    | __main__:trials:24 - Trial = 25140/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.588 | DEBUG    | __main__:trials:29 - Trial = 25140/30000 | Total reward = 34.69
2022-01-26 14:18:28.592 | DEBUG    | __main__:trials:24 - Trial = 25141/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.594 | DEBUG    | __main__:trials:29 - Trial = 25141/30000 | Total reward = 40.74
2022-01-26 14:18:28.597 | DEBUG    | __main__:trials:24 - Trial = 25142/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.599 | DEBUG    | __main__:trials:29 - Trial = 25142/30000 | Total reward = 52.62
2022-01-26 14:18:28.602 | DEBUG    | __main__:trials:24 - Trial = 25143/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.603 | DEBUG    | __main__:trials:29 - Trial = 25143/30000 | Total reward = 51.68
2022-01-26 14:18:28.607 | DEBUG    | __main__:trials:24 - Trial = 25144/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.608 | DEBUG    | __main__:trials:29 - Trial = 25144/30000 | Total reward = 55.79
2022-01-26 14:18:28.612 | DEBUG    | __main__:trials:24 - Trial = 25145/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.614 | DEBUG    | __main__:trials:29 - Trial = 25145/30000 | Total reward = 54.98
2022-01-26 14:18:28.617 | DEBUG    | __main__:trials:24 - Trial = 25146/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.618 | DEBUG    | __main__:trials:29 - Trial = 25146/30000 | Total reward = 37.51
2022-01-26 14:18:28.622 | DEBUG    | __main__:trials:24 - Trial = 25147/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.623 | DEBUG    | __main__:trials:29 - Trial = 25147/30000 | Total reward = 38.34
2022-01-26 14:18:28.627 | DEBUG    | __main__:trials:24 - Trial = 25148/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.629 | DEBUG    | __main__:trials:29 - Trial = 25148/30000 | Total reward = 36.77
2022-01-26 14:18:28.632 | DEBUG    | __main__:trials:24 - Trial = 25149/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.633 | DEBUG    | __main__:trials:29 - Trial = 25149/30000 | Total reward = 35.68
2022-01-26 14:18:28.637 | DEBUG    | __main__:trials:24 - Trial = 25150/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.639 | DEBUG    | __main__:trials:29 - Trial = 25150/30000 | Total reward = 39.42
2022-01-26 14:18:28.642 | DEBUG    | __main__:trials:24 - Trial = 25151/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.643 | DEBUG    | __main__:trials:29 - Trial = 25151/30000 | Total reward = 42.46
2022-01-26 14:18:28.647 | DEBUG    | __main__:trials:24 - Trial = 25152/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.649 | DEBUG    | __main__:trials:29 - Trial = 25152/30000 | Total reward = 41.62
2022-01-26 14:18:28.652 | DEBUG    | __main__:trials:24 - Trial = 25153/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.653 | DEBUG    | __main__:trials:29 - Trial = 25153/30000 | Total reward = 32.93
2022-01-26 14:18:28.658 | DEBUG    | __main__:trials:24 - Trial = 25154/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.658 | DEBUG    | __main__:trials:29 - Trial = 25154/30000 | Total reward = 46.33
2022-01-26 14:18:28.663 | DEBUG    | __main__:trials:24 - Trial = 25155/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.663 | DEBUG    | __main__:trials:29 - Trial = 25155/30000 | Total reward = 33.10
2022-01-26 14:18:28.668 | DEBUG    | __main__:trials:24 - Trial = 25156/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.669 | DEBUG    | __main__:trials:29 - Trial = 25156/30000 | Total reward = 37.74
2022-01-26 14:18:28.672 | DEBUG    | __main__:trials:24 - Trial = 25157/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.673 | DEBUG    | __main__:trials:29 - Trial = 25157/30000 | Total reward = 55.60
2022-01-26 14:18:28.677 | DEBUG    | __main__:trials:24 - Trial = 25158/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.678 | DEBUG    | __main__:trials:29 - Trial = 25158/30000 | Total reward = 51.15
2022-01-26 14:18:28.682 | DEBUG    | __main__:trials:24 - Trial = 25159/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.684 | DEBUG    | __main__:trials:29 - Trial = 25159/30000 | Total reward = 39.85
2022-01-26 14:18:28.688 | DEBUG    | __main__:trials:24 - Trial = 25160/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.689 | DEBUG    | __main__:trials:29 - Trial = 25160/30000 | Total reward = 34.53
2022-01-26 14:18:28.692 | DEBUG    | __main__:trials:24 - Trial = 25161/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.694 | DEBUG    | __main__:trials:29 - Trial = 25161/30000 | Total reward = 48.11
2022-01-26 14:18:28.697 | DEBUG    | __main__:trials:24 - Trial = 25162/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.698 | DEBUG    | __main__:trials:29 - Trial = 25162/30000 | Total reward = 37.58
2022-01-26 14:18:28.702 | DEBUG    | __main__:trials:24 - Trial = 25163/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.703 | DEBUG    | __main__:trials:29 - Trial = 25163/30000 | Total reward = 47.47
2022-01-26 14:18:28.707 | DEBUG    | __main__:trials:24 - Trial = 25164/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.707 | DEBUG    | __main__:trials:29 - Trial = 25164/30000 | Total reward = 33.34
2022-01-26 14:18:28.711 | DEBUG    | __main__:trials:24 - Trial = 25165/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.713 | DEBUG    | __main__:trials:29 - Trial = 25165/30000 | Total reward = 37.32
2022-01-26 14:18:28.716 | DEBUG    | __main__:trials:24 - Trial = 25166/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.718 | DEBUG    | __main__:trials:29 - Trial = 25166/30000 | Total reward = 36.10
2022-01-26 14:18:28.721 | DEBUG    | __main__:trials:24 - Trial = 25167/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.722 | DEBUG    | __main__:trials:29 - Trial = 25167/30000 | Total reward = 34.63
2022-01-26 14:18:28.727 | DEBUG    | __main__:trials:24 - Trial = 25168/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.728 | DEBUG    | __main__:trials:29 - Trial = 25168/30000 | Total reward = 38.70
2022-01-26 14:18:28.731 | DEBUG    | __main__:trials:24 - Trial = 25169/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.733 | DEBUG    | __main__:trials:29 - Trial = 25169/30000 | Total reward = 38.51
2022-01-26 14:18:28.736 | DEBUG    | __main__:trials:24 - Trial = 25170/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.738 | DEBUG    | __main__:trials:29 - Trial = 25170/30000 | Total reward = 35.47
2022-01-26 14:18:28.742 | DEBUG    | __main__:trials:24 - Trial = 25171/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.743 | DEBUG    | __main__:trials:29 - Trial = 25171/30000 | Total reward = 38.35
2022-01-26 14:18:28.747 | DEBUG    | __main__:trials:24 - Trial = 25172/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.748 | DEBUG    | __main__:trials:29 - Trial = 25172/30000 | Total reward = 45.38
2022-01-26 14:18:28.752 | DEBUG    | __main__:trials:24 - Trial = 25173/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.753 | DEBUG    | __main__:trials:29 - Trial = 25173/30000 | Total reward = 39.20
2022-01-26 14:18:28.757 | DEBUG    | __main__:trials:24 - Trial = 25174/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.759 | DEBUG    | __main__:trials:29 - Trial = 25174/30000 | Total reward = 36.52
2022-01-26 14:18:28.762 | DEBUG    | __main__:trials:24 - Trial = 25175/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.764 | DEBUG    | __main__:trials:29 - Trial = 25175/30000 | Total reward = 60.53
2022-01-26 14:18:28.767 | DEBUG    | __main__:trials:24 - Trial = 25176/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.768 | DEBUG    | __main__:trials:29 - Trial = 25176/30000 | Total reward = 46.50
2022-01-26 14:18:28.772 | DEBUG    | __main__:trials:24 - Trial = 25177/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.773 | DEBUG    | __main__:trials:29 - Trial = 25177/30000 | Total reward = 30.75
2022-01-26 14:18:28.777 | DEBUG    | __main__:trials:24 - Trial = 25178/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.778 | DEBUG    | __main__:trials:29 - Trial = 25178/30000 | Total reward = 33.90
2022-01-26 14:18:28.781 | DEBUG    | __main__:trials:24 - Trial = 25179/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.781 | DEBUG    | __main__:trials:29 - Trial = 25179/30000 | Total reward = 33.91
2022-01-26 14:18:28.786 | DEBUG    | __main__:trials:26 - Trial = 25180/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.786 | DEBUG    | __main__:trials:29 - Trial = 25180/30000 | Total reward = 33.90
2022-01-26 14:18:28.791 | DEBUG    | __main__:trials:24 - Trial = 25181/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.792 | DEBUG    | __main__:trials:29 - Trial = 25181/30000 | Total reward = 32.76
2022-01-26 14:18:28.796 | DEBUG    | __main__:trials:24 - Trial = 25182/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.797 | DEBUG    | __main__:trials:29 - Trial = 25182/30000 | Total reward = 40.76
2022-01-26 14:18:28.801 | DEBUG    | __main__:trials:26 - Trial = 25183/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.803 | DEBUG    | __main__:trials:29 - Trial = 25183/30000 | Total reward = 22.29
2022-01-26 14:18:28.807 | DEBUG    | __main__:trials:24 - Trial = 25184/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.808 | DEBUG    | __main__:trials:29 - Trial = 25184/30000 | Total reward = 37.65
2022-01-26 14:18:28.812 | DEBUG    | __main__:trials:24 - Trial = 25185/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.814 | DEBUG    | __main__:trials:29 - Trial = 25185/30000 | Total reward = 27.63
2022-01-26 14:18:28.817 | DEBUG    | __main__:trials:24 - Trial = 25186/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.818 | DEBUG    | __main__:trials:29 - Trial = 25186/30000 | Total reward = 37.96
2022-01-26 14:18:28.821 | DEBUG    | __main__:trials:24 - Trial = 25187/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.822 | DEBUG    | __main__:trials:29 - Trial = 25187/30000 | Total reward = 39.89
2022-01-26 14:18:28.827 | DEBUG    | __main__:trials:24 - Trial = 25188/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.828 | DEBUG    | __main__:trials:29 - Trial = 25188/30000 | Total reward = 37.23
2022-01-26 14:18:28.832 | DEBUG    | __main__:trials:24 - Trial = 25189/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.833 | DEBUG    | __main__:trials:29 - Trial = 25189/30000 | Total reward = 27.20
2022-01-26 14:18:28.837 | DEBUG    | __main__:trials:24 - Trial = 25190/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.837 | DEBUG    | __main__:trials:29 - Trial = 25190/30000 | Total reward = 42.93
2022-01-26 14:18:28.842 | DEBUG    | __main__:trials:24 - Trial = 25191/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.843 | DEBUG    | __main__:trials:29 - Trial = 25191/30000 | Total reward = 36.01
2022-01-26 14:18:28.847 | DEBUG    | __main__:trials:24 - Trial = 25192/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.849 | DEBUG    | __main__:trials:29 - Trial = 25192/30000 | Total reward = 36.91
2022-01-26 14:18:28.852 | DEBUG    | __main__:trials:24 - Trial = 25193/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.853 | DEBUG    | __main__:trials:29 - Trial = 25193/30000 | Total reward = 49.12
2022-01-26 14:18:28.857 | DEBUG    | __main__:trials:24 - Trial = 25194/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.858 | DEBUG    | __main__:trials:29 - Trial = 25194/30000 | Total reward = 39.26
2022-01-26 14:18:28.861 | DEBUG    | __main__:trials:26 - Trial = 25195/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.862 | DEBUG    | __main__:trials:29 - Trial = 25195/30000 | Total reward = 14.09
2022-01-26 14:18:28.865 | DEBUG    | __main__:trials:24 - Trial = 25196/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.867 | DEBUG    | __main__:trials:29 - Trial = 25196/30000 | Total reward = 37.88
2022-01-26 14:18:28.870 | DEBUG    | __main__:trials:24 - Trial = 25197/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.872 | DEBUG    | __main__:trials:29 - Trial = 25197/30000 | Total reward = 48.90
2022-01-26 14:18:28.876 | DEBUG    | __main__:trials:24 - Trial = 25198/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.876 | DEBUG    | __main__:trials:29 - Trial = 25198/30000 | Total reward = 30.77
2022-01-26 14:18:28.881 | DEBUG    | __main__:trials:24 - Trial = 25199/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.882 | DEBUG    | __main__:trials:29 - Trial = 25199/30000 | Total reward = 37.23
2022-01-26 14:18:28.887 | DEBUG    | __main__:trials:24 - Trial = 25200/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.888 | DEBUG    | __main__:trials:29 - Trial = 25200/30000 | Total reward = 37.61
2022-01-26 14:18:28.892 | DEBUG    | __main__:trials:24 - Trial = 25201/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.894 | DEBUG    | __main__:trials:29 - Trial = 25201/30000 | Total reward = 54.64
2022-01-26 14:18:28.897 | DEBUG    | __main__:trials:24 - Trial = 25202/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.898 | DEBUG    | __main__:trials:29 - Trial = 25202/30000 | Total reward = 30.89
2022-01-26 14:18:28.901 | DEBUG    | __main__:trials:24 - Trial = 25203/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.902 | DEBUG    | __main__:trials:29 - Trial = 25203/30000 | Total reward = 34.36
2022-01-26 14:18:28.906 | DEBUG    | __main__:trials:24 - Trial = 25204/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.906 | DEBUG    | __main__:trials:29 - Trial = 25204/30000 | Total reward = 37.85
2022-01-26 14:18:28.911 | DEBUG    | __main__:trials:24 - Trial = 25205/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.912 | DEBUG    | __main__:trials:29 - Trial = 25205/30000 | Total reward = 30.40
2022-01-26 14:18:28.916 | DEBUG    | __main__:trials:24 - Trial = 25206/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.918 | DEBUG    | __main__:trials:29 - Trial = 25206/30000 | Total reward = 45.06
2022-01-26 14:18:28.921 | DEBUG    | __main__:trials:24 - Trial = 25207/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.923 | DEBUG    | __main__:trials:29 - Trial = 25207/30000 | Total reward = 34.24
2022-01-26 14:18:28.927 | DEBUG    | __main__:trials:24 - Trial = 25208/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.927 | DEBUG    | __main__:trials:29 - Trial = 25208/30000 | Total reward = 49.46
2022-01-26 14:18:28.930 | DEBUG    | __main__:trials:26 - Trial = 25209/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.931 | DEBUG    | __main__:trials:29 - Trial = 25209/30000 | Total reward = 12.64
2022-01-26 14:18:28.936 | DEBUG    | __main__:trials:24 - Trial = 25210/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.936 | DEBUG    | __main__:trials:29 - Trial = 25210/30000 | Total reward = 50.27
2022-01-26 14:18:28.941 | DEBUG    | __main__:trials:24 - Trial = 25211/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.941 | DEBUG    | __main__:trials:29 - Trial = 25211/30000 | Total reward = 48.04
2022-01-26 14:18:28.945 | DEBUG    | __main__:trials:24 - Trial = 25212/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.946 | DEBUG    | __main__:trials:29 - Trial = 25212/30000 | Total reward = 37.79
2022-01-26 14:18:28.949 | DEBUG    | __main__:trials:24 - Trial = 25213/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.950 | DEBUG    | __main__:trials:29 - Trial = 25213/30000 | Total reward = 34.91
2022-01-26 14:18:28.953 | DEBUG    | __main__:trials:26 - Trial = 25214/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.955 | DEBUG    | __main__:trials:29 - Trial = 25214/30000 | Total reward = 24.02
2022-01-26 14:18:28.959 | DEBUG    | __main__:trials:24 - Trial = 25215/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.960 | DEBUG    | __main__:trials:29 - Trial = 25215/30000 | Total reward = 37.04
2022-01-26 14:18:28.963 | DEBUG    | __main__:trials:24 - Trial = 25216/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.965 | DEBUG    | __main__:trials:29 - Trial = 25216/30000 | Total reward = 44.59
2022-01-26 14:18:28.968 | DEBUG    | __main__:trials:24 - Trial = 25217/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.970 | DEBUG    | __main__:trials:29 - Trial = 25217/30000 | Total reward = 56.70
2022-01-26 14:18:28.973 | DEBUG    | __main__:trials:24 - Trial = 25218/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.973 | DEBUG    | __main__:trials:29 - Trial = 25218/30000 | Total reward = 40.50
2022-01-26 14:18:28.977 | DEBUG    | __main__:trials:26 - Trial = 25219/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:28.977 | DEBUG    | __main__:trials:29 - Trial = 25219/30000 | Total reward = 22.95
2022-01-26 14:18:28.981 | DEBUG    | __main__:trials:24 - Trial = 25220/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.982 | DEBUG    | __main__:trials:29 - Trial = 25220/30000 | Total reward = 42.08
2022-01-26 14:18:28.987 | DEBUG    | __main__:trials:24 - Trial = 25221/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.988 | DEBUG    | __main__:trials:29 - Trial = 25221/30000 | Total reward = 36.25
2022-01-26 14:18:28.992 | DEBUG    | __main__:trials:24 - Trial = 25222/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.992 | DEBUG    | __main__:trials:29 - Trial = 25222/30000 | Total reward = 34.36
2022-01-26 14:18:28.997 | DEBUG    | __main__:trials:24 - Trial = 25223/30000 | Max number of steps (20) reached
2022-01-26 14:18:28.998 | DEBUG    | __main__:trials:29 - Trial = 25223/30000 | Total reward = 36.88
2022-01-26 14:18:29.001 | DEBUG    | __main__:trials:24 - Trial = 25224/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.003 | DEBUG    | __main__:trials:29 - Trial = 25224/30000 | Total reward = 46.23
2022-01-26 14:18:29.006 | DEBUG    | __main__:trials:24 - Trial = 25225/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.008 | DEBUG    | __main__:trials:29 - Trial = 25225/30000 | Total reward = 35.78
2022-01-26 14:18:29.011 | DEBUG    | __main__:trials:24 - Trial = 25226/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.012 | DEBUG    | __main__:trials:29 - Trial = 25226/30000 | Total reward = 41.03
2022-01-26 14:18:29.016 | DEBUG    | __main__:trials:26 - Trial = 25227/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.018 | DEBUG    | __main__:trials:29 - Trial = 25227/30000 | Total reward = 31.35
2022-01-26 14:18:29.021 | DEBUG    | __main__:trials:24 - Trial = 25228/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.023 | DEBUG    | __main__:trials:29 - Trial = 25228/30000 | Total reward = 34.91
2022-01-26 14:18:29.026 | DEBUG    | __main__:trials:24 - Trial = 25229/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.027 | DEBUG    | __main__:trials:29 - Trial = 25229/30000 | Total reward = 46.61
2022-01-26 14:18:29.029 | DEBUG    | __main__:trials:26 - Trial = 25230/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.030 | DEBUG    | __main__:trials:29 - Trial = 25230/30000 | Total reward = 10.63
2022-01-26 14:18:29.033 | DEBUG    | __main__:trials:24 - Trial = 25231/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.034 | DEBUG    | __main__:trials:29 - Trial = 25231/30000 | Total reward = 35.27
2022-01-26 14:18:29.037 | DEBUG    | __main__:trials:24 - Trial = 25232/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.038 | DEBUG    | __main__:trials:29 - Trial = 25232/30000 | Total reward = 41.44
2022-01-26 14:18:29.041 | DEBUG    | __main__:trials:24 - Trial = 25233/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.042 | DEBUG    | __main__:trials:29 - Trial = 25233/30000 | Total reward = 41.35
2022-01-26 14:18:29.045 | DEBUG    | __main__:trials:24 - Trial = 25234/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.046 | DEBUG    | __main__:trials:29 - Trial = 25234/30000 | Total reward = 35.57
2022-01-26 14:18:29.049 | DEBUG    | __main__:trials:24 - Trial = 25235/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.051 | DEBUG    | __main__:trials:29 - Trial = 25235/30000 | Total reward = 35.87
2022-01-26 14:18:29.055 | DEBUG    | __main__:trials:24 - Trial = 25236/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.056 | DEBUG    | __main__:trials:29 - Trial = 25236/30000 | Total reward = 33.62
2022-01-26 14:18:29.060 | DEBUG    | __main__:trials:24 - Trial = 25237/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.061 | DEBUG    | __main__:trials:29 - Trial = 25237/30000 | Total reward = 45.97
2022-01-26 14:18:29.065 | DEBUG    | __main__:trials:24 - Trial = 25238/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.067 | DEBUG    | __main__:trials:29 - Trial = 25238/30000 | Total reward = 31.76
2022-01-26 14:18:29.071 | DEBUG    | __main__:trials:24 - Trial = 25239/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.072 | DEBUG    | __main__:trials:29 - Trial = 25239/30000 | Total reward = 35.44
2022-01-26 14:18:29.076 | DEBUG    | __main__:trials:24 - Trial = 25240/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.076 | DEBUG    | __main__:trials:29 - Trial = 25240/30000 | Total reward = 47.61
2022-01-26 14:18:29.079 | DEBUG    | __main__:trials:26 - Trial = 25241/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.081 | DEBUG    | __main__:trials:29 - Trial = 25241/30000 | Total reward = 14.41
2022-01-26 14:18:29.084 | DEBUG    | __main__:trials:24 - Trial = 25242/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.086 | DEBUG    | __main__:trials:29 - Trial = 25242/30000 | Total reward = 41.74
2022-01-26 14:18:29.090 | DEBUG    | __main__:trials:24 - Trial = 25243/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.090 | DEBUG    | __main__:trials:29 - Trial = 25243/30000 | Total reward = 43.44
2022-01-26 14:18:29.095 | DEBUG    | __main__:trials:24 - Trial = 25244/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.095 | DEBUG    | __main__:trials:29 - Trial = 25244/30000 | Total reward = 34.32
2022-01-26 14:18:29.100 | DEBUG    | __main__:trials:24 - Trial = 25245/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.101 | DEBUG    | __main__:trials:29 - Trial = 25245/30000 | Total reward = 35.27
2022-01-26 14:18:29.104 | DEBUG    | __main__:trials:24 - Trial = 25246/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.106 | DEBUG    | __main__:trials:29 - Trial = 25246/30000 | Total reward = 32.21
2022-01-26 14:18:29.110 | DEBUG    | __main__:trials:24 - Trial = 25247/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.111 | DEBUG    | __main__:trials:29 - Trial = 25247/30000 | Total reward = 31.83
2022-01-26 14:18:29.114 | DEBUG    | __main__:trials:24 - Trial = 25248/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.115 | DEBUG    | __main__:trials:29 - Trial = 25248/30000 | Total reward = 47.56
2022-01-26 14:18:29.119 | DEBUG    | __main__:trials:24 - Trial = 25249/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.119 | DEBUG    | __main__:trials:29 - Trial = 25249/30000 | Total reward = 45.89
2022-01-26 14:18:29.123 | DEBUG    | __main__:trials:24 - Trial = 25250/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.124 | DEBUG    | __main__:trials:29 - Trial = 25250/30000 | Total reward = 41.49
2022-01-26 14:18:29.128 | DEBUG    | __main__:trials:24 - Trial = 25251/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.129 | DEBUG    | __main__:trials:29 - Trial = 25251/30000 | Total reward = 37.77
2022-01-26 14:18:29.133 | DEBUG    | __main__:trials:24 - Trial = 25252/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.133 | DEBUG    | __main__:trials:29 - Trial = 25252/30000 | Total reward = 41.17
2022-01-26 14:18:29.137 | DEBUG    | __main__:trials:24 - Trial = 25253/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.138 | DEBUG    | __main__:trials:29 - Trial = 25253/30000 | Total reward = 60.99
2022-01-26 14:18:29.142 | DEBUG    | __main__:trials:24 - Trial = 25254/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.143 | DEBUG    | __main__:trials:29 - Trial = 25254/30000 | Total reward = 37.07
2022-01-26 14:18:29.146 | DEBUG    | __main__:trials:26 - Trial = 25255/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.148 | DEBUG    | __main__:trials:29 - Trial = 25255/30000 | Total reward = 28.74
2022-01-26 14:18:29.151 | DEBUG    | __main__:trials:24 - Trial = 25256/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.152 | DEBUG    | __main__:trials:29 - Trial = 25256/30000 | Total reward = 42.33
2022-01-26 14:18:29.157 | DEBUG    | __main__:trials:24 - Trial = 25257/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.158 | DEBUG    | __main__:trials:29 - Trial = 25257/30000 | Total reward = 27.83
2022-01-26 14:18:29.162 | DEBUG    | __main__:trials:24 - Trial = 25258/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.163 | DEBUG    | __main__:trials:29 - Trial = 25258/30000 | Total reward = 42.11
2022-01-26 14:18:29.167 | DEBUG    | __main__:trials:24 - Trial = 25259/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.167 | DEBUG    | __main__:trials:29 - Trial = 25259/30000 | Total reward = 42.08
2022-01-26 14:18:29.172 | DEBUG    | __main__:trials:24 - Trial = 25260/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.173 | DEBUG    | __main__:trials:29 - Trial = 25260/30000 | Total reward = 32.50
2022-01-26 14:18:29.177 | DEBUG    | __main__:trials:24 - Trial = 25261/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.178 | DEBUG    | __main__:trials:29 - Trial = 25261/30000 | Total reward = 50.16
2022-01-26 14:18:29.182 | DEBUG    | __main__:trials:24 - Trial = 25262/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.182 | DEBUG    | __main__:trials:29 - Trial = 25262/30000 | Total reward = 33.78
2022-01-26 14:18:29.187 | DEBUG    | __main__:trials:24 - Trial = 25263/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.188 | DEBUG    | __main__:trials:29 - Trial = 25263/30000 | Total reward = 39.29
2022-01-26 14:18:29.192 | DEBUG    | __main__:trials:24 - Trial = 25264/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.193 | DEBUG    | __main__:trials:29 - Trial = 25264/30000 | Total reward = 33.42
2022-01-26 14:18:29.197 | DEBUG    | __main__:trials:24 - Trial = 25265/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.199 | DEBUG    | __main__:trials:29 - Trial = 25265/30000 | Total reward = 31.91
2022-01-26 14:18:29.203 | DEBUG    | __main__:trials:24 - Trial = 25266/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.203 | DEBUG    | __main__:trials:29 - Trial = 25266/30000 | Total reward = 39.48
2022-01-26 14:18:29.208 | DEBUG    | __main__:trials:24 - Trial = 25267/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.209 | DEBUG    | __main__:trials:29 - Trial = 25267/30000 | Total reward = 39.85
2022-01-26 14:18:29.212 | DEBUG    | __main__:trials:24 - Trial = 25268/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.214 | DEBUG    | __main__:trials:29 - Trial = 25268/30000 | Total reward = 35.07
2022-01-26 14:18:29.217 | DEBUG    | __main__:trials:24 - Trial = 25269/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.219 | DEBUG    | __main__:trials:29 - Trial = 25269/30000 | Total reward = 29.28
2022-01-26 14:18:29.223 | DEBUG    | __main__:trials:24 - Trial = 25270/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.224 | DEBUG    | __main__:trials:29 - Trial = 25270/30000 | Total reward = 48.07
2022-01-26 14:18:29.228 | DEBUG    | __main__:trials:24 - Trial = 25271/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.229 | DEBUG    | __main__:trials:29 - Trial = 25271/30000 | Total reward = 42.93
2022-01-26 14:18:29.233 | DEBUG    | __main__:trials:24 - Trial = 25272/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.234 | DEBUG    | __main__:trials:29 - Trial = 25272/30000 | Total reward = 49.42
2022-01-26 14:18:29.238 | DEBUG    | __main__:trials:24 - Trial = 25273/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.239 | DEBUG    | __main__:trials:29 - Trial = 25273/30000 | Total reward = 40.09
2022-01-26 14:18:29.243 | DEBUG    | __main__:trials:24 - Trial = 25274/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.244 | DEBUG    | __main__:trials:29 - Trial = 25274/30000 | Total reward = 39.80
2022-01-26 14:18:29.247 | DEBUG    | __main__:trials:26 - Trial = 25275/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.248 | DEBUG    | __main__:trials:29 - Trial = 25275/30000 | Total reward = 15.34
2022-01-26 14:18:29.251 | DEBUG    | __main__:trials:24 - Trial = 25276/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.253 | DEBUG    | __main__:trials:29 - Trial = 25276/30000 | Total reward = 38.98
2022-01-26 14:18:29.256 | DEBUG    | __main__:trials:24 - Trial = 25277/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.257 | DEBUG    | __main__:trials:29 - Trial = 25277/30000 | Total reward = 34.72
2022-01-26 14:18:29.262 | DEBUG    | __main__:trials:24 - Trial = 25278/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.263 | DEBUG    | __main__:trials:29 - Trial = 25278/30000 | Total reward = 34.91
2022-01-26 14:18:29.267 | DEBUG    | __main__:trials:24 - Trial = 25279/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.268 | DEBUG    | __main__:trials:29 - Trial = 25279/30000 | Total reward = 30.06
2022-01-26 14:18:29.272 | DEBUG    | __main__:trials:24 - Trial = 25280/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.273 | DEBUG    | __main__:trials:29 - Trial = 25280/30000 | Total reward = 44.78
2022-01-26 14:18:29.276 | DEBUG    | __main__:trials:24 - Trial = 25281/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.278 | DEBUG    | __main__:trials:29 - Trial = 25281/30000 | Total reward = 45.62
2022-01-26 14:18:29.282 | DEBUG    | __main__:trials:24 - Trial = 25282/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.283 | DEBUG    | __main__:trials:29 - Trial = 25282/30000 | Total reward = 36.60
2022-01-26 14:18:29.287 | DEBUG    | __main__:trials:24 - Trial = 25283/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.289 | DEBUG    | __main__:trials:29 - Trial = 25283/30000 | Total reward = 33.23
2022-01-26 14:18:29.292 | DEBUG    | __main__:trials:24 - Trial = 25284/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.294 | DEBUG    | __main__:trials:29 - Trial = 25284/30000 | Total reward = 51.06
2022-01-26 14:18:29.298 | DEBUG    | __main__:trials:24 - Trial = 25285/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.298 | DEBUG    | __main__:trials:29 - Trial = 25285/30000 | Total reward = 37.23
2022-01-26 14:18:29.303 | DEBUG    | __main__:trials:24 - Trial = 25286/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.305 | DEBUG    | __main__:trials:29 - Trial = 25286/30000 | Total reward = 29.89
2022-01-26 14:18:29.308 | DEBUG    | __main__:trials:24 - Trial = 25287/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.309 | DEBUG    | __main__:trials:29 - Trial = 25287/30000 | Total reward = 37.77
2022-01-26 14:18:29.314 | DEBUG    | __main__:trials:24 - Trial = 25288/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.315 | DEBUG    | __main__:trials:29 - Trial = 25288/30000 | Total reward = 36.16
2022-01-26 14:18:29.319 | DEBUG    | __main__:trials:24 - Trial = 25289/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.320 | DEBUG    | __main__:trials:29 - Trial = 25289/30000 | Total reward = 27.65
2022-01-26 14:18:29.324 | DEBUG    | __main__:trials:24 - Trial = 25290/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.326 | DEBUG    | __main__:trials:29 - Trial = 25290/30000 | Total reward = 37.86
2022-01-26 14:18:29.329 | DEBUG    | __main__:trials:26 - Trial = 25291/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.330 | DEBUG    | __main__:trials:29 - Trial = 25291/30000 | Total reward = 17.88
2022-01-26 14:18:29.333 | DEBUG    | __main__:trials:26 - Trial = 25292/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.335 | DEBUG    | __main__:trials:29 - Trial = 25292/30000 | Total reward = 14.48
2022-01-26 14:18:29.338 | DEBUG    | __main__:trials:24 - Trial = 25293/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.340 | DEBUG    | __main__:trials:29 - Trial = 25293/30000 | Total reward = 38.41
2022-01-26 14:18:29.343 | DEBUG    | __main__:trials:24 - Trial = 25294/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.344 | DEBUG    | __main__:trials:29 - Trial = 25294/30000 | Total reward = 41.08
2022-01-26 14:18:29.348 | DEBUG    | __main__:trials:24 - Trial = 25295/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.350 | DEBUG    | __main__:trials:29 - Trial = 25295/30000 | Total reward = 38.44
2022-01-26 14:18:29.353 | DEBUG    | __main__:trials:24 - Trial = 25296/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.354 | DEBUG    | __main__:trials:29 - Trial = 25296/30000 | Total reward = 21.24
2022-01-26 14:18:29.357 | DEBUG    | __main__:trials:26 - Trial = 25297/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.358 | DEBUG    | __main__:trials:29 - Trial = 25297/30000 | Total reward = 6.95
2022-01-26 14:18:29.362 | DEBUG    | __main__:trials:24 - Trial = 25298/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.362 | DEBUG    | __main__:trials:29 - Trial = 25298/30000 | Total reward = 26.98
2022-01-26 14:18:29.367 | DEBUG    | __main__:trials:24 - Trial = 25299/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.367 | DEBUG    | __main__:trials:29 - Trial = 25299/30000 | Total reward = 51.29
2022-01-26 14:18:29.371 | DEBUG    | __main__:trials:24 - Trial = 25300/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.372 | DEBUG    | __main__:trials:29 - Trial = 25300/30000 | Total reward = 42.51
2022-01-26 14:18:29.376 | DEBUG    | __main__:trials:24 - Trial = 25301/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.378 | DEBUG    | __main__:trials:29 - Trial = 25301/30000 | Total reward = 40.00
2022-01-26 14:18:29.382 | DEBUG    | __main__:trials:24 - Trial = 25302/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.382 | DEBUG    | __main__:trials:29 - Trial = 25302/30000 | Total reward = 26.71
2022-01-26 14:18:29.387 | DEBUG    | __main__:trials:24 - Trial = 25303/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.388 | DEBUG    | __main__:trials:29 - Trial = 25303/30000 | Total reward = 30.25
2022-01-26 14:18:29.392 | DEBUG    | __main__:trials:24 - Trial = 25304/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.392 | DEBUG    | __main__:trials:29 - Trial = 25304/30000 | Total reward = 27.84
2022-01-26 14:18:29.395 | DEBUG    | __main__:trials:26 - Trial = 25305/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.396 | DEBUG    | __main__:trials:29 - Trial = 25305/30000 | Total reward = 15.20
2022-01-26 14:18:29.400 | DEBUG    | __main__:trials:26 - Trial = 25306/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.402 | DEBUG    | __main__:trials:29 - Trial = 25306/30000 | Total reward = 17.75
2022-01-26 14:18:29.405 | DEBUG    | __main__:trials:24 - Trial = 25307/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.406 | DEBUG    | __main__:trials:29 - Trial = 25307/30000 | Total reward = 38.61
2022-01-26 14:18:29.410 | DEBUG    | __main__:trials:24 - Trial = 25308/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.412 | DEBUG    | __main__:trials:29 - Trial = 25308/30000 | Total reward = 46.36
2022-01-26 14:18:29.414 | DEBUG    | __main__:trials:26 - Trial = 25309/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.416 | DEBUG    | __main__:trials:29 - Trial = 25309/30000 | Total reward = 29.29
2022-01-26 14:18:29.419 | DEBUG    | __main__:trials:24 - Trial = 25310/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.421 | DEBUG    | __main__:trials:29 - Trial = 25310/30000 | Total reward = 35.72
2022-01-26 14:18:29.424 | DEBUG    | __main__:trials:24 - Trial = 25311/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.426 | DEBUG    | __main__:trials:29 - Trial = 25311/30000 | Total reward = 39.91
2022-01-26 14:18:29.430 | DEBUG    | __main__:trials:24 - Trial = 25312/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.431 | DEBUG    | __main__:trials:29 - Trial = 25312/30000 | Total reward = 37.73
2022-01-26 14:18:29.435 | DEBUG    | __main__:trials:24 - Trial = 25313/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.437 | DEBUG    | __main__:trials:29 - Trial = 25313/30000 | Total reward = 36.41
2022-01-26 14:18:29.439 | DEBUG    | __main__:trials:26 - Trial = 25314/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.441 | DEBUG    | __main__:trials:29 - Trial = 25314/30000 | Total reward = 23.94
2022-01-26 14:18:29.444 | DEBUG    | __main__:trials:24 - Trial = 25315/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.446 | DEBUG    | __main__:trials:29 - Trial = 25315/30000 | Total reward = 13.44
2022-01-26 14:18:29.449 | DEBUG    | __main__:trials:24 - Trial = 25316/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.451 | DEBUG    | __main__:trials:29 - Trial = 25316/30000 | Total reward = 36.56
2022-01-26 14:18:29.455 | DEBUG    | __main__:trials:24 - Trial = 25317/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.457 | DEBUG    | __main__:trials:29 - Trial = 25317/30000 | Total reward = 39.17
2022-01-26 14:18:29.461 | DEBUG    | __main__:trials:24 - Trial = 25318/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.461 | DEBUG    | __main__:trials:29 - Trial = 25318/30000 | Total reward = 46.10
2022-01-26 14:18:29.464 | DEBUG    | __main__:trials:24 - Trial = 25319/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.466 | DEBUG    | __main__:trials:29 - Trial = 25319/30000 | Total reward = 47.08
2022-01-26 14:18:29.469 | DEBUG    | __main__:trials:24 - Trial = 25320/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.470 | DEBUG    | __main__:trials:29 - Trial = 25320/30000 | Total reward = 33.10
2022-01-26 14:18:29.473 | DEBUG    | __main__:trials:24 - Trial = 25321/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.473 | DEBUG    | __main__:trials:29 - Trial = 25321/30000 | Total reward = 35.66
2022-01-26 14:18:29.477 | DEBUG    | __main__:trials:24 - Trial = 25322/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.479 | DEBUG    | __main__:trials:29 - Trial = 25322/30000 | Total reward = 14.89
2022-01-26 14:18:29.483 | DEBUG    | __main__:trials:24 - Trial = 25323/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.484 | DEBUG    | __main__:trials:29 - Trial = 25323/30000 | Total reward = 51.00
2022-01-26 14:18:29.487 | DEBUG    | __main__:trials:24 - Trial = 25324/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.489 | DEBUG    | __main__:trials:29 - Trial = 25324/30000 | Total reward = 36.74
2022-01-26 14:18:29.493 | DEBUG    | __main__:trials:24 - Trial = 25325/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.494 | DEBUG    | __main__:trials:29 - Trial = 25325/30000 | Total reward = 56.14
2022-01-26 14:18:29.497 | DEBUG    | __main__:trials:26 - Trial = 25326/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.498 | DEBUG    | __main__:trials:29 - Trial = 25326/30000 | Total reward = 12.96
2022-01-26 14:18:29.501 | DEBUG    | __main__:trials:26 - Trial = 25327/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.502 | DEBUG    | __main__:trials:29 - Trial = 25327/30000 | Total reward = 11.06
2022-01-26 14:18:29.505 | DEBUG    | __main__:trials:26 - Trial = 25328/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.506 | DEBUG    | __main__:trials:29 - Trial = 25328/30000 | Total reward = 11.06
2022-01-26 14:18:29.509 | DEBUG    | __main__:trials:26 - Trial = 25329/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.510 | DEBUG    | __main__:trials:29 - Trial = 25329/30000 | Total reward = 15.67
2022-01-26 14:18:29.514 | DEBUG    | __main__:trials:24 - Trial = 25330/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.514 | DEBUG    | __main__:trials:29 - Trial = 25330/30000 | Total reward = 40.03
2022-01-26 14:18:29.517 | DEBUG    | __main__:trials:26 - Trial = 25331/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.519 | DEBUG    | __main__:trials:29 - Trial = 25331/30000 | Total reward = 11.06
2022-01-26 14:18:29.523 | DEBUG    | __main__:trials:26 - Trial = 25332/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.524 | DEBUG    | __main__:trials:29 - Trial = 25332/30000 | Total reward = 23.75
2022-01-26 14:18:29.528 | DEBUG    | __main__:trials:24 - Trial = 25333/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.530 | DEBUG    | __main__:trials:29 - Trial = 25333/30000 | Total reward = 32.53
2022-01-26 14:18:29.533 | DEBUG    | __main__:trials:26 - Trial = 25334/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.535 | DEBUG    | __main__:trials:29 - Trial = 25334/30000 | Total reward = 27.65
2022-01-26 14:18:29.538 | DEBUG    | __main__:trials:24 - Trial = 25335/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.540 | DEBUG    | __main__:trials:29 - Trial = 25335/30000 | Total reward = 36.65
2022-01-26 14:18:29.543 | DEBUG    | __main__:trials:24 - Trial = 25336/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.545 | DEBUG    | __main__:trials:29 - Trial = 25336/30000 | Total reward = 49.56
2022-01-26 14:18:29.548 | DEBUG    | __main__:trials:24 - Trial = 25337/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.550 | DEBUG    | __main__:trials:29 - Trial = 25337/30000 | Total reward = 44.59
2022-01-26 14:18:29.554 | DEBUG    | __main__:trials:24 - Trial = 25338/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.555 | DEBUG    | __main__:trials:29 - Trial = 25338/30000 | Total reward = 33.85
2022-01-26 14:18:29.559 | DEBUG    | __main__:trials:24 - Trial = 25339/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.561 | DEBUG    | __main__:trials:29 - Trial = 25339/30000 | Total reward = 36.49
2022-01-26 14:18:29.564 | DEBUG    | __main__:trials:24 - Trial = 25340/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.566 | DEBUG    | __main__:trials:29 - Trial = 25340/30000 | Total reward = 44.48
2022-01-26 14:18:29.570 | DEBUG    | __main__:trials:24 - Trial = 25341/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.571 | DEBUG    | __main__:trials:29 - Trial = 25341/30000 | Total reward = 33.51
2022-01-26 14:18:29.576 | DEBUG    | __main__:trials:24 - Trial = 25342/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.578 | DEBUG    | __main__:trials:29 - Trial = 25342/30000 | Total reward = 33.50
2022-01-26 14:18:29.581 | DEBUG    | __main__:trials:24 - Trial = 25343/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.583 | DEBUG    | __main__:trials:29 - Trial = 25343/30000 | Total reward = 52.39
2022-01-26 14:18:29.586 | DEBUG    | __main__:trials:26 - Trial = 25344/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.588 | DEBUG    | __main__:trials:29 - Trial = 25344/30000 | Total reward = 24.25
2022-01-26 14:18:29.591 | DEBUG    | __main__:trials:26 - Trial = 25345/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.592 | DEBUG    | __main__:trials:29 - Trial = 25345/30000 | Total reward = 17.31
2022-01-26 14:18:29.596 | DEBUG    | __main__:trials:24 - Trial = 25346/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.597 | DEBUG    | __main__:trials:29 - Trial = 25346/30000 | Total reward = 16.49
2022-01-26 14:18:29.601 | DEBUG    | __main__:trials:24 - Trial = 25347/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.603 | DEBUG    | __main__:trials:29 - Trial = 25347/30000 | Total reward = 34.57
2022-01-26 14:18:29.606 | DEBUG    | __main__:trials:24 - Trial = 25348/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.608 | DEBUG    | __main__:trials:29 - Trial = 25348/30000 | Total reward = 41.89
2022-01-26 14:18:29.612 | DEBUG    | __main__:trials:24 - Trial = 25349/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.613 | DEBUG    | __main__:trials:29 - Trial = 25349/30000 | Total reward = 40.34
2022-01-26 14:18:29.616 | DEBUG    | __main__:trials:24 - Trial = 25350/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.618 | DEBUG    | __main__:trials:29 - Trial = 25350/30000 | Total reward = 47.43
2022-01-26 14:18:29.620 | DEBUG    | __main__:trials:26 - Trial = 25351/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.622 | DEBUG    | __main__:trials:29 - Trial = 25351/30000 | Total reward = 12.92
2022-01-26 14:18:29.626 | DEBUG    | __main__:trials:24 - Trial = 25352/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.626 | DEBUG    | __main__:trials:29 - Trial = 25352/30000 | Total reward = 32.57
2022-01-26 14:18:29.630 | DEBUG    | __main__:trials:24 - Trial = 25353/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.632 | DEBUG    | __main__:trials:29 - Trial = 25353/30000 | Total reward = 55.04
2022-01-26 14:18:29.636 | DEBUG    | __main__:trials:24 - Trial = 25354/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.638 | DEBUG    | __main__:trials:29 - Trial = 25354/30000 | Total reward = 15.55
2022-01-26 14:18:29.642 | DEBUG    | __main__:trials:24 - Trial = 25355/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.642 | DEBUG    | __main__:trials:29 - Trial = 25355/30000 | Total reward = 38.09
2022-01-26 14:18:29.645 | DEBUG    | __main__:trials:26 - Trial = 25356/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.646 | DEBUG    | __main__:trials:29 - Trial = 25356/30000 | Total reward = 10.11
2022-01-26 14:18:29.650 | DEBUG    | __main__:trials:24 - Trial = 25357/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.651 | DEBUG    | __main__:trials:29 - Trial = 25357/30000 | Total reward = 43.16
2022-01-26 14:18:29.654 | DEBUG    | __main__:trials:26 - Trial = 25358/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.656 | DEBUG    | __main__:trials:29 - Trial = 25358/30000 | Total reward = 12.78
2022-01-26 14:18:29.659 | DEBUG    | __main__:trials:24 - Trial = 25359/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.661 | DEBUG    | __main__:trials:29 - Trial = 25359/30000 | Total reward = 29.31
2022-01-26 14:18:29.663 | DEBUG    | __main__:trials:26 - Trial = 25360/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.665 | DEBUG    | __main__:trials:29 - Trial = 25360/30000 | Total reward = 11.57
2022-01-26 14:18:29.667 | DEBUG    | __main__:trials:26 - Trial = 25361/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.669 | DEBUG    | __main__:trials:29 - Trial = 25361/30000 | Total reward = 17.64
2022-01-26 14:18:29.672 | DEBUG    | __main__:trials:24 - Trial = 25362/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.674 | DEBUG    | __main__:trials:29 - Trial = 25362/30000 | Total reward = 39.05
2022-01-26 14:18:29.677 | DEBUG    | __main__:trials:26 - Trial = 25363/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.679 | DEBUG    | __main__:trials:29 - Trial = 25363/30000 | Total reward = 23.01
2022-01-26 14:18:29.682 | DEBUG    | __main__:trials:26 - Trial = 25364/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.684 | DEBUG    | __main__:trials:29 - Trial = 25364/30000 | Total reward = 15.64
2022-01-26 14:18:29.687 | DEBUG    | __main__:trials:24 - Trial = 25365/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.689 | DEBUG    | __main__:trials:29 - Trial = 25365/30000 | Total reward = 39.51
2022-01-26 14:18:29.692 | DEBUG    | __main__:trials:24 - Trial = 25366/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.694 | DEBUG    | __main__:trials:29 - Trial = 25366/30000 | Total reward = 33.48
2022-01-26 14:18:29.697 | DEBUG    | __main__:trials:24 - Trial = 25367/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.699 | DEBUG    | __main__:trials:29 - Trial = 25367/30000 | Total reward = 41.59
2022-01-26 14:18:29.703 | DEBUG    | __main__:trials:26 - Trial = 25368/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.704 | DEBUG    | __main__:trials:29 - Trial = 25368/30000 | Total reward = 22.71
2022-01-26 14:18:29.707 | DEBUG    | __main__:trials:26 - Trial = 25369/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.709 | DEBUG    | __main__:trials:29 - Trial = 25369/30000 | Total reward = 17.64
2022-01-26 14:18:29.712 | DEBUG    | __main__:trials:24 - Trial = 25370/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.713 | DEBUG    | __main__:trials:29 - Trial = 25370/30000 | Total reward = 27.20
2022-01-26 14:18:29.717 | DEBUG    | __main__:trials:26 - Trial = 25371/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.719 | DEBUG    | __main__:trials:29 - Trial = 25371/30000 | Total reward = 20.93
2022-01-26 14:18:29.721 | DEBUG    | __main__:trials:26 - Trial = 25372/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.723 | DEBUG    | __main__:trials:29 - Trial = 25372/30000 | Total reward = 14.33
2022-01-26 14:18:29.726 | DEBUG    | __main__:trials:24 - Trial = 25373/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.728 | DEBUG    | __main__:trials:29 - Trial = 25373/30000 | Total reward = 34.57
2022-01-26 14:18:29.731 | DEBUG    | __main__:trials:26 - Trial = 25374/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.733 | DEBUG    | __main__:trials:29 - Trial = 25374/30000 | Total reward = 18.64
2022-01-26 14:18:29.737 | DEBUG    | __main__:trials:24 - Trial = 25375/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.738 | DEBUG    | __main__:trials:29 - Trial = 25375/30000 | Total reward = 39.98
2022-01-26 14:18:29.741 | DEBUG    | __main__:trials:24 - Trial = 25376/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.742 | DEBUG    | __main__:trials:29 - Trial = 25376/30000 | Total reward = 43.69
2022-01-26 14:18:29.745 | DEBUG    | __main__:trials:24 - Trial = 25377/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.747 | DEBUG    | __main__:trials:29 - Trial = 25377/30000 | Total reward = 44.68
2022-01-26 14:18:29.750 | DEBUG    | __main__:trials:24 - Trial = 25378/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.751 | DEBUG    | __main__:trials:29 - Trial = 25378/30000 | Total reward = 49.27
2022-01-26 14:18:29.754 | DEBUG    | __main__:trials:24 - Trial = 25379/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.756 | DEBUG    | __main__:trials:29 - Trial = 25379/30000 | Total reward = 18.27
2022-01-26 14:18:29.760 | DEBUG    | __main__:trials:26 - Trial = 25380/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.761 | DEBUG    | __main__:trials:29 - Trial = 25380/30000 | Total reward = 12.62
2022-01-26 14:18:29.765 | DEBUG    | __main__:trials:26 - Trial = 25381/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.766 | DEBUG    | __main__:trials:29 - Trial = 25381/30000 | Total reward = 24.61
2022-01-26 14:18:29.769 | DEBUG    | __main__:trials:26 - Trial = 25382/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.771 | DEBUG    | __main__:trials:29 - Trial = 25382/30000 | Total reward = 19.31
2022-01-26 14:18:29.775 | DEBUG    | __main__:trials:26 - Trial = 25383/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.776 | DEBUG    | __main__:trials:29 - Trial = 25383/30000 | Total reward = 23.92
2022-01-26 14:18:29.779 | DEBUG    | __main__:trials:26 - Trial = 25384/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.781 | DEBUG    | __main__:trials:29 - Trial = 25384/30000 | Total reward = 17.64
2022-01-26 14:18:29.784 | DEBUG    | __main__:trials:24 - Trial = 25385/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.786 | DEBUG    | __main__:trials:29 - Trial = 25385/30000 | Total reward = 28.65
2022-01-26 14:18:29.789 | DEBUG    | __main__:trials:24 - Trial = 25386/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.790 | DEBUG    | __main__:trials:29 - Trial = 25386/30000 | Total reward = 28.47
2022-01-26 14:18:29.795 | DEBUG    | __main__:trials:24 - Trial = 25387/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.795 | DEBUG    | __main__:trials:29 - Trial = 25387/30000 | Total reward = 24.11
2022-01-26 14:18:29.799 | DEBUG    | __main__:trials:26 - Trial = 25388/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.800 | DEBUG    | __main__:trials:29 - Trial = 25388/30000 | Total reward = 17.64
2022-01-26 14:18:29.804 | DEBUG    | __main__:trials:24 - Trial = 25389/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.806 | DEBUG    | __main__:trials:29 - Trial = 25389/30000 | Total reward = 24.59
2022-01-26 14:18:29.809 | DEBUG    | __main__:trials:24 - Trial = 25390/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.811 | DEBUG    | __main__:trials:29 - Trial = 25390/30000 | Total reward = 28.53
2022-01-26 14:18:29.815 | DEBUG    | __main__:trials:24 - Trial = 25391/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.816 | DEBUG    | __main__:trials:29 - Trial = 25391/30000 | Total reward = 31.36
2022-01-26 14:18:29.820 | DEBUG    | __main__:trials:26 - Trial = 25392/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.821 | DEBUG    | __main__:trials:29 - Trial = 25392/30000 | Total reward = 17.79
2022-01-26 14:18:29.825 | DEBUG    | __main__:trials:24 - Trial = 25393/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.826 | DEBUG    | __main__:trials:29 - Trial = 25393/30000 | Total reward = 26.59
2022-01-26 14:18:29.830 | DEBUG    | __main__:trials:24 - Trial = 25394/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.832 | DEBUG    | __main__:trials:29 - Trial = 25394/30000 | Total reward = 24.27
2022-01-26 14:18:29.834 | DEBUG    | __main__:trials:26 - Trial = 25395/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.836 | DEBUG    | __main__:trials:29 - Trial = 25395/30000 | Total reward = 12.66
2022-01-26 14:18:29.840 | DEBUG    | __main__:trials:24 - Trial = 25396/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.842 | DEBUG    | __main__:trials:29 - Trial = 25396/30000 | Total reward = 31.96
2022-01-26 14:18:29.845 | DEBUG    | __main__:trials:26 - Trial = 25397/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.847 | DEBUG    | __main__:trials:29 - Trial = 25397/30000 | Total reward = 18.79
2022-01-26 14:18:29.851 | DEBUG    | __main__:trials:24 - Trial = 25398/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.852 | DEBUG    | __main__:trials:29 - Trial = 25398/30000 | Total reward = 43.46
2022-01-26 14:18:29.856 | DEBUG    | __main__:trials:24 - Trial = 25399/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.857 | DEBUG    | __main__:trials:29 - Trial = 25399/30000 | Total reward = 36.36
2022-01-26 14:18:29.861 | DEBUG    | __main__:trials:24 - Trial = 25400/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.861 | DEBUG    | __main__:trials:29 - Trial = 25400/30000 | Total reward = 27.10
2022-01-26 14:18:29.865 | DEBUG    | __main__:trials:26 - Trial = 25401/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.866 | DEBUG    | __main__:trials:29 - Trial = 25401/30000 | Total reward = 41.01
2022-01-26 14:18:29.870 | DEBUG    | __main__:trials:24 - Trial = 25402/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.871 | DEBUG    | __main__:trials:29 - Trial = 25402/30000 | Total reward = 36.13
2022-01-26 14:18:29.874 | DEBUG    | __main__:trials:26 - Trial = 25403/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.874 | DEBUG    | __main__:trials:29 - Trial = 25403/30000 | Total reward = 19.71
2022-01-26 14:18:29.877 | DEBUG    | __main__:trials:26 - Trial = 25404/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.879 | DEBUG    | __main__:trials:29 - Trial = 25404/30000 | Total reward = 20.45
2022-01-26 14:18:29.882 | DEBUG    | __main__:trials:24 - Trial = 25405/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.883 | DEBUG    | __main__:trials:29 - Trial = 25405/30000 | Total reward = 31.20
2022-01-26 14:18:29.886 | DEBUG    | __main__:trials:26 - Trial = 25406/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.887 | DEBUG    | __main__:trials:29 - Trial = 25406/30000 | Total reward = 20.12
2022-01-26 14:18:29.890 | DEBUG    | __main__:trials:26 - Trial = 25407/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.890 | DEBUG    | __main__:trials:29 - Trial = 25407/30000 | Total reward = 19.01
2022-01-26 14:18:29.894 | DEBUG    | __main__:trials:24 - Trial = 25408/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.894 | DEBUG    | __main__:trials:29 - Trial = 25408/30000 | Total reward = 33.71
2022-01-26 14:18:29.897 | DEBUG    | __main__:trials:26 - Trial = 25409/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.898 | DEBUG    | __main__:trials:29 - Trial = 25409/30000 | Total reward = 17.64
2022-01-26 14:18:29.901 | DEBUG    | __main__:trials:24 - Trial = 25410/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.902 | DEBUG    | __main__:trials:29 - Trial = 25410/30000 | Total reward = 31.96
2022-01-26 14:18:29.904 | DEBUG    | __main__:trials:26 - Trial = 25411/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.908 | DEBUG    | __main__:trials:29 - Trial = 25411/30000 | Total reward = 17.64
2022-01-26 14:18:29.911 | DEBUG    | __main__:trials:24 - Trial = 25412/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.912 | DEBUG    | __main__:trials:29 - Trial = 25412/30000 | Total reward = 27.85
2022-01-26 14:18:29.917 | DEBUG    | __main__:trials:24 - Trial = 25413/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.919 | DEBUG    | __main__:trials:29 - Trial = 25413/30000 | Total reward = 32.32
2022-01-26 14:18:29.921 | DEBUG    | __main__:trials:26 - Trial = 25414/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.921 | DEBUG    | __main__:trials:29 - Trial = 25414/30000 | Total reward = 14.88
2022-01-26 14:18:29.924 | DEBUG    | __main__:trials:26 - Trial = 25415/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.925 | DEBUG    | __main__:trials:29 - Trial = 25415/30000 | Total reward = 17.64
2022-01-26 14:18:29.928 | DEBUG    | __main__:trials:26 - Trial = 25416/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.929 | DEBUG    | __main__:trials:29 - Trial = 25416/30000 | Total reward = 22.02
2022-01-26 14:18:29.931 | DEBUG    | __main__:trials:26 - Trial = 25417/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.932 | DEBUG    | __main__:trials:29 - Trial = 25417/30000 | Total reward = 10.11
2022-01-26 14:18:29.935 | DEBUG    | __main__:trials:26 - Trial = 25418/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.935 | DEBUG    | __main__:trials:29 - Trial = 25418/30000 | Total reward = 18.03
2022-01-26 14:18:29.938 | DEBUG    | __main__:trials:26 - Trial = 25419/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.940 | DEBUG    | __main__:trials:29 - Trial = 25419/30000 | Total reward = 13.26
2022-01-26 14:18:29.943 | DEBUG    | __main__:trials:24 - Trial = 25420/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.945 | DEBUG    | __main__:trials:29 - Trial = 25420/30000 | Total reward = 24.27
2022-01-26 14:18:29.948 | DEBUG    | __main__:trials:26 - Trial = 25421/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.948 | DEBUG    | __main__:trials:29 - Trial = 25421/30000 | Total reward = 17.64
2022-01-26 14:18:29.952 | DEBUG    | __main__:trials:24 - Trial = 25422/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.953 | DEBUG    | __main__:trials:29 - Trial = 25422/30000 | Total reward = 21.83
2022-01-26 14:18:29.956 | DEBUG    | __main__:trials:24 - Trial = 25423/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.957 | DEBUG    | __main__:trials:29 - Trial = 25423/30000 | Total reward = 25.57
2022-01-26 14:18:29.960 | DEBUG    | __main__:trials:26 - Trial = 25424/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.962 | DEBUG    | __main__:trials:29 - Trial = 25424/30000 | Total reward = 17.02
2022-01-26 14:18:29.965 | DEBUG    | __main__:trials:24 - Trial = 25425/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.966 | DEBUG    | __main__:trials:29 - Trial = 25425/30000 | Total reward = 38.09
2022-01-26 14:18:29.970 | DEBUG    | __main__:trials:26 - Trial = 25426/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.972 | DEBUG    | __main__:trials:29 - Trial = 25426/30000 | Total reward = 25.89
2022-01-26 14:18:29.975 | DEBUG    | __main__:trials:26 - Trial = 25427/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.976 | DEBUG    | __main__:trials:29 - Trial = 25427/30000 | Total reward = 21.15
2022-01-26 14:18:29.980 | DEBUG    | __main__:trials:24 - Trial = 25428/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.981 | DEBUG    | __main__:trials:29 - Trial = 25428/30000 | Total reward = 31.78
2022-01-26 14:18:29.985 | DEBUG    | __main__:trials:26 - Trial = 25429/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.986 | DEBUG    | __main__:trials:29 - Trial = 25429/30000 | Total reward = 14.88
2022-01-26 14:18:29.989 | DEBUG    | __main__:trials:26 - Trial = 25430/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.990 | DEBUG    | __main__:trials:29 - Trial = 25430/30000 | Total reward = 10.11
2022-01-26 14:18:29.993 | DEBUG    | __main__:trials:24 - Trial = 25431/30000 | Max number of steps (20) reached
2022-01-26 14:18:29.995 | DEBUG    | __main__:trials:29 - Trial = 25431/30000 | Total reward = 26.27
2022-01-26 14:18:29.998 | DEBUG    | __main__:trials:26 - Trial = 25432/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:29.999 | DEBUG    | __main__:trials:29 - Trial = 25432/30000 | Total reward = 40.54
2022-01-26 14:18:30.002 | DEBUG    | __main__:trials:24 - Trial = 25433/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.004 | DEBUG    | __main__:trials:29 - Trial = 25433/30000 | Total reward = 43.60
2022-01-26 14:18:30.006 | DEBUG    | __main__:trials:26 - Trial = 25434/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.008 | DEBUG    | __main__:trials:29 - Trial = 25434/30000 | Total reward = 21.59
2022-01-26 14:18:30.011 | DEBUG    | __main__:trials:26 - Trial = 25435/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.013 | DEBUG    | __main__:trials:29 - Trial = 25435/30000 | Total reward = 24.23
2022-01-26 14:18:30.016 | DEBUG    | __main__:trials:24 - Trial = 25436/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.017 | DEBUG    | __main__:trials:29 - Trial = 25436/30000 | Total reward = 30.39
2022-01-26 14:18:30.021 | DEBUG    | __main__:trials:24 - Trial = 25437/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.022 | DEBUG    | __main__:trials:29 - Trial = 25437/30000 | Total reward = 34.59
2022-01-26 14:18:30.026 | DEBUG    | __main__:trials:24 - Trial = 25438/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.028 | DEBUG    | __main__:trials:29 - Trial = 25438/30000 | Total reward = 43.55
2022-01-26 14:18:30.032 | DEBUG    | __main__:trials:24 - Trial = 25439/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.033 | DEBUG    | __main__:trials:29 - Trial = 25439/30000 | Total reward = 29.38
2022-01-26 14:18:30.036 | DEBUG    | __main__:trials:26 - Trial = 25440/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.037 | DEBUG    | __main__:trials:29 - Trial = 25440/30000 | Total reward = 17.91
2022-01-26 14:18:30.040 | DEBUG    | __main__:trials:24 - Trial = 25441/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.042 | DEBUG    | __main__:trials:29 - Trial = 25441/30000 | Total reward = 32.91
2022-01-26 14:18:30.044 | DEBUG    | __main__:trials:26 - Trial = 25442/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.045 | DEBUG    | __main__:trials:29 - Trial = 25442/30000 | Total reward = 17.86
2022-01-26 14:18:30.049 | DEBUG    | __main__:trials:24 - Trial = 25443/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.050 | DEBUG    | __main__:trials:29 - Trial = 25443/30000 | Total reward = 32.16
2022-01-26 14:18:30.054 | DEBUG    | __main__:trials:24 - Trial = 25444/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.055 | DEBUG    | __main__:trials:29 - Trial = 25444/30000 | Total reward = 36.87
2022-01-26 14:18:30.059 | DEBUG    | __main__:trials:24 - Trial = 25445/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.061 | DEBUG    | __main__:trials:29 - Trial = 25445/30000 | Total reward = 45.84
2022-01-26 14:18:30.063 | DEBUG    | __main__:trials:24 - Trial = 25446/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.065 | DEBUG    | __main__:trials:29 - Trial = 25446/30000 | Total reward = 34.18
2022-01-26 14:18:30.068 | DEBUG    | __main__:trials:26 - Trial = 25447/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.070 | DEBUG    | __main__:trials:29 - Trial = 25447/30000 | Total reward = 20.36
2022-01-26 14:18:30.074 | DEBUG    | __main__:trials:24 - Trial = 25448/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.074 | DEBUG    | __main__:trials:29 - Trial = 25448/30000 | Total reward = 28.16
2022-01-26 14:18:30.079 | DEBUG    | __main__:trials:24 - Trial = 25449/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.080 | DEBUG    | __main__:trials:29 - Trial = 25449/30000 | Total reward = 29.99
2022-01-26 14:18:30.083 | DEBUG    | __main__:trials:24 - Trial = 25450/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.085 | DEBUG    | __main__:trials:29 - Trial = 25450/30000 | Total reward = 43.45
2022-01-26 14:18:30.087 | DEBUG    | __main__:trials:26 - Trial = 25451/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.089 | DEBUG    | __main__:trials:29 - Trial = 25451/30000 | Total reward = 16.86
2022-01-26 14:18:30.092 | DEBUG    | __main__:trials:24 - Trial = 25452/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.093 | DEBUG    | __main__:trials:29 - Trial = 25452/30000 | Total reward = 28.46
2022-01-26 14:18:30.096 | DEBUG    | __main__:trials:24 - Trial = 25453/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.098 | DEBUG    | __main__:trials:29 - Trial = 25453/30000 | Total reward = 23.15
2022-01-26 14:18:30.102 | DEBUG    | __main__:trials:24 - Trial = 25454/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.102 | DEBUG    | __main__:trials:29 - Trial = 25454/30000 | Total reward = 32.54
2022-01-26 14:18:30.107 | DEBUG    | __main__:trials:24 - Trial = 25455/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.107 | DEBUG    | __main__:trials:29 - Trial = 25455/30000 | Total reward = 35.55
2022-01-26 14:18:30.112 | DEBUG    | __main__:trials:24 - Trial = 25456/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.114 | DEBUG    | __main__:trials:29 - Trial = 25456/30000 | Total reward = 38.24
2022-01-26 14:18:30.117 | DEBUG    | __main__:trials:24 - Trial = 25457/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.119 | DEBUG    | __main__:trials:29 - Trial = 25457/30000 | Total reward = 44.03
2022-01-26 14:18:30.122 | DEBUG    | __main__:trials:26 - Trial = 25458/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.123 | DEBUG    | __main__:trials:29 - Trial = 25458/30000 | Total reward = 18.76
2022-01-26 14:18:30.126 | DEBUG    | __main__:trials:24 - Trial = 25459/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.128 | DEBUG    | __main__:trials:29 - Trial = 25459/30000 | Total reward = 33.33
2022-01-26 14:18:30.131 | DEBUG    | __main__:trials:24 - Trial = 25460/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.133 | DEBUG    | __main__:trials:29 - Trial = 25460/30000 | Total reward = 33.07
2022-01-26 14:18:30.136 | DEBUG    | __main__:trials:24 - Trial = 25461/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.137 | DEBUG    | __main__:trials:29 - Trial = 25461/30000 | Total reward = 32.49
2022-01-26 14:18:30.141 | DEBUG    | __main__:trials:24 - Trial = 25462/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.142 | DEBUG    | __main__:trials:29 - Trial = 25462/30000 | Total reward = 35.67
2022-01-26 14:18:30.145 | DEBUG    | __main__:trials:24 - Trial = 25463/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.147 | DEBUG    | __main__:trials:29 - Trial = 25463/30000 | Total reward = 33.33
2022-01-26 14:18:30.150 | DEBUG    | __main__:trials:24 - Trial = 25464/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.152 | DEBUG    | __main__:trials:29 - Trial = 25464/30000 | Total reward = 31.10
2022-01-26 14:18:30.155 | DEBUG    | __main__:trials:24 - Trial = 25465/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.156 | DEBUG    | __main__:trials:29 - Trial = 25465/30000 | Total reward = 43.11
2022-01-26 14:18:30.158 | DEBUG    | __main__:trials:26 - Trial = 25466/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.160 | DEBUG    | __main__:trials:29 - Trial = 25466/30000 | Total reward = 15.88
2022-01-26 14:18:30.162 | DEBUG    | __main__:trials:26 - Trial = 25467/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.164 | DEBUG    | __main__:trials:29 - Trial = 25467/30000 | Total reward = 13.20
2022-01-26 14:18:30.167 | DEBUG    | __main__:trials:26 - Trial = 25468/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.167 | DEBUG    | __main__:trials:29 - Trial = 25468/30000 | Total reward = 14.42
2022-01-26 14:18:30.172 | DEBUG    | __main__:trials:24 - Trial = 25469/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.173 | DEBUG    | __main__:trials:29 - Trial = 25469/30000 | Total reward = 32.60
2022-01-26 14:18:30.175 | DEBUG    | __main__:trials:26 - Trial = 25470/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.177 | DEBUG    | __main__:trials:29 - Trial = 25470/30000 | Total reward = 17.64
2022-01-26 14:18:30.181 | DEBUG    | __main__:trials:24 - Trial = 25471/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.183 | DEBUG    | __main__:trials:29 - Trial = 25471/30000 | Total reward = 43.36
2022-01-26 14:18:30.186 | DEBUG    | __main__:trials:26 - Trial = 25472/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.187 | DEBUG    | __main__:trials:29 - Trial = 25472/30000 | Total reward = 17.64
2022-01-26 14:18:30.191 | DEBUG    | __main__:trials:26 - Trial = 25473/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.192 | DEBUG    | __main__:trials:29 - Trial = 25473/30000 | Total reward = 19.35
2022-01-26 14:18:30.196 | DEBUG    | __main__:trials:26 - Trial = 25474/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.197 | DEBUG    | __main__:trials:29 - Trial = 25474/30000 | Total reward = 24.51
2022-01-26 14:18:30.201 | DEBUG    | __main__:trials:24 - Trial = 25475/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.202 | DEBUG    | __main__:trials:29 - Trial = 25475/30000 | Total reward = 26.57
2022-01-26 14:18:30.205 | DEBUG    | __main__:trials:26 - Trial = 25476/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.206 | DEBUG    | __main__:trials:29 - Trial = 25476/30000 | Total reward = 17.64
2022-01-26 14:18:30.209 | DEBUG    | __main__:trials:26 - Trial = 25477/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.211 | DEBUG    | __main__:trials:29 - Trial = 25477/30000 | Total reward = 15.71
2022-01-26 14:18:30.214 | DEBUG    | __main__:trials:26 - Trial = 25478/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.216 | DEBUG    | __main__:trials:29 - Trial = 25478/30000 | Total reward = 17.64
2022-01-26 14:18:30.219 | DEBUG    | __main__:trials:26 - Trial = 25479/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.221 | DEBUG    | __main__:trials:29 - Trial = 25479/30000 | Total reward = 22.74
2022-01-26 14:18:30.224 | DEBUG    | __main__:trials:24 - Trial = 25480/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.225 | DEBUG    | __main__:trials:29 - Trial = 25480/30000 | Total reward = 27.19
2022-01-26 14:18:30.230 | DEBUG    | __main__:trials:24 - Trial = 25481/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.230 | DEBUG    | __main__:trials:29 - Trial = 25481/30000 | Total reward = 27.65
2022-01-26 14:18:30.235 | DEBUG    | __main__:trials:24 - Trial = 25482/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.236 | DEBUG    | __main__:trials:29 - Trial = 25482/30000 | Total reward = 39.91
2022-01-26 14:18:30.240 | DEBUG    | __main__:trials:24 - Trial = 25483/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.242 | DEBUG    | __main__:trials:29 - Trial = 25483/30000 | Total reward = 33.28
2022-01-26 14:18:30.245 | DEBUG    | __main__:trials:24 - Trial = 25484/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.247 | DEBUG    | __main__:trials:29 - Trial = 25484/30000 | Total reward = 31.08
2022-01-26 14:18:30.250 | DEBUG    | __main__:trials:24 - Trial = 25485/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.252 | DEBUG    | __main__:trials:29 - Trial = 25485/30000 | Total reward = 33.10
2022-01-26 14:18:30.255 | DEBUG    | __main__:trials:24 - Trial = 25486/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.256 | DEBUG    | __main__:trials:29 - Trial = 25486/30000 | Total reward = 32.46
2022-01-26 14:18:30.260 | DEBUG    | __main__:trials:24 - Trial = 25487/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.262 | DEBUG    | __main__:trials:29 - Trial = 25487/30000 | Total reward = 37.64
2022-01-26 14:18:30.264 | DEBUG    | __main__:trials:26 - Trial = 25488/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.265 | DEBUG    | __main__:trials:29 - Trial = 25488/30000 | Total reward = 16.81
2022-01-26 14:18:30.270 | DEBUG    | __main__:trials:24 - Trial = 25489/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.272 | DEBUG    | __main__:trials:29 - Trial = 25489/30000 | Total reward = 32.64
2022-01-26 14:18:30.275 | DEBUG    | __main__:trials:24 - Trial = 25490/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.277 | DEBUG    | __main__:trials:29 - Trial = 25490/30000 | Total reward = 41.20
2022-01-26 14:18:30.280 | DEBUG    | __main__:trials:24 - Trial = 25491/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.282 | DEBUG    | __main__:trials:29 - Trial = 25491/30000 | Total reward = 43.66
2022-01-26 14:18:30.285 | DEBUG    | __main__:trials:24 - Trial = 25492/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.286 | DEBUG    | __main__:trials:29 - Trial = 25492/30000 | Total reward = 33.60
2022-01-26 14:18:30.290 | DEBUG    | __main__:trials:24 - Trial = 25493/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.291 | DEBUG    | __main__:trials:29 - Trial = 25493/30000 | Total reward = 27.23
2022-01-26 14:18:30.294 | DEBUG    | __main__:trials:26 - Trial = 25494/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.296 | DEBUG    | __main__:trials:29 - Trial = 25494/30000 | Total reward = 14.37
2022-01-26 14:18:30.299 | DEBUG    | __main__:trials:26 - Trial = 25495/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.301 | DEBUG    | __main__:trials:29 - Trial = 25495/30000 | Total reward = 21.03
2022-01-26 14:18:30.303 | DEBUG    | __main__:trials:24 - Trial = 25496/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.305 | DEBUG    | __main__:trials:29 - Trial = 25496/30000 | Total reward = 31.36
2022-01-26 14:18:30.308 | DEBUG    | __main__:trials:24 - Trial = 25497/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.310 | DEBUG    | __main__:trials:29 - Trial = 25497/30000 | Total reward = 36.47
2022-01-26 14:18:30.313 | DEBUG    | __main__:trials:26 - Trial = 25498/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.313 | DEBUG    | __main__:trials:29 - Trial = 25498/30000 | Total reward = 18.38
2022-01-26 14:18:30.317 | DEBUG    | __main__:trials:26 - Trial = 25499/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.318 | DEBUG    | __main__:trials:29 - Trial = 25499/30000 | Total reward = 21.34
2022-01-26 14:18:30.322 | DEBUG    | __main__:trials:26 - Trial = 25500/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.323 | DEBUG    | __main__:trials:29 - Trial = 25500/30000 | Total reward = 14.65
2022-01-26 14:18:30.326 | DEBUG    | __main__:trials:26 - Trial = 25501/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.327 | DEBUG    | __main__:trials:29 - Trial = 25501/30000 | Total reward = 16.64
2022-01-26 14:18:30.331 | DEBUG    | __main__:trials:26 - Trial = 25502/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.333 | DEBUG    | __main__:trials:29 - Trial = 25502/30000 | Total reward = 25.30
2022-01-26 14:18:30.336 | DEBUG    | __main__:trials:26 - Trial = 25503/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.336 | DEBUG    | __main__:trials:29 - Trial = 25503/30000 | Total reward = 21.41
2022-01-26 14:18:30.341 | DEBUG    | __main__:trials:24 - Trial = 25504/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.341 | DEBUG    | __main__:trials:29 - Trial = 25504/30000 | Total reward = 34.68
2022-01-26 14:18:30.344 | DEBUG    | __main__:trials:26 - Trial = 25505/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.345 | DEBUG    | __main__:trials:29 - Trial = 25505/30000 | Total reward = 18.40
2022-01-26 14:18:30.348 | DEBUG    | __main__:trials:26 - Trial = 25506/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.349 | DEBUG    | __main__:trials:29 - Trial = 25506/30000 | Total reward = 14.88
2022-01-26 14:18:30.352 | DEBUG    | __main__:trials:24 - Trial = 25507/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.354 | DEBUG    | __main__:trials:29 - Trial = 25507/30000 | Total reward = 45.03
2022-01-26 14:18:30.358 | DEBUG    | __main__:trials:24 - Trial = 25508/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.358 | DEBUG    | __main__:trials:29 - Trial = 25508/30000 | Total reward = 45.63
2022-01-26 14:18:30.362 | DEBUG    | __main__:trials:26 - Trial = 25509/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.363 | DEBUG    | __main__:trials:29 - Trial = 25509/30000 | Total reward = 16.87
2022-01-26 14:18:30.367 | DEBUG    | __main__:trials:24 - Trial = 25510/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.368 | DEBUG    | __main__:trials:29 - Trial = 25510/30000 | Total reward = 46.56
2022-01-26 14:18:30.371 | DEBUG    | __main__:trials:26 - Trial = 25511/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.372 | DEBUG    | __main__:trials:29 - Trial = 25511/30000 | Total reward = 9.83
2022-01-26 14:18:30.375 | DEBUG    | __main__:trials:24 - Trial = 25512/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.377 | DEBUG    | __main__:trials:29 - Trial = 25512/30000 | Total reward = 31.19
2022-01-26 14:18:30.380 | DEBUG    | __main__:trials:26 - Trial = 25513/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.382 | DEBUG    | __main__:trials:29 - Trial = 25513/30000 | Total reward = 22.23
2022-01-26 14:18:30.385 | DEBUG    | __main__:trials:24 - Trial = 25514/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.387 | DEBUG    | __main__:trials:29 - Trial = 25514/30000 | Total reward = 41.88
2022-01-26 14:18:30.390 | DEBUG    | __main__:trials:24 - Trial = 25515/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.392 | DEBUG    | __main__:trials:29 - Trial = 25515/30000 | Total reward = 36.93
2022-01-26 14:18:30.395 | DEBUG    | __main__:trials:26 - Trial = 25516/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.396 | DEBUG    | __main__:trials:29 - Trial = 25516/30000 | Total reward = 16.31
2022-01-26 14:18:30.400 | DEBUG    | __main__:trials:24 - Trial = 25517/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.402 | DEBUG    | __main__:trials:29 - Trial = 25517/30000 | Total reward = 38.31
2022-01-26 14:18:30.404 | DEBUG    | __main__:trials:26 - Trial = 25518/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.405 | DEBUG    | __main__:trials:29 - Trial = 25518/30000 | Total reward = 16.87
2022-01-26 14:18:30.409 | DEBUG    | __main__:trials:24 - Trial = 25519/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.410 | DEBUG    | __main__:trials:29 - Trial = 25519/30000 | Total reward = 41.73
2022-01-26 14:18:30.413 | DEBUG    | __main__:trials:26 - Trial = 25520/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.415 | DEBUG    | __main__:trials:29 - Trial = 25520/30000 | Total reward = 15.05
2022-01-26 14:18:30.418 | DEBUG    | __main__:trials:24 - Trial = 25521/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.420 | DEBUG    | __main__:trials:29 - Trial = 25521/30000 | Total reward = 41.44
2022-01-26 14:18:30.423 | DEBUG    | __main__:trials:26 - Trial = 25522/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.424 | DEBUG    | __main__:trials:29 - Trial = 25522/30000 | Total reward = 16.87
2022-01-26 14:18:30.428 | DEBUG    | __main__:trials:24 - Trial = 25523/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.429 | DEBUG    | __main__:trials:29 - Trial = 25523/30000 | Total reward = 59.78
2022-01-26 14:18:30.433 | DEBUG    | __main__:trials:24 - Trial = 25524/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.435 | DEBUG    | __main__:trials:29 - Trial = 25524/30000 | Total reward = 31.47
2022-01-26 14:18:30.438 | DEBUG    | __main__:trials:24 - Trial = 25525/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.440 | DEBUG    | __main__:trials:29 - Trial = 25525/30000 | Total reward = 20.07
2022-01-26 14:18:30.444 | DEBUG    | __main__:trials:24 - Trial = 25526/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.445 | DEBUG    | __main__:trials:29 - Trial = 25526/30000 | Total reward = 61.62
2022-01-26 14:18:30.448 | DEBUG    | __main__:trials:26 - Trial = 25527/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.449 | DEBUG    | __main__:trials:29 - Trial = 25527/30000 | Total reward = 16.87
2022-01-26 14:18:30.453 | DEBUG    | __main__:trials:24 - Trial = 25528/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.454 | DEBUG    | __main__:trials:29 - Trial = 25528/30000 | Total reward = 46.63
2022-01-26 14:18:30.458 | DEBUG    | __main__:trials:26 - Trial = 25529/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.459 | DEBUG    | __main__:trials:29 - Trial = 25529/30000 | Total reward = 26.45
2022-01-26 14:18:30.463 | DEBUG    | __main__:trials:24 - Trial = 25530/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.464 | DEBUG    | __main__:trials:29 - Trial = 25530/30000 | Total reward = 29.90
2022-01-26 14:18:30.468 | DEBUG    | __main__:trials:24 - Trial = 25531/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.468 | DEBUG    | __main__:trials:29 - Trial = 25531/30000 | Total reward = 44.46
2022-01-26 14:18:30.472 | DEBUG    | __main__:trials:26 - Trial = 25532/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.473 | DEBUG    | __main__:trials:29 - Trial = 25532/30000 | Total reward = 18.64
2022-01-26 14:18:30.476 | DEBUG    | __main__:trials:26 - Trial = 25533/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.478 | DEBUG    | __main__:trials:29 - Trial = 25533/30000 | Total reward = 16.87
2022-01-26 14:18:30.481 | DEBUG    | __main__:trials:24 - Trial = 25534/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.482 | DEBUG    | __main__:trials:29 - Trial = 25534/30000 | Total reward = 36.41
2022-01-26 14:18:30.485 | DEBUG    | __main__:trials:26 - Trial = 25535/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.486 | DEBUG    | __main__:trials:29 - Trial = 25535/30000 | Total reward = 18.40
2022-01-26 14:18:30.490 | DEBUG    | __main__:trials:26 - Trial = 25536/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.490 | DEBUG    | __main__:trials:29 - Trial = 25536/30000 | Total reward = 11.06
2022-01-26 14:18:30.495 | DEBUG    | __main__:trials:24 - Trial = 25537/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.496 | DEBUG    | __main__:trials:29 - Trial = 25537/30000 | Total reward = 48.99
2022-01-26 14:18:30.500 | DEBUG    | __main__:trials:24 - Trial = 25538/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.501 | DEBUG    | __main__:trials:29 - Trial = 25538/30000 | Total reward = 45.72
2022-01-26 14:18:30.505 | DEBUG    | __main__:trials:24 - Trial = 25539/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.507 | DEBUG    | __main__:trials:29 - Trial = 25539/30000 | Total reward = 45.92
2022-01-26 14:18:30.510 | DEBUG    | __main__:trials:24 - Trial = 25540/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.511 | DEBUG    | __main__:trials:29 - Trial = 25540/30000 | Total reward = 60.69
2022-01-26 14:18:30.514 | DEBUG    | __main__:trials:26 - Trial = 25541/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.515 | DEBUG    | __main__:trials:29 - Trial = 25541/30000 | Total reward = 20.04
2022-01-26 14:18:30.518 | DEBUG    | __main__:trials:24 - Trial = 25542/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.520 | DEBUG    | __main__:trials:29 - Trial = 25542/30000 | Total reward = 34.99
2022-01-26 14:18:30.523 | DEBUG    | __main__:trials:24 - Trial = 25543/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.524 | DEBUG    | __main__:trials:29 - Trial = 25543/30000 | Total reward = 47.96
2022-01-26 14:18:30.528 | DEBUG    | __main__:trials:24 - Trial = 25544/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.530 | DEBUG    | __main__:trials:29 - Trial = 25544/30000 | Total reward = 40.36
2022-01-26 14:18:30.533 | DEBUG    | __main__:trials:24 - Trial = 25545/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.535 | DEBUG    | __main__:trials:29 - Trial = 25545/30000 | Total reward = 36.73
2022-01-26 14:18:30.537 | DEBUG    | __main__:trials:26 - Trial = 25546/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.538 | DEBUG    | __main__:trials:29 - Trial = 25546/30000 | Total reward = 17.40
2022-01-26 14:18:30.541 | DEBUG    | __main__:trials:26 - Trial = 25547/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.542 | DEBUG    | __main__:trials:29 - Trial = 25547/30000 | Total reward = 23.45
2022-01-26 14:18:30.546 | DEBUG    | __main__:trials:26 - Trial = 25548/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.547 | DEBUG    | __main__:trials:29 - Trial = 25548/30000 | Total reward = 29.54
2022-01-26 14:18:30.550 | DEBUG    | __main__:trials:24 - Trial = 25549/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.552 | DEBUG    | __main__:trials:29 - Trial = 25549/30000 | Total reward = 41.97
2022-01-26 14:18:30.555 | DEBUG    | __main__:trials:24 - Trial = 25550/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.557 | DEBUG    | __main__:trials:29 - Trial = 25550/30000 | Total reward = 30.49
2022-01-26 14:18:30.560 | DEBUG    | __main__:trials:24 - Trial = 25551/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.562 | DEBUG    | __main__:trials:29 - Trial = 25551/30000 | Total reward = 40.59
2022-01-26 14:18:30.566 | DEBUG    | __main__:trials:24 - Trial = 25552/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.567 | DEBUG    | __main__:trials:29 - Trial = 25552/30000 | Total reward = 45.67
2022-01-26 14:18:30.571 | DEBUG    | __main__:trials:24 - Trial = 25553/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.572 | DEBUG    | __main__:trials:29 - Trial = 25553/30000 | Total reward = 37.07
2022-01-26 14:18:30.574 | DEBUG    | __main__:trials:26 - Trial = 25554/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.576 | DEBUG    | __main__:trials:29 - Trial = 25554/30000 | Total reward = 19.33
2022-01-26 14:18:30.579 | DEBUG    | __main__:trials:26 - Trial = 25555/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.581 | DEBUG    | __main__:trials:29 - Trial = 25555/30000 | Total reward = 16.87
2022-01-26 14:18:30.584 | DEBUG    | __main__:trials:24 - Trial = 25556/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.586 | DEBUG    | __main__:trials:29 - Trial = 25556/30000 | Total reward = 33.68
2022-01-26 14:18:30.589 | DEBUG    | __main__:trials:24 - Trial = 25557/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.590 | DEBUG    | __main__:trials:29 - Trial = 25557/30000 | Total reward = 40.23
2022-01-26 14:18:30.594 | DEBUG    | __main__:trials:26 - Trial = 25558/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.595 | DEBUG    | __main__:trials:29 - Trial = 25558/30000 | Total reward = 13.06
2022-01-26 14:18:30.599 | DEBUG    | __main__:trials:24 - Trial = 25559/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.599 | DEBUG    | __main__:trials:29 - Trial = 25559/30000 | Total reward = 56.82
2022-01-26 14:18:30.604 | DEBUG    | __main__:trials:26 - Trial = 25560/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.604 | DEBUG    | __main__:trials:29 - Trial = 25560/30000 | Total reward = 23.54
2022-01-26 14:18:30.608 | DEBUG    | __main__:trials:24 - Trial = 25561/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.610 | DEBUG    | __main__:trials:29 - Trial = 25561/30000 | Total reward = 38.83
2022-01-26 14:18:30.612 | DEBUG    | __main__:trials:24 - Trial = 25562/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.614 | DEBUG    | __main__:trials:29 - Trial = 25562/30000 | Total reward = 30.09
2022-01-26 14:18:30.617 | DEBUG    | __main__:trials:26 - Trial = 25563/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.618 | DEBUG    | __main__:trials:29 - Trial = 25563/30000 | Total reward = 14.65
2022-01-26 14:18:30.621 | DEBUG    | __main__:trials:26 - Trial = 25564/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.622 | DEBUG    | __main__:trials:29 - Trial = 25564/30000 | Total reward = 17.64
2022-01-26 14:18:30.625 | DEBUG    | __main__:trials:24 - Trial = 25565/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.627 | DEBUG    | __main__:trials:29 - Trial = 25565/30000 | Total reward = 52.62
2022-01-26 14:18:30.630 | DEBUG    | __main__:trials:26 - Trial = 25566/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.631 | DEBUG    | __main__:trials:29 - Trial = 25566/30000 | Total reward = 8.87
2022-01-26 14:18:30.633 | DEBUG    | __main__:trials:26 - Trial = 25567/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.634 | DEBUG    | __main__:trials:29 - Trial = 25567/30000 | Total reward = 17.37
2022-01-26 14:18:30.636 | DEBUG    | __main__:trials:26 - Trial = 25568/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.638 | DEBUG    | __main__:trials:29 - Trial = 25568/30000 | Total reward = 14.88
2022-01-26 14:18:30.642 | DEBUG    | __main__:trials:24 - Trial = 25569/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.642 | DEBUG    | __main__:trials:29 - Trial = 25569/30000 | Total reward = 38.25
2022-01-26 14:18:30.646 | DEBUG    | __main__:trials:24 - Trial = 25570/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.647 | DEBUG    | __main__:trials:29 - Trial = 25570/30000 | Total reward = 44.91
2022-01-26 14:18:30.650 | DEBUG    | __main__:trials:24 - Trial = 25571/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.652 | DEBUG    | __main__:trials:29 - Trial = 25571/30000 | Total reward = 36.15
2022-01-26 14:18:30.655 | DEBUG    | __main__:trials:24 - Trial = 25572/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.657 | DEBUG    | __main__:trials:29 - Trial = 25572/30000 | Total reward = 35.89
2022-01-26 14:18:30.659 | DEBUG    | __main__:trials:24 - Trial = 25573/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.661 | DEBUG    | __main__:trials:29 - Trial = 25573/30000 | Total reward = 43.98
2022-01-26 14:18:30.664 | DEBUG    | __main__:trials:26 - Trial = 25574/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.665 | DEBUG    | __main__:trials:29 - Trial = 25574/30000 | Total reward = 16.87
2022-01-26 14:18:30.669 | DEBUG    | __main__:trials:26 - Trial = 25575/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.670 | DEBUG    | __main__:trials:29 - Trial = 25575/30000 | Total reward = 22.38
2022-01-26 14:18:30.673 | DEBUG    | __main__:trials:24 - Trial = 25576/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.675 | DEBUG    | __main__:trials:29 - Trial = 25576/30000 | Total reward = 32.90
2022-01-26 14:18:30.679 | DEBUG    | __main__:trials:24 - Trial = 25577/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.680 | DEBUG    | __main__:trials:29 - Trial = 25577/30000 | Total reward = 36.11
2022-01-26 14:18:30.684 | DEBUG    | __main__:trials:24 - Trial = 25578/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.685 | DEBUG    | __main__:trials:29 - Trial = 25578/30000 | Total reward = 62.31
2022-01-26 14:18:30.689 | DEBUG    | __main__:trials:24 - Trial = 25579/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.689 | DEBUG    | __main__:trials:29 - Trial = 25579/30000 | Total reward = 46.04
2022-01-26 14:18:30.693 | DEBUG    | __main__:trials:24 - Trial = 25580/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.694 | DEBUG    | __main__:trials:29 - Trial = 25580/30000 | Total reward = 51.06
2022-01-26 14:18:30.698 | DEBUG    | __main__:trials:24 - Trial = 25581/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.699 | DEBUG    | __main__:trials:29 - Trial = 25581/30000 | Total reward = 51.55
2022-01-26 14:18:30.702 | DEBUG    | __main__:trials:26 - Trial = 25582/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.704 | DEBUG    | __main__:trials:29 - Trial = 25582/30000 | Total reward = 16.67
2022-01-26 14:18:30.707 | DEBUG    | __main__:trials:24 - Trial = 25583/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.709 | DEBUG    | __main__:trials:29 - Trial = 25583/30000 | Total reward = 34.51
2022-01-26 14:18:30.712 | DEBUG    | __main__:trials:24 - Trial = 25584/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.714 | DEBUG    | __main__:trials:29 - Trial = 25584/30000 | Total reward = 46.91
2022-01-26 14:18:30.717 | DEBUG    | __main__:trials:24 - Trial = 25585/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.719 | DEBUG    | __main__:trials:29 - Trial = 25585/30000 | Total reward = 45.73
2022-01-26 14:18:30.723 | DEBUG    | __main__:trials:24 - Trial = 25586/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.724 | DEBUG    | __main__:trials:29 - Trial = 25586/30000 | Total reward = 49.03
2022-01-26 14:18:30.727 | DEBUG    | __main__:trials:24 - Trial = 25587/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.729 | DEBUG    | __main__:trials:29 - Trial = 25587/30000 | Total reward = 30.20
2022-01-26 14:18:30.731 | DEBUG    | __main__:trials:26 - Trial = 25588/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.733 | DEBUG    | __main__:trials:29 - Trial = 25588/30000 | Total reward = 16.87
2022-01-26 14:18:30.736 | DEBUG    | __main__:trials:24 - Trial = 25589/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.737 | DEBUG    | __main__:trials:29 - Trial = 25589/30000 | Total reward = 32.39
2022-01-26 14:18:30.740 | DEBUG    | __main__:trials:26 - Trial = 25590/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.741 | DEBUG    | __main__:trials:29 - Trial = 25590/30000 | Total reward = 16.87
2022-01-26 14:18:30.745 | DEBUG    | __main__:trials:26 - Trial = 25591/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.746 | DEBUG    | __main__:trials:29 - Trial = 25591/30000 | Total reward = 16.74
2022-01-26 14:18:30.750 | DEBUG    | __main__:trials:24 - Trial = 25592/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.750 | DEBUG    | __main__:trials:29 - Trial = 25592/30000 | Total reward = 23.67
2022-01-26 14:18:30.755 | DEBUG    | __main__:trials:24 - Trial = 25593/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.756 | DEBUG    | __main__:trials:29 - Trial = 25593/30000 | Total reward = 37.90
2022-01-26 14:18:30.760 | DEBUG    | __main__:trials:24 - Trial = 25594/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.762 | DEBUG    | __main__:trials:29 - Trial = 25594/30000 | Total reward = 28.13
2022-01-26 14:18:30.765 | DEBUG    | __main__:trials:26 - Trial = 25595/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.766 | DEBUG    | __main__:trials:29 - Trial = 25595/30000 | Total reward = 20.26
2022-01-26 14:18:30.770 | DEBUG    | __main__:trials:24 - Trial = 25596/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.772 | DEBUG    | __main__:trials:29 - Trial = 25596/30000 | Total reward = 26.01
2022-01-26 14:18:30.775 | DEBUG    | __main__:trials:26 - Trial = 25597/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.776 | DEBUG    | __main__:trials:29 - Trial = 25597/30000 | Total reward = 17.91
2022-01-26 14:18:30.780 | DEBUG    | __main__:trials:24 - Trial = 25598/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.782 | DEBUG    | __main__:trials:29 - Trial = 25598/30000 | Total reward = 29.50
2022-01-26 14:18:30.784 | DEBUG    | __main__:trials:24 - Trial = 25599/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.786 | DEBUG    | __main__:trials:29 - Trial = 25599/30000 | Total reward = 43.90
2022-01-26 14:18:30.789 | DEBUG    | __main__:trials:26 - Trial = 25600/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.790 | DEBUG    | __main__:trials:29 - Trial = 25600/30000 | Total reward = 14.65
2022-01-26 14:18:30.793 | DEBUG    | __main__:trials:26 - Trial = 25601/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.795 | DEBUG    | __main__:trials:29 - Trial = 25601/30000 | Total reward = 26.08
2022-01-26 14:18:30.798 | DEBUG    | __main__:trials:24 - Trial = 25602/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.799 | DEBUG    | __main__:trials:29 - Trial = 25602/30000 | Total reward = 37.60
2022-01-26 14:18:30.803 | DEBUG    | __main__:trials:24 - Trial = 25603/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.805 | DEBUG    | __main__:trials:29 - Trial = 25603/30000 | Total reward = 36.15
2022-01-26 14:18:30.808 | DEBUG    | __main__:trials:24 - Trial = 25604/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.810 | DEBUG    | __main__:trials:29 - Trial = 25604/30000 | Total reward = 35.33
2022-01-26 14:18:30.813 | DEBUG    | __main__:trials:24 - Trial = 25605/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.815 | DEBUG    | __main__:trials:29 - Trial = 25605/30000 | Total reward = 40.15
2022-01-26 14:18:30.819 | DEBUG    | __main__:trials:24 - Trial = 25606/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.821 | DEBUG    | __main__:trials:29 - Trial = 25606/30000 | Total reward = 38.79
2022-01-26 14:18:30.824 | DEBUG    | __main__:trials:24 - Trial = 25607/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.825 | DEBUG    | __main__:trials:29 - Trial = 25607/30000 | Total reward = 54.77
2022-01-26 14:18:30.828 | DEBUG    | __main__:trials:26 - Trial = 25608/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.829 | DEBUG    | __main__:trials:29 - Trial = 25608/30000 | Total reward = 17.90
2022-01-26 14:18:30.832 | DEBUG    | __main__:trials:26 - Trial = 25609/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.833 | DEBUG    | __main__:trials:29 - Trial = 25609/30000 | Total reward = 20.75
2022-01-26 14:18:30.836 | DEBUG    | __main__:trials:24 - Trial = 25610/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.838 | DEBUG    | __main__:trials:29 - Trial = 25610/30000 | Total reward = 32.53
2022-01-26 14:18:30.841 | DEBUG    | __main__:trials:24 - Trial = 25611/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.842 | DEBUG    | __main__:trials:29 - Trial = 25611/30000 | Total reward = 43.93
2022-01-26 14:18:30.846 | DEBUG    | __main__:trials:24 - Trial = 25612/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.847 | DEBUG    | __main__:trials:29 - Trial = 25612/30000 | Total reward = 51.96
2022-01-26 14:18:30.851 | DEBUG    | __main__:trials:26 - Trial = 25613/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.852 | DEBUG    | __main__:trials:29 - Trial = 25613/30000 | Total reward = 25.00
2022-01-26 14:18:30.855 | DEBUG    | __main__:trials:26 - Trial = 25614/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.857 | DEBUG    | __main__:trials:29 - Trial = 25614/30000 | Total reward = 19.06
2022-01-26 14:18:30.860 | DEBUG    | __main__:trials:26 - Trial = 25615/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.860 | DEBUG    | __main__:trials:29 - Trial = 25615/30000 | Total reward = 17.90
2022-01-26 14:18:30.865 | DEBUG    | __main__:trials:24 - Trial = 25616/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.865 | DEBUG    | __main__:trials:29 - Trial = 25616/30000 | Total reward = 40.73
2022-01-26 14:18:30.869 | DEBUG    | __main__:trials:26 - Trial = 25617/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.870 | DEBUG    | __main__:trials:29 - Trial = 25617/30000 | Total reward = 17.90
2022-01-26 14:18:30.874 | DEBUG    | __main__:trials:26 - Trial = 25618/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.874 | DEBUG    | __main__:trials:29 - Trial = 25618/30000 | Total reward = 20.48
2022-01-26 14:18:30.878 | DEBUG    | __main__:trials:26 - Trial = 25619/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.879 | DEBUG    | __main__:trials:29 - Trial = 25619/30000 | Total reward = 18.90
2022-01-26 14:18:30.881 | DEBUG    | __main__:trials:26 - Trial = 25620/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.882 | DEBUG    | __main__:trials:29 - Trial = 25620/30000 | Total reward = 9.55
2022-01-26 14:18:30.885 | DEBUG    | __main__:trials:24 - Trial = 25621/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.886 | DEBUG    | __main__:trials:29 - Trial = 25621/30000 | Total reward = 41.50
2022-01-26 14:18:30.889 | DEBUG    | __main__:trials:24 - Trial = 25622/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.890 | DEBUG    | __main__:trials:29 - Trial = 25622/30000 | Total reward = 40.59
2022-01-26 14:18:30.893 | DEBUG    | __main__:trials:26 - Trial = 25623/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.893 | DEBUG    | __main__:trials:29 - Trial = 25623/30000 | Total reward = 17.90
2022-01-26 14:18:30.897 | DEBUG    | __main__:trials:26 - Trial = 25624/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.899 | DEBUG    | __main__:trials:29 - Trial = 25624/30000 | Total reward = 23.71
2022-01-26 14:18:30.902 | DEBUG    | __main__:trials:24 - Trial = 25625/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.904 | DEBUG    | __main__:trials:29 - Trial = 25625/30000 | Total reward = 38.79
2022-01-26 14:18:30.908 | DEBUG    | __main__:trials:24 - Trial = 25626/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.909 | DEBUG    | __main__:trials:29 - Trial = 25626/30000 | Total reward = 36.38
2022-01-26 14:18:30.913 | DEBUG    | __main__:trials:24 - Trial = 25627/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.914 | DEBUG    | __main__:trials:29 - Trial = 25627/30000 | Total reward = 46.44
2022-01-26 14:18:30.917 | DEBUG    | __main__:trials:26 - Trial = 25628/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.919 | DEBUG    | __main__:trials:29 - Trial = 25628/30000 | Total reward = 19.49
2022-01-26 14:18:30.922 | DEBUG    | __main__:trials:24 - Trial = 25629/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.923 | DEBUG    | __main__:trials:29 - Trial = 25629/30000 | Total reward = 50.20
2022-01-26 14:18:30.927 | DEBUG    | __main__:trials:26 - Trial = 25630/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.928 | DEBUG    | __main__:trials:29 - Trial = 25630/30000 | Total reward = 21.96
2022-01-26 14:18:30.932 | DEBUG    | __main__:trials:24 - Trial = 25631/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.933 | DEBUG    | __main__:trials:29 - Trial = 25631/30000 | Total reward = 42.44
2022-01-26 14:18:30.937 | DEBUG    | __main__:trials:26 - Trial = 25632/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.938 | DEBUG    | __main__:trials:29 - Trial = 25632/30000 | Total reward = 24.45
2022-01-26 14:18:30.941 | DEBUG    | __main__:trials:26 - Trial = 25633/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.942 | DEBUG    | __main__:trials:29 - Trial = 25633/30000 | Total reward = 20.14
2022-01-26 14:18:30.946 | DEBUG    | __main__:trials:24 - Trial = 25634/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.947 | DEBUG    | __main__:trials:29 - Trial = 25634/30000 | Total reward = 24.07
2022-01-26 14:18:30.951 | DEBUG    | __main__:trials:24 - Trial = 25635/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.953 | DEBUG    | __main__:trials:29 - Trial = 25635/30000 | Total reward = 20.26
2022-01-26 14:18:30.955 | DEBUG    | __main__:trials:26 - Trial = 25636/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.957 | DEBUG    | __main__:trials:29 - Trial = 25636/30000 | Total reward = 19.18
2022-01-26 14:18:30.960 | DEBUG    | __main__:trials:24 - Trial = 25637/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.961 | DEBUG    | __main__:trials:29 - Trial = 25637/30000 | Total reward = 12.91
2022-01-26 14:18:30.965 | DEBUG    | __main__:trials:24 - Trial = 25638/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.966 | DEBUG    | __main__:trials:29 - Trial = 25638/30000 | Total reward = 36.75
2022-01-26 14:18:30.969 | DEBUG    | __main__:trials:26 - Trial = 25639/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.971 | DEBUG    | __main__:trials:29 - Trial = 25639/30000 | Total reward = 19.11
2022-01-26 14:18:30.974 | DEBUG    | __main__:trials:24 - Trial = 25640/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.975 | DEBUG    | __main__:trials:29 - Trial = 25640/30000 | Total reward = 27.57
2022-01-26 14:18:30.979 | DEBUG    | __main__:trials:24 - Trial = 25641/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.981 | DEBUG    | __main__:trials:29 - Trial = 25641/30000 | Total reward = 32.48
2022-01-26 14:18:30.983 | DEBUG    | __main__:trials:26 - Trial = 25642/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.984 | DEBUG    | __main__:trials:29 - Trial = 25642/30000 | Total reward = 22.57
2022-01-26 14:18:30.987 | DEBUG    | __main__:trials:26 - Trial = 25643/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:30.989 | DEBUG    | __main__:trials:29 - Trial = 25643/30000 | Total reward = 21.56
2022-01-26 14:18:30.993 | DEBUG    | __main__:trials:24 - Trial = 25644/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.994 | DEBUG    | __main__:trials:29 - Trial = 25644/30000 | Total reward = 30.92
2022-01-26 14:18:30.998 | DEBUG    | __main__:trials:24 - Trial = 25645/30000 | Max number of steps (20) reached
2022-01-26 14:18:30.999 | DEBUG    | __main__:trials:29 - Trial = 25645/30000 | Total reward = 52.84
2022-01-26 14:18:31.003 | DEBUG    | __main__:trials:26 - Trial = 25646/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.004 | DEBUG    | __main__:trials:29 - Trial = 25646/30000 | Total reward = 17.90
2022-01-26 14:18:31.007 | DEBUG    | __main__:trials:24 - Trial = 25647/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.009 | DEBUG    | __main__:trials:29 - Trial = 25647/30000 | Total reward = 39.39
2022-01-26 14:18:31.012 | DEBUG    | __main__:trials:26 - Trial = 25648/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.014 | DEBUG    | __main__:trials:29 - Trial = 25648/30000 | Total reward = 27.93
2022-01-26 14:18:31.016 | DEBUG    | __main__:trials:26 - Trial = 25649/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.018 | DEBUG    | __main__:trials:29 - Trial = 25649/30000 | Total reward = 17.90
2022-01-26 14:18:31.020 | DEBUG    | __main__:trials:26 - Trial = 25650/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.021 | DEBUG    | __main__:trials:29 - Trial = 25650/30000 | Total reward = 22.76
2022-01-26 14:18:31.024 | DEBUG    | __main__:trials:24 - Trial = 25651/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.026 | DEBUG    | __main__:trials:29 - Trial = 25651/30000 | Total reward = 35.63
2022-01-26 14:18:31.029 | DEBUG    | __main__:trials:24 - Trial = 25652/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.031 | DEBUG    | __main__:trials:29 - Trial = 25652/30000 | Total reward = 35.37
2022-01-26 14:18:31.035 | DEBUG    | __main__:trials:24 - Trial = 25653/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.035 | DEBUG    | __main__:trials:29 - Trial = 25653/30000 | Total reward = 35.21
2022-01-26 14:18:31.039 | DEBUG    | __main__:trials:24 - Trial = 25654/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.041 | DEBUG    | __main__:trials:29 - Trial = 25654/30000 | Total reward = 41.67
2022-01-26 14:18:31.044 | DEBUG    | __main__:trials:24 - Trial = 25655/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.045 | DEBUG    | __main__:trials:29 - Trial = 25655/30000 | Total reward = 32.99
2022-01-26 14:18:31.048 | DEBUG    | __main__:trials:26 - Trial = 25656/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.050 | DEBUG    | __main__:trials:29 - Trial = 25656/30000 | Total reward = 17.90
2022-01-26 14:18:31.053 | DEBUG    | __main__:trials:26 - Trial = 25657/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.054 | DEBUG    | __main__:trials:29 - Trial = 25657/30000 | Total reward = 21.74
2022-01-26 14:18:31.058 | DEBUG    | __main__:trials:24 - Trial = 25658/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.060 | DEBUG    | __main__:trials:29 - Trial = 25658/30000 | Total reward = 34.08
2022-01-26 14:18:31.063 | DEBUG    | __main__:trials:26 - Trial = 25659/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.064 | DEBUG    | __main__:trials:29 - Trial = 25659/30000 | Total reward = 17.90
2022-01-26 14:18:31.068 | DEBUG    | __main__:trials:24 - Trial = 25660/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.069 | DEBUG    | __main__:trials:29 - Trial = 25660/30000 | Total reward = 25.11
2022-01-26 14:18:31.073 | DEBUG    | __main__:trials:24 - Trial = 25661/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.074 | DEBUG    | __main__:trials:29 - Trial = 25661/30000 | Total reward = 34.47
2022-01-26 14:18:31.078 | DEBUG    | __main__:trials:24 - Trial = 25662/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.079 | DEBUG    | __main__:trials:29 - Trial = 25662/30000 | Total reward = 38.86
2022-01-26 14:18:31.083 | DEBUG    | __main__:trials:24 - Trial = 25663/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.085 | DEBUG    | __main__:trials:29 - Trial = 25663/30000 | Total reward = 21.50
2022-01-26 14:18:31.087 | DEBUG    | __main__:trials:24 - Trial = 25664/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.089 | DEBUG    | __main__:trials:29 - Trial = 25664/30000 | Total reward = 28.60
2022-01-26 14:18:31.092 | DEBUG    | __main__:trials:26 - Trial = 25665/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.094 | DEBUG    | __main__:trials:29 - Trial = 25665/30000 | Total reward = 23.09
2022-01-26 14:18:31.097 | DEBUG    | __main__:trials:26 - Trial = 25666/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.099 | DEBUG    | __main__:trials:29 - Trial = 25666/30000 | Total reward = 16.15
2022-01-26 14:18:31.102 | DEBUG    | __main__:trials:24 - Trial = 25667/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.103 | DEBUG    | __main__:trials:29 - Trial = 25667/30000 | Total reward = 36.68
2022-01-26 14:18:31.106 | DEBUG    | __main__:trials:26 - Trial = 25668/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.108 | DEBUG    | __main__:trials:29 - Trial = 25668/30000 | Total reward = 14.84
2022-01-26 14:18:31.111 | DEBUG    | __main__:trials:24 - Trial = 25669/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.113 | DEBUG    | __main__:trials:29 - Trial = 25669/30000 | Total reward = 33.84
2022-01-26 14:18:31.116 | DEBUG    | __main__:trials:24 - Trial = 25670/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.117 | DEBUG    | __main__:trials:29 - Trial = 25670/30000 | Total reward = 33.84
2022-01-26 14:18:31.120 | DEBUG    | __main__:trials:26 - Trial = 25671/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.122 | DEBUG    | __main__:trials:29 - Trial = 25671/30000 | Total reward = 20.87
2022-01-26 14:18:31.125 | DEBUG    | __main__:trials:24 - Trial = 25672/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.126 | DEBUG    | __main__:trials:29 - Trial = 25672/30000 | Total reward = 34.72
2022-01-26 14:18:31.129 | DEBUG    | __main__:trials:26 - Trial = 25673/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.130 | DEBUG    | __main__:trials:29 - Trial = 25673/30000 | Total reward = 16.82
2022-01-26 14:18:31.133 | DEBUG    | __main__:trials:26 - Trial = 25674/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.133 | DEBUG    | __main__:trials:29 - Trial = 25674/30000 | Total reward = 13.94
2022-01-26 14:18:31.137 | DEBUG    | __main__:trials:24 - Trial = 25675/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.138 | DEBUG    | __main__:trials:29 - Trial = 25675/30000 | Total reward = 39.25
2022-01-26 14:18:31.142 | DEBUG    | __main__:trials:24 - Trial = 25676/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.142 | DEBUG    | __main__:trials:29 - Trial = 25676/30000 | Total reward = 28.67
2022-01-26 14:18:31.147 | DEBUG    | __main__:trials:24 - Trial = 25677/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.147 | DEBUG    | __main__:trials:29 - Trial = 25677/30000 | Total reward = 39.62
2022-01-26 14:18:31.152 | DEBUG    | __main__:trials:24 - Trial = 25678/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.153 | DEBUG    | __main__:trials:29 - Trial = 25678/30000 | Total reward = 39.11
2022-01-26 14:18:31.156 | DEBUG    | __main__:trials:24 - Trial = 25679/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.158 | DEBUG    | __main__:trials:29 - Trial = 25679/30000 | Total reward = 39.68
2022-01-26 14:18:31.161 | DEBUG    | __main__:trials:26 - Trial = 25680/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.162 | DEBUG    | __main__:trials:29 - Trial = 25680/30000 | Total reward = 25.70
2022-01-26 14:18:31.164 | DEBUG    | __main__:trials:26 - Trial = 25681/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.166 | DEBUG    | __main__:trials:29 - Trial = 25681/30000 | Total reward = 9.55
2022-01-26 14:18:31.170 | DEBUG    | __main__:trials:24 - Trial = 25682/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.170 | DEBUG    | __main__:trials:29 - Trial = 25682/30000 | Total reward = 46.26
2022-01-26 14:18:31.174 | DEBUG    | __main__:trials:24 - Trial = 25683/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.175 | DEBUG    | __main__:trials:29 - Trial = 25683/30000 | Total reward = 37.10
2022-01-26 14:18:31.179 | DEBUG    | __main__:trials:24 - Trial = 25684/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.181 | DEBUG    | __main__:trials:29 - Trial = 25684/30000 | Total reward = 38.46
2022-01-26 14:18:31.184 | DEBUG    | __main__:trials:24 - Trial = 25685/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.185 | DEBUG    | __main__:trials:29 - Trial = 25685/30000 | Total reward = 35.70
2022-01-26 14:18:31.188 | DEBUG    | __main__:trials:24 - Trial = 25686/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.189 | DEBUG    | __main__:trials:29 - Trial = 25686/30000 | Total reward = 42.83
2022-01-26 14:18:31.193 | DEBUG    | __main__:trials:24 - Trial = 25687/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.194 | DEBUG    | __main__:trials:29 - Trial = 25687/30000 | Total reward = 40.84
2022-01-26 14:18:31.198 | DEBUG    | __main__:trials:24 - Trial = 25688/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.200 | DEBUG    | __main__:trials:29 - Trial = 25688/30000 | Total reward = 39.25
2022-01-26 14:18:31.203 | DEBUG    | __main__:trials:24 - Trial = 25689/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.205 | DEBUG    | __main__:trials:29 - Trial = 25689/30000 | Total reward = 38.61
2022-01-26 14:18:31.208 | DEBUG    | __main__:trials:24 - Trial = 25690/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.209 | DEBUG    | __main__:trials:29 - Trial = 25690/30000 | Total reward = 35.80
2022-01-26 14:18:31.213 | DEBUG    | __main__:trials:24 - Trial = 25691/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.214 | DEBUG    | __main__:trials:29 - Trial = 25691/30000 | Total reward = 36.51
2022-01-26 14:18:31.218 | DEBUG    | __main__:trials:24 - Trial = 25692/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.218 | DEBUG    | __main__:trials:29 - Trial = 25692/30000 | Total reward = 35.61
2022-01-26 14:18:31.222 | DEBUG    | __main__:trials:24 - Trial = 25693/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.224 | DEBUG    | __main__:trials:29 - Trial = 25693/30000 | Total reward = 58.90
2022-01-26 14:18:31.228 | DEBUG    | __main__:trials:24 - Trial = 25694/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.229 | DEBUG    | __main__:trials:29 - Trial = 25694/30000 | Total reward = 29.44
2022-01-26 14:18:31.233 | DEBUG    | __main__:trials:24 - Trial = 25695/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.234 | DEBUG    | __main__:trials:29 - Trial = 25695/30000 | Total reward = 37.51
2022-01-26 14:18:31.237 | DEBUG    | __main__:trials:24 - Trial = 25696/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.238 | DEBUG    | __main__:trials:29 - Trial = 25696/30000 | Total reward = 22.22
2022-01-26 14:18:31.241 | DEBUG    | __main__:trials:24 - Trial = 25697/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.242 | DEBUG    | __main__:trials:29 - Trial = 25697/30000 | Total reward = 41.86
2022-01-26 14:18:31.245 | DEBUG    | __main__:trials:24 - Trial = 25698/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.246 | DEBUG    | __main__:trials:29 - Trial = 25698/30000 | Total reward = 32.93
2022-01-26 14:18:31.249 | DEBUG    | __main__:trials:26 - Trial = 25699/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.249 | DEBUG    | __main__:trials:29 - Trial = 25699/30000 | Total reward = 21.08
2022-01-26 14:18:31.253 | DEBUG    | __main__:trials:24 - Trial = 25700/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.253 | DEBUG    | __main__:trials:29 - Trial = 25700/30000 | Total reward = 47.23
2022-01-26 14:18:31.257 | DEBUG    | __main__:trials:24 - Trial = 25701/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.258 | DEBUG    | __main__:trials:29 - Trial = 25701/30000 | Total reward = 36.12
2022-01-26 14:18:31.261 | DEBUG    | __main__:trials:24 - Trial = 25702/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.262 | DEBUG    | __main__:trials:29 - Trial = 25702/30000 | Total reward = 44.04
2022-01-26 14:18:31.265 | DEBUG    | __main__:trials:24 - Trial = 25703/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.266 | DEBUG    | __main__:trials:29 - Trial = 25703/30000 | Total reward = 37.08
2022-01-26 14:18:31.270 | DEBUG    | __main__:trials:24 - Trial = 25704/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.271 | DEBUG    | __main__:trials:29 - Trial = 25704/30000 | Total reward = 42.37
2022-01-26 14:18:31.275 | DEBUG    | __main__:trials:24 - Trial = 25705/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.277 | DEBUG    | __main__:trials:29 - Trial = 25705/30000 | Total reward = 39.90
2022-01-26 14:18:31.280 | DEBUG    | __main__:trials:24 - Trial = 25706/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.282 | DEBUG    | __main__:trials:29 - Trial = 25706/30000 | Total reward = 44.30
2022-01-26 14:18:31.286 | DEBUG    | __main__:trials:24 - Trial = 25707/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.286 | DEBUG    | __main__:trials:29 - Trial = 25707/30000 | Total reward = 45.21
2022-01-26 14:18:31.291 | DEBUG    | __main__:trials:24 - Trial = 25708/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.291 | DEBUG    | __main__:trials:29 - Trial = 25708/30000 | Total reward = 42.43
2022-01-26 14:18:31.296 | DEBUG    | __main__:trials:24 - Trial = 25709/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.296 | DEBUG    | __main__:trials:29 - Trial = 25709/30000 | Total reward = 42.36
2022-01-26 14:18:31.301 | DEBUG    | __main__:trials:24 - Trial = 25710/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.302 | DEBUG    | __main__:trials:29 - Trial = 25710/30000 | Total reward = 43.52
2022-01-26 14:18:31.306 | DEBUG    | __main__:trials:24 - Trial = 25711/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.307 | DEBUG    | __main__:trials:29 - Trial = 25711/30000 | Total reward = 42.42
2022-01-26 14:18:31.311 | DEBUG    | __main__:trials:24 - Trial = 25712/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.312 | DEBUG    | __main__:trials:29 - Trial = 25712/30000 | Total reward = 41.77
2022-01-26 14:18:31.316 | DEBUG    | __main__:trials:24 - Trial = 25713/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.317 | DEBUG    | __main__:trials:29 - Trial = 25713/30000 | Total reward = 46.04
2022-01-26 14:18:31.321 | DEBUG    | __main__:trials:24 - Trial = 25714/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.322 | DEBUG    | __main__:trials:29 - Trial = 25714/30000 | Total reward = 37.17
2022-01-26 14:18:31.326 | DEBUG    | __main__:trials:24 - Trial = 25715/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.326 | DEBUG    | __main__:trials:29 - Trial = 25715/30000 | Total reward = 36.03
2022-01-26 14:18:31.331 | DEBUG    | __main__:trials:24 - Trial = 25716/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.331 | DEBUG    | __main__:trials:29 - Trial = 25716/30000 | Total reward = 43.06
2022-01-26 14:18:31.335 | DEBUG    | __main__:trials:24 - Trial = 25717/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.337 | DEBUG    | __main__:trials:29 - Trial = 25717/30000 | Total reward = 36.11
2022-01-26 14:18:31.341 | DEBUG    | __main__:trials:24 - Trial = 25718/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.341 | DEBUG    | __main__:trials:29 - Trial = 25718/30000 | Total reward = 43.06
2022-01-26 14:18:31.345 | DEBUG    | __main__:trials:24 - Trial = 25719/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.346 | DEBUG    | __main__:trials:29 - Trial = 25719/30000 | Total reward = 54.68
2022-01-26 14:18:31.350 | DEBUG    | __main__:trials:24 - Trial = 25720/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.351 | DEBUG    | __main__:trials:29 - Trial = 25720/30000 | Total reward = 27.70
2022-01-26 14:18:31.355 | DEBUG    | __main__:trials:24 - Trial = 25721/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.357 | DEBUG    | __main__:trials:29 - Trial = 25721/30000 | Total reward = 49.45
2022-01-26 14:18:31.360 | DEBUG    | __main__:trials:24 - Trial = 25722/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.362 | DEBUG    | __main__:trials:29 - Trial = 25722/30000 | Total reward = 33.02
2022-01-26 14:18:31.365 | DEBUG    | __main__:trials:26 - Trial = 25723/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.367 | DEBUG    | __main__:trials:29 - Trial = 25723/30000 | Total reward = 26.66
2022-01-26 14:18:31.370 | DEBUG    | __main__:trials:24 - Trial = 25724/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.372 | DEBUG    | __main__:trials:29 - Trial = 25724/30000 | Total reward = 41.28
2022-01-26 14:18:31.375 | DEBUG    | __main__:trials:24 - Trial = 25725/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.376 | DEBUG    | __main__:trials:29 - Trial = 25725/30000 | Total reward = 29.98
2022-01-26 14:18:31.380 | DEBUG    | __main__:trials:24 - Trial = 25726/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.381 | DEBUG    | __main__:trials:29 - Trial = 25726/30000 | Total reward = 34.34
2022-01-26 14:18:31.384 | DEBUG    | __main__:trials:24 - Trial = 25727/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.386 | DEBUG    | __main__:trials:29 - Trial = 25727/30000 | Total reward = 43.06
2022-01-26 14:18:31.390 | DEBUG    | __main__:trials:24 - Trial = 25728/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.391 | DEBUG    | __main__:trials:29 - Trial = 25728/30000 | Total reward = 37.20
2022-01-26 14:18:31.394 | DEBUG    | __main__:trials:24 - Trial = 25729/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.396 | DEBUG    | __main__:trials:29 - Trial = 25729/30000 | Total reward = 41.80
2022-01-26 14:18:31.398 | DEBUG    | __main__:trials:26 - Trial = 25730/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.400 | DEBUG    | __main__:trials:29 - Trial = 25730/30000 | Total reward = 15.24
2022-01-26 14:18:31.403 | DEBUG    | __main__:trials:24 - Trial = 25731/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.404 | DEBUG    | __main__:trials:29 - Trial = 25731/30000 | Total reward = 34.27
2022-01-26 14:18:31.408 | DEBUG    | __main__:trials:24 - Trial = 25732/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.409 | DEBUG    | __main__:trials:29 - Trial = 25732/30000 | Total reward = 36.15
2022-01-26 14:18:31.412 | DEBUG    | __main__:trials:26 - Trial = 25733/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.414 | DEBUG    | __main__:trials:29 - Trial = 25733/30000 | Total reward = 20.96
2022-01-26 14:18:31.416 | DEBUG    | __main__:trials:24 - Trial = 25734/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.418 | DEBUG    | __main__:trials:29 - Trial = 25734/30000 | Total reward = 43.53
2022-01-26 14:18:31.421 | DEBUG    | __main__:trials:24 - Trial = 25735/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.422 | DEBUG    | __main__:trials:29 - Trial = 25735/30000 | Total reward = 44.23
2022-01-26 14:18:31.425 | DEBUG    | __main__:trials:26 - Trial = 25736/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.425 | DEBUG    | __main__:trials:29 - Trial = 25736/30000 | Total reward = 19.35
2022-01-26 14:18:31.429 | DEBUG    | __main__:trials:24 - Trial = 25737/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.431 | DEBUG    | __main__:trials:29 - Trial = 25737/30000 | Total reward = 36.56
2022-01-26 14:18:31.434 | DEBUG    | __main__:trials:24 - Trial = 25738/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.436 | DEBUG    | __main__:trials:29 - Trial = 25738/30000 | Total reward = 33.72
2022-01-26 14:18:31.439 | DEBUG    | __main__:trials:24 - Trial = 25739/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.440 | DEBUG    | __main__:trials:29 - Trial = 25739/30000 | Total reward = 26.33
2022-01-26 14:18:31.444 | DEBUG    | __main__:trials:26 - Trial = 25740/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.445 | DEBUG    | __main__:trials:29 - Trial = 25740/30000 | Total reward = 14.74
2022-01-26 14:18:31.448 | DEBUG    | __main__:trials:24 - Trial = 25741/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.450 | DEBUG    | __main__:trials:29 - Trial = 25741/30000 | Total reward = 34.16
2022-01-26 14:18:31.454 | DEBUG    | __main__:trials:24 - Trial = 25742/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.455 | DEBUG    | __main__:trials:29 - Trial = 25742/30000 | Total reward = 40.95
2022-01-26 14:18:31.459 | DEBUG    | __main__:trials:24 - Trial = 25743/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.460 | DEBUG    | __main__:trials:29 - Trial = 25743/30000 | Total reward = 35.94
2022-01-26 14:18:31.463 | DEBUG    | __main__:trials:26 - Trial = 25744/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.465 | DEBUG    | __main__:trials:29 - Trial = 25744/30000 | Total reward = 20.61
2022-01-26 14:18:31.468 | DEBUG    | __main__:trials:24 - Trial = 25745/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.470 | DEBUG    | __main__:trials:29 - Trial = 25745/30000 | Total reward = 47.24
2022-01-26 14:18:31.473 | DEBUG    | __main__:trials:24 - Trial = 25746/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.474 | DEBUG    | __main__:trials:29 - Trial = 25746/30000 | Total reward = 30.85
2022-01-26 14:18:31.478 | DEBUG    | __main__:trials:24 - Trial = 25747/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.479 | DEBUG    | __main__:trials:29 - Trial = 25747/30000 | Total reward = 39.64
2022-01-26 14:18:31.482 | DEBUG    | __main__:trials:24 - Trial = 25748/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.483 | DEBUG    | __main__:trials:29 - Trial = 25748/30000 | Total reward = 46.56
2022-01-26 14:18:31.486 | DEBUG    | __main__:trials:24 - Trial = 25749/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.488 | DEBUG    | __main__:trials:29 - Trial = 25749/30000 | Total reward = 38.39
2022-01-26 14:18:31.492 | DEBUG    | __main__:trials:24 - Trial = 25750/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.493 | DEBUG    | __main__:trials:29 - Trial = 25750/30000 | Total reward = 46.12
2022-01-26 14:18:31.497 | DEBUG    | __main__:trials:24 - Trial = 25751/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.498 | DEBUG    | __main__:trials:29 - Trial = 25751/30000 | Total reward = 44.49
2022-01-26 14:18:31.502 | DEBUG    | __main__:trials:24 - Trial = 25752/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.503 | DEBUG    | __main__:trials:29 - Trial = 25752/30000 | Total reward = 46.56
2022-01-26 14:18:31.507 | DEBUG    | __main__:trials:24 - Trial = 25753/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.507 | DEBUG    | __main__:trials:29 - Trial = 25753/30000 | Total reward = 39.21
2022-01-26 14:18:31.512 | DEBUG    | __main__:trials:24 - Trial = 25754/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.512 | DEBUG    | __main__:trials:29 - Trial = 25754/30000 | Total reward = 41.03
2022-01-26 14:18:31.517 | DEBUG    | __main__:trials:24 - Trial = 25755/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.518 | DEBUG    | __main__:trials:29 - Trial = 25755/30000 | Total reward = 39.77
2022-01-26 14:18:31.522 | DEBUG    | __main__:trials:24 - Trial = 25756/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.523 | DEBUG    | __main__:trials:29 - Trial = 25756/30000 | Total reward = 51.01
2022-01-26 14:18:31.526 | DEBUG    | __main__:trials:26 - Trial = 25757/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.528 | DEBUG    | __main__:trials:29 - Trial = 25757/30000 | Total reward = 28.03
2022-01-26 14:18:31.532 | DEBUG    | __main__:trials:24 - Trial = 25758/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.533 | DEBUG    | __main__:trials:29 - Trial = 25758/30000 | Total reward = 32.68
2022-01-26 14:18:31.537 | DEBUG    | __main__:trials:24 - Trial = 25759/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.538 | DEBUG    | __main__:trials:29 - Trial = 25759/30000 | Total reward = 30.05
2022-01-26 14:18:31.542 | DEBUG    | __main__:trials:24 - Trial = 25760/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.543 | DEBUG    | __main__:trials:29 - Trial = 25760/30000 | Total reward = 46.56
2022-01-26 14:18:31.547 | DEBUG    | __main__:trials:26 - Trial = 25761/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.548 | DEBUG    | __main__:trials:29 - Trial = 25761/30000 | Total reward = 11.06
2022-01-26 14:18:31.550 | DEBUG    | __main__:trials:26 - Trial = 25762/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.551 | DEBUG    | __main__:trials:29 - Trial = 25762/30000 | Total reward = 13.80
2022-01-26 14:18:31.555 | DEBUG    | __main__:trials:24 - Trial = 25763/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.557 | DEBUG    | __main__:trials:29 - Trial = 25763/30000 | Total reward = 47.65
2022-01-26 14:18:31.560 | DEBUG    | __main__:trials:24 - Trial = 25764/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.561 | DEBUG    | __main__:trials:29 - Trial = 25764/30000 | Total reward = 27.82
2022-01-26 14:18:31.565 | DEBUG    | __main__:trials:24 - Trial = 25765/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.567 | DEBUG    | __main__:trials:29 - Trial = 25765/30000 | Total reward = 46.56
2022-01-26 14:18:31.570 | DEBUG    | __main__:trials:24 - Trial = 25766/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.571 | DEBUG    | __main__:trials:29 - Trial = 25766/30000 | Total reward = 41.16
2022-01-26 14:18:31.575 | DEBUG    | __main__:trials:24 - Trial = 25767/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.577 | DEBUG    | __main__:trials:29 - Trial = 25767/30000 | Total reward = 38.19
2022-01-26 14:18:31.579 | DEBUG    | __main__:trials:26 - Trial = 25768/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.581 | DEBUG    | __main__:trials:29 - Trial = 25768/30000 | Total reward = 12.55
2022-01-26 14:18:31.584 | DEBUG    | __main__:trials:24 - Trial = 25769/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.586 | DEBUG    | __main__:trials:29 - Trial = 25769/30000 | Total reward = 36.01
2022-01-26 14:18:31.589 | DEBUG    | __main__:trials:24 - Trial = 25770/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.591 | DEBUG    | __main__:trials:29 - Trial = 25770/30000 | Total reward = 38.89
2022-01-26 14:18:31.595 | DEBUG    | __main__:trials:24 - Trial = 25771/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.595 | DEBUG    | __main__:trials:29 - Trial = 25771/30000 | Total reward = 50.27
2022-01-26 14:18:31.600 | DEBUG    | __main__:trials:24 - Trial = 25772/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.601 | DEBUG    | __main__:trials:29 - Trial = 25772/30000 | Total reward = 35.47
2022-01-26 14:18:31.604 | DEBUG    | __main__:trials:24 - Trial = 25773/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.606 | DEBUG    | __main__:trials:29 - Trial = 25773/30000 | Total reward = 37.31
2022-01-26 14:18:31.609 | DEBUG    | __main__:trials:24 - Trial = 25774/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.610 | DEBUG    | __main__:trials:29 - Trial = 25774/30000 | Total reward = 42.55
2022-01-26 14:18:31.614 | DEBUG    | __main__:trials:24 - Trial = 25775/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.615 | DEBUG    | __main__:trials:29 - Trial = 25775/30000 | Total reward = 25.24
2022-01-26 14:18:31.618 | DEBUG    | __main__:trials:24 - Trial = 25776/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.619 | DEBUG    | __main__:trials:29 - Trial = 25776/30000 | Total reward = 36.21
2022-01-26 14:18:31.622 | DEBUG    | __main__:trials:24 - Trial = 25777/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.624 | DEBUG    | __main__:trials:29 - Trial = 25777/30000 | Total reward = 36.53
2022-01-26 14:18:31.627 | DEBUG    | __main__:trials:24 - Trial = 25778/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.628 | DEBUG    | __main__:trials:29 - Trial = 25778/30000 | Total reward = 39.83
2022-01-26 14:18:31.631 | DEBUG    | __main__:trials:24 - Trial = 25779/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.633 | DEBUG    | __main__:trials:29 - Trial = 25779/30000 | Total reward = 36.18
2022-01-26 14:18:31.635 | DEBUG    | __main__:trials:26 - Trial = 25780/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.636 | DEBUG    | __main__:trials:29 - Trial = 25780/30000 | Total reward = 23.36
2022-01-26 14:18:31.639 | DEBUG    | __main__:trials:26 - Trial = 25781/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.641 | DEBUG    | __main__:trials:29 - Trial = 25781/30000 | Total reward = 28.15
2022-01-26 14:18:31.644 | DEBUG    | __main__:trials:26 - Trial = 25782/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.645 | DEBUG    | __main__:trials:29 - Trial = 25782/30000 | Total reward = 12.35
2022-01-26 14:18:31.648 | DEBUG    | __main__:trials:24 - Trial = 25783/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.650 | DEBUG    | __main__:trials:29 - Trial = 25783/30000 | Total reward = 35.66
2022-01-26 14:18:31.654 | DEBUG    | __main__:trials:24 - Trial = 25784/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.655 | DEBUG    | __main__:trials:29 - Trial = 25784/30000 | Total reward = 36.24
2022-01-26 14:18:31.658 | DEBUG    | __main__:trials:24 - Trial = 25785/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.660 | DEBUG    | __main__:trials:29 - Trial = 25785/30000 | Total reward = 27.20
2022-01-26 14:18:31.664 | DEBUG    | __main__:trials:24 - Trial = 25786/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.664 | DEBUG    | __main__:trials:29 - Trial = 25786/30000 | Total reward = 35.22
2022-01-26 14:18:31.669 | DEBUG    | __main__:trials:24 - Trial = 25787/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.670 | DEBUG    | __main__:trials:29 - Trial = 25787/30000 | Total reward = 37.21
2022-01-26 14:18:31.674 | DEBUG    | __main__:trials:24 - Trial = 25788/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.676 | DEBUG    | __main__:trials:29 - Trial = 25788/30000 | Total reward = 46.56
2022-01-26 14:18:31.679 | DEBUG    | __main__:trials:26 - Trial = 25789/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.681 | DEBUG    | __main__:trials:29 - Trial = 25789/30000 | Total reward = 22.20
2022-01-26 14:18:31.684 | DEBUG    | __main__:trials:24 - Trial = 25790/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.685 | DEBUG    | __main__:trials:29 - Trial = 25790/30000 | Total reward = 46.85
2022-01-26 14:18:31.690 | DEBUG    | __main__:trials:24 - Trial = 25791/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.690 | DEBUG    | __main__:trials:29 - Trial = 25791/30000 | Total reward = 38.47
2022-01-26 14:18:31.695 | DEBUG    | __main__:trials:24 - Trial = 25792/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.696 | DEBUG    | __main__:trials:29 - Trial = 25792/30000 | Total reward = 33.00
2022-01-26 14:18:31.700 | DEBUG    | __main__:trials:24 - Trial = 25793/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.701 | DEBUG    | __main__:trials:29 - Trial = 25793/30000 | Total reward = 45.40
2022-01-26 14:18:31.705 | DEBUG    | __main__:trials:24 - Trial = 25794/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.707 | DEBUG    | __main__:trials:29 - Trial = 25794/30000 | Total reward = 49.39
2022-01-26 14:18:31.710 | DEBUG    | __main__:trials:24 - Trial = 25795/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.712 | DEBUG    | __main__:trials:29 - Trial = 25795/30000 | Total reward = 39.83
2022-01-26 14:18:31.716 | DEBUG    | __main__:trials:24 - Trial = 25796/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.716 | DEBUG    | __main__:trials:29 - Trial = 25796/30000 | Total reward = 36.43
2022-01-26 14:18:31.720 | DEBUG    | __main__:trials:24 - Trial = 25797/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.721 | DEBUG    | __main__:trials:29 - Trial = 25797/30000 | Total reward = 43.55
2022-01-26 14:18:31.724 | DEBUG    | __main__:trials:26 - Trial = 25798/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.725 | DEBUG    | __main__:trials:29 - Trial = 25798/30000 | Total reward = 21.04
2022-01-26 14:18:31.727 | DEBUG    | __main__:trials:26 - Trial = 25799/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.728 | DEBUG    | __main__:trials:29 - Trial = 25799/30000 | Total reward = 14.47
2022-01-26 14:18:31.731 | DEBUG    | __main__:trials:24 - Trial = 25800/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.733 | DEBUG    | __main__:trials:29 - Trial = 25800/30000 | Total reward = 43.58
2022-01-26 14:18:31.737 | DEBUG    | __main__:trials:26 - Trial = 25801/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.737 | DEBUG    | __main__:trials:29 - Trial = 25801/30000 | Total reward = 28.26
2022-01-26 14:18:31.742 | DEBUG    | __main__:trials:24 - Trial = 25802/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.742 | DEBUG    | __main__:trials:29 - Trial = 25802/30000 | Total reward = 39.43
2022-01-26 14:18:31.747 | DEBUG    | __main__:trials:24 - Trial = 25803/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.747 | DEBUG    | __main__:trials:29 - Trial = 25803/30000 | Total reward = 48.89
2022-01-26 14:18:31.752 | DEBUG    | __main__:trials:24 - Trial = 25804/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.753 | DEBUG    | __main__:trials:29 - Trial = 25804/30000 | Total reward = 39.46
2022-01-26 14:18:31.757 | DEBUG    | __main__:trials:24 - Trial = 25805/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.758 | DEBUG    | __main__:trials:29 - Trial = 25805/30000 | Total reward = 39.80
2022-01-26 14:18:31.762 | DEBUG    | __main__:trials:24 - Trial = 25806/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.764 | DEBUG    | __main__:trials:29 - Trial = 25806/30000 | Total reward = 36.27
2022-01-26 14:18:31.766 | DEBUG    | __main__:trials:24 - Trial = 25807/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.768 | DEBUG    | __main__:trials:29 - Trial = 25807/30000 | Total reward = 35.48
2022-01-26 14:18:31.771 | DEBUG    | __main__:trials:26 - Trial = 25808/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.773 | DEBUG    | __main__:trials:29 - Trial = 25808/30000 | Total reward = 22.19
2022-01-26 14:18:31.776 | DEBUG    | __main__:trials:24 - Trial = 25809/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.778 | DEBUG    | __main__:trials:29 - Trial = 25809/30000 | Total reward = 39.52
2022-01-26 14:18:31.781 | DEBUG    | __main__:trials:24 - Trial = 25810/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.782 | DEBUG    | __main__:trials:29 - Trial = 25810/30000 | Total reward = 46.34
2022-01-26 14:18:31.786 | DEBUG    | __main__:trials:24 - Trial = 25811/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.788 | DEBUG    | __main__:trials:29 - Trial = 25811/30000 | Total reward = 33.47
2022-01-26 14:18:31.792 | DEBUG    | __main__:trials:24 - Trial = 25812/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.793 | DEBUG    | __main__:trials:29 - Trial = 25812/30000 | Total reward = 36.09
2022-01-26 14:18:31.797 | DEBUG    | __main__:trials:24 - Trial = 25813/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.798 | DEBUG    | __main__:trials:29 - Trial = 25813/30000 | Total reward = 35.85
2022-01-26 14:18:31.801 | DEBUG    | __main__:trials:24 - Trial = 25814/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.802 | DEBUG    | __main__:trials:29 - Trial = 25814/30000 | Total reward = 34.05
2022-01-26 14:18:31.804 | DEBUG    | __main__:trials:26 - Trial = 25815/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.806 | DEBUG    | __main__:trials:29 - Trial = 25815/30000 | Total reward = 10.12
2022-01-26 14:18:31.809 | DEBUG    | __main__:trials:24 - Trial = 25816/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.810 | DEBUG    | __main__:trials:29 - Trial = 25816/30000 | Total reward = 38.85
2022-01-26 14:18:31.814 | DEBUG    | __main__:trials:24 - Trial = 25817/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.815 | DEBUG    | __main__:trials:29 - Trial = 25817/30000 | Total reward = 35.74
2022-01-26 14:18:31.818 | DEBUG    | __main__:trials:24 - Trial = 25818/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.819 | DEBUG    | __main__:trials:29 - Trial = 25818/30000 | Total reward = 30.56
2022-01-26 14:18:31.823 | DEBUG    | __main__:trials:24 - Trial = 25819/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.825 | DEBUG    | __main__:trials:29 - Trial = 25819/30000 | Total reward = 28.76
2022-01-26 14:18:31.828 | DEBUG    | __main__:trials:24 - Trial = 25820/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.830 | DEBUG    | __main__:trials:29 - Trial = 25820/30000 | Total reward = 33.24
2022-01-26 14:18:31.832 | DEBUG    | __main__:trials:26 - Trial = 25821/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.834 | DEBUG    | __main__:trials:29 - Trial = 25821/30000 | Total reward = 11.09
2022-01-26 14:18:31.837 | DEBUG    | __main__:trials:24 - Trial = 25822/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.839 | DEBUG    | __main__:trials:29 - Trial = 25822/30000 | Total reward = 39.02
2022-01-26 14:18:31.843 | DEBUG    | __main__:trials:24 - Trial = 25823/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.843 | DEBUG    | __main__:trials:29 - Trial = 25823/30000 | Total reward = 38.24
2022-01-26 14:18:31.848 | DEBUG    | __main__:trials:24 - Trial = 25824/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.848 | DEBUG    | __main__:trials:29 - Trial = 25824/30000 | Total reward = 35.76
2022-01-26 14:18:31.853 | DEBUG    | __main__:trials:24 - Trial = 25825/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.855 | DEBUG    | __main__:trials:29 - Trial = 25825/30000 | Total reward = 37.46
2022-01-26 14:18:31.858 | DEBUG    | __main__:trials:24 - Trial = 25826/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.859 | DEBUG    | __main__:trials:29 - Trial = 25826/30000 | Total reward = 36.09
2022-01-26 14:18:31.863 | DEBUG    | __main__:trials:24 - Trial = 25827/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.864 | DEBUG    | __main__:trials:29 - Trial = 25827/30000 | Total reward = 36.60
2022-01-26 14:18:31.868 | DEBUG    | __main__:trials:26 - Trial = 25828/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.870 | DEBUG    | __main__:trials:29 - Trial = 25828/30000 | Total reward = 26.99
2022-01-26 14:18:31.873 | DEBUG    | __main__:trials:24 - Trial = 25829/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.875 | DEBUG    | __main__:trials:29 - Trial = 25829/30000 | Total reward = 36.07
2022-01-26 14:18:31.879 | DEBUG    | __main__:trials:24 - Trial = 25830/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.879 | DEBUG    | __main__:trials:29 - Trial = 25830/30000 | Total reward = 36.09
2022-01-26 14:18:31.884 | DEBUG    | __main__:trials:24 - Trial = 25831/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.885 | DEBUG    | __main__:trials:29 - Trial = 25831/30000 | Total reward = 36.80
2022-01-26 14:18:31.888 | DEBUG    | __main__:trials:24 - Trial = 25832/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.890 | DEBUG    | __main__:trials:29 - Trial = 25832/30000 | Total reward = 38.17
2022-01-26 14:18:31.894 | DEBUG    | __main__:trials:24 - Trial = 25833/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.894 | DEBUG    | __main__:trials:29 - Trial = 25833/30000 | Total reward = 34.60
2022-01-26 14:18:31.898 | DEBUG    | __main__:trials:24 - Trial = 25834/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.900 | DEBUG    | __main__:trials:29 - Trial = 25834/30000 | Total reward = 36.56
2022-01-26 14:18:31.903 | DEBUG    | __main__:trials:24 - Trial = 25835/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.904 | DEBUG    | __main__:trials:29 - Trial = 25835/30000 | Total reward = 28.45
2022-01-26 14:18:31.908 | DEBUG    | __main__:trials:26 - Trial = 25836/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.910 | DEBUG    | __main__:trials:29 - Trial = 25836/30000 | Total reward = 29.32
2022-01-26 14:18:31.913 | DEBUG    | __main__:trials:24 - Trial = 25837/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.915 | DEBUG    | __main__:trials:29 - Trial = 25837/30000 | Total reward = 29.58
2022-01-26 14:18:31.919 | DEBUG    | __main__:trials:24 - Trial = 25838/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.920 | DEBUG    | __main__:trials:29 - Trial = 25838/30000 | Total reward = 40.54
2022-01-26 14:18:31.924 | DEBUG    | __main__:trials:24 - Trial = 25839/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.925 | DEBUG    | __main__:trials:29 - Trial = 25839/30000 | Total reward = 34.19
2022-01-26 14:18:31.929 | DEBUG    | __main__:trials:26 - Trial = 25840/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.929 | DEBUG    | __main__:trials:29 - Trial = 25840/30000 | Total reward = 32.47
2022-01-26 14:18:31.933 | DEBUG    | __main__:trials:24 - Trial = 25841/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.933 | DEBUG    | __main__:trials:29 - Trial = 25841/30000 | Total reward = 43.70
2022-01-26 14:18:31.936 | DEBUG    | __main__:trials:26 - Trial = 25842/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.937 | DEBUG    | __main__:trials:29 - Trial = 25842/30000 | Total reward = 11.06
2022-01-26 14:18:31.941 | DEBUG    | __main__:trials:24 - Trial = 25843/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.943 | DEBUG    | __main__:trials:29 - Trial = 25843/30000 | Total reward = 34.99
2022-01-26 14:18:31.945 | DEBUG    | __main__:trials:26 - Trial = 25844/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.946 | DEBUG    | __main__:trials:29 - Trial = 25844/30000 | Total reward = 10.12
2022-01-26 14:18:31.950 | DEBUG    | __main__:trials:24 - Trial = 25845/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.951 | DEBUG    | __main__:trials:29 - Trial = 25845/30000 | Total reward = 39.58
2022-01-26 14:18:31.955 | DEBUG    | __main__:trials:24 - Trial = 25846/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.957 | DEBUG    | __main__:trials:29 - Trial = 25846/30000 | Total reward = 34.37
2022-01-26 14:18:31.960 | DEBUG    | __main__:trials:24 - Trial = 25847/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.962 | DEBUG    | __main__:trials:29 - Trial = 25847/30000 | Total reward = 32.26
2022-01-26 14:18:31.966 | DEBUG    | __main__:trials:24 - Trial = 25848/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.966 | DEBUG    | __main__:trials:29 - Trial = 25848/30000 | Total reward = 38.85
2022-01-26 14:18:31.971 | DEBUG    | __main__:trials:24 - Trial = 25849/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.972 | DEBUG    | __main__:trials:29 - Trial = 25849/30000 | Total reward = 38.60
2022-01-26 14:18:31.975 | DEBUG    | __main__:trials:26 - Trial = 25850/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.976 | DEBUG    | __main__:trials:29 - Trial = 25850/30000 | Total reward = 15.24
2022-01-26 14:18:31.980 | DEBUG    | __main__:trials:24 - Trial = 25851/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.981 | DEBUG    | __main__:trials:29 - Trial = 25851/30000 | Total reward = 24.20
2022-01-26 14:18:31.984 | DEBUG    | __main__:trials:26 - Trial = 25852/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:31.986 | DEBUG    | __main__:trials:29 - Trial = 25852/30000 | Total reward = 18.25
2022-01-26 14:18:31.988 | DEBUG    | __main__:trials:24 - Trial = 25853/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.990 | DEBUG    | __main__:trials:29 - Trial = 25853/30000 | Total reward = 40.87
2022-01-26 14:18:31.994 | DEBUG    | __main__:trials:24 - Trial = 25854/30000 | Max number of steps (20) reached
2022-01-26 14:18:31.994 | DEBUG    | __main__:trials:29 - Trial = 25854/30000 | Total reward = 36.30
2022-01-26 14:18:31.998 | DEBUG    | __main__:trials:24 - Trial = 25855/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.000 | DEBUG    | __main__:trials:29 - Trial = 25855/30000 | Total reward = 52.35
2022-01-26 14:18:32.002 | DEBUG    | __main__:trials:24 - Trial = 25856/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.004 | DEBUG    | __main__:trials:29 - Trial = 25856/30000 | Total reward = 50.44
2022-01-26 14:18:32.008 | DEBUG    | __main__:trials:26 - Trial = 25857/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.009 | DEBUG    | __main__:trials:29 - Trial = 25857/30000 | Total reward = 31.93
2022-01-26 14:18:32.013 | DEBUG    | __main__:trials:24 - Trial = 25858/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.014 | DEBUG    | __main__:trials:29 - Trial = 25858/30000 | Total reward = 30.59
2022-01-26 14:18:32.018 | DEBUG    | __main__:trials:26 - Trial = 25859/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.019 | DEBUG    | __main__:trials:29 - Trial = 25859/30000 | Total reward = 17.40
2022-01-26 14:18:32.023 | DEBUG    | __main__:trials:24 - Trial = 25860/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.024 | DEBUG    | __main__:trials:29 - Trial = 25860/30000 | Total reward = 26.36
2022-01-26 14:18:32.028 | DEBUG    | __main__:trials:24 - Trial = 25861/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.029 | DEBUG    | __main__:trials:29 - Trial = 25861/30000 | Total reward = 35.84
2022-01-26 14:18:32.032 | DEBUG    | __main__:trials:24 - Trial = 25862/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.034 | DEBUG    | __main__:trials:29 - Trial = 25862/30000 | Total reward = 51.89
2022-01-26 14:18:32.038 | DEBUG    | __main__:trials:24 - Trial = 25863/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.039 | DEBUG    | __main__:trials:29 - Trial = 25863/30000 | Total reward = 43.22
2022-01-26 14:18:32.042 | DEBUG    | __main__:trials:24 - Trial = 25864/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.044 | DEBUG    | __main__:trials:29 - Trial = 25864/30000 | Total reward = 36.66
2022-01-26 14:18:32.047 | DEBUG    | __main__:trials:24 - Trial = 25865/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.049 | DEBUG    | __main__:trials:29 - Trial = 25865/30000 | Total reward = 49.50
2022-01-26 14:18:32.052 | DEBUG    | __main__:trials:24 - Trial = 25866/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.053 | DEBUG    | __main__:trials:29 - Trial = 25866/30000 | Total reward = 33.36
2022-01-26 14:18:32.056 | DEBUG    | __main__:trials:24 - Trial = 25867/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.058 | DEBUG    | __main__:trials:29 - Trial = 25867/30000 | Total reward = 50.29
2022-01-26 14:18:32.061 | DEBUG    | __main__:trials:24 - Trial = 25868/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.063 | DEBUG    | __main__:trials:29 - Trial = 25868/30000 | Total reward = 34.58
2022-01-26 14:18:32.066 | DEBUG    | __main__:trials:24 - Trial = 25869/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.068 | DEBUG    | __main__:trials:29 - Trial = 25869/30000 | Total reward = 33.79
2022-01-26 14:18:32.071 | DEBUG    | __main__:trials:24 - Trial = 25870/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.072 | DEBUG    | __main__:trials:29 - Trial = 25870/30000 | Total reward = 38.00
2022-01-26 14:18:32.075 | DEBUG    | __main__:trials:24 - Trial = 25871/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.077 | DEBUG    | __main__:trials:29 - Trial = 25871/30000 | Total reward = 35.71
2022-01-26 14:18:32.079 | DEBUG    | __main__:trials:26 - Trial = 25872/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.080 | DEBUG    | __main__:trials:29 - Trial = 25872/30000 | Total reward = 9.62
2022-01-26 14:18:32.084 | DEBUG    | __main__:trials:26 - Trial = 25873/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.085 | DEBUG    | __main__:trials:29 - Trial = 25873/30000 | Total reward = 28.69
2022-01-26 14:18:32.088 | DEBUG    | __main__:trials:24 - Trial = 25874/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.090 | DEBUG    | __main__:trials:29 - Trial = 25874/30000 | Total reward = 45.00
2022-01-26 14:18:32.093 | DEBUG    | __main__:trials:24 - Trial = 25875/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.095 | DEBUG    | __main__:trials:29 - Trial = 25875/30000 | Total reward = 36.23
2022-01-26 14:18:32.099 | DEBUG    | __main__:trials:24 - Trial = 25876/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.100 | DEBUG    | __main__:trials:29 - Trial = 25876/30000 | Total reward = 43.34
2022-01-26 14:18:32.103 | DEBUG    | __main__:trials:24 - Trial = 25877/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.105 | DEBUG    | __main__:trials:29 - Trial = 25877/30000 | Total reward = 52.28
2022-01-26 14:18:32.108 | DEBUG    | __main__:trials:24 - Trial = 25878/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.109 | DEBUG    | __main__:trials:29 - Trial = 25878/30000 | Total reward = 33.22
2022-01-26 14:18:32.112 | DEBUG    | __main__:trials:24 - Trial = 25879/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.114 | DEBUG    | __main__:trials:29 - Trial = 25879/30000 | Total reward = 37.06
2022-01-26 14:18:32.118 | DEBUG    | __main__:trials:24 - Trial = 25880/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.119 | DEBUG    | __main__:trials:29 - Trial = 25880/30000 | Total reward = 39.30
2022-01-26 14:18:32.123 | DEBUG    | __main__:trials:24 - Trial = 25881/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.124 | DEBUG    | __main__:trials:29 - Trial = 25881/30000 | Total reward = 38.68
2022-01-26 14:18:32.128 | DEBUG    | __main__:trials:24 - Trial = 25882/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.129 | DEBUG    | __main__:trials:29 - Trial = 25882/30000 | Total reward = 30.92
2022-01-26 14:18:32.132 | DEBUG    | __main__:trials:24 - Trial = 25883/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.134 | DEBUG    | __main__:trials:29 - Trial = 25883/30000 | Total reward = 46.77
2022-01-26 14:18:32.138 | DEBUG    | __main__:trials:24 - Trial = 25884/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.140 | DEBUG    | __main__:trials:29 - Trial = 25884/30000 | Total reward = 42.81
2022-01-26 14:18:32.143 | DEBUG    | __main__:trials:24 - Trial = 25885/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.144 | DEBUG    | __main__:trials:29 - Trial = 25885/30000 | Total reward = 47.39
2022-01-26 14:18:32.148 | DEBUG    | __main__:trials:24 - Trial = 25886/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.149 | DEBUG    | __main__:trials:29 - Trial = 25886/30000 | Total reward = 41.98
2022-01-26 14:18:32.153 | DEBUG    | __main__:trials:26 - Trial = 25887/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.155 | DEBUG    | __main__:trials:29 - Trial = 25887/30000 | Total reward = 31.39
2022-01-26 14:18:32.158 | DEBUG    | __main__:trials:24 - Trial = 25888/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.160 | DEBUG    | __main__:trials:29 - Trial = 25888/30000 | Total reward = 39.88
2022-01-26 14:18:32.164 | DEBUG    | __main__:trials:24 - Trial = 25889/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.165 | DEBUG    | __main__:trials:29 - Trial = 25889/30000 | Total reward = 39.74
2022-01-26 14:18:32.169 | DEBUG    | __main__:trials:24 - Trial = 25890/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.171 | DEBUG    | __main__:trials:29 - Trial = 25890/30000 | Total reward = 39.28
2022-01-26 14:18:32.174 | DEBUG    | __main__:trials:24 - Trial = 25891/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.176 | DEBUG    | __main__:trials:29 - Trial = 25891/30000 | Total reward = 34.61
2022-01-26 14:18:32.180 | DEBUG    | __main__:trials:24 - Trial = 25892/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.180 | DEBUG    | __main__:trials:29 - Trial = 25892/30000 | Total reward = 40.77
2022-01-26 14:18:32.184 | DEBUG    | __main__:trials:26 - Trial = 25893/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.185 | DEBUG    | __main__:trials:29 - Trial = 25893/30000 | Total reward = 11.80
2022-01-26 14:18:32.188 | DEBUG    | __main__:trials:26 - Trial = 25894/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.190 | DEBUG    | __main__:trials:29 - Trial = 25894/30000 | Total reward = 28.26
2022-01-26 14:18:32.193 | DEBUG    | __main__:trials:24 - Trial = 25895/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.194 | DEBUG    | __main__:trials:29 - Trial = 25895/30000 | Total reward = 37.41
2022-01-26 14:18:32.198 | DEBUG    | __main__:trials:24 - Trial = 25896/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.199 | DEBUG    | __main__:trials:29 - Trial = 25896/30000 | Total reward = 45.62
2022-01-26 14:18:32.203 | DEBUG    | __main__:trials:24 - Trial = 25897/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.204 | DEBUG    | __main__:trials:29 - Trial = 25897/30000 | Total reward = 39.57
2022-01-26 14:18:32.208 | DEBUG    | __main__:trials:24 - Trial = 25898/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.209 | DEBUG    | __main__:trials:29 - Trial = 25898/30000 | Total reward = 37.78
2022-01-26 14:18:32.213 | DEBUG    | __main__:trials:24 - Trial = 25899/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.215 | DEBUG    | __main__:trials:29 - Trial = 25899/30000 | Total reward = 44.13
2022-01-26 14:18:32.218 | DEBUG    | __main__:trials:26 - Trial = 25900/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.219 | DEBUG    | __main__:trials:29 - Trial = 25900/30000 | Total reward = 24.09
2022-01-26 14:18:32.223 | DEBUG    | __main__:trials:24 - Trial = 25901/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.225 | DEBUG    | __main__:trials:29 - Trial = 25901/30000 | Total reward = 47.94
2022-01-26 14:18:32.228 | DEBUG    | __main__:trials:24 - Trial = 25902/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.230 | DEBUG    | __main__:trials:29 - Trial = 25902/30000 | Total reward = 38.39
2022-01-26 14:18:32.234 | DEBUG    | __main__:trials:24 - Trial = 25903/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.235 | DEBUG    | __main__:trials:29 - Trial = 25903/30000 | Total reward = 32.31
2022-01-26 14:18:32.238 | DEBUG    | __main__:trials:24 - Trial = 25904/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.240 | DEBUG    | __main__:trials:29 - Trial = 25904/30000 | Total reward = 41.69
2022-01-26 14:18:32.243 | DEBUG    | __main__:trials:24 - Trial = 25905/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.245 | DEBUG    | __main__:trials:29 - Trial = 25905/30000 | Total reward = 40.66
2022-01-26 14:18:32.248 | DEBUG    | __main__:trials:24 - Trial = 25906/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.250 | DEBUG    | __main__:trials:29 - Trial = 25906/30000 | Total reward = 41.45
2022-01-26 14:18:32.254 | DEBUG    | __main__:trials:24 - Trial = 25907/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.255 | DEBUG    | __main__:trials:29 - Trial = 25907/30000 | Total reward = 40.39
2022-01-26 14:18:32.258 | DEBUG    | __main__:trials:24 - Trial = 25908/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.260 | DEBUG    | __main__:trials:29 - Trial = 25908/30000 | Total reward = 53.11
2022-01-26 14:18:32.263 | DEBUG    | __main__:trials:24 - Trial = 25909/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.264 | DEBUG    | __main__:trials:29 - Trial = 25909/30000 | Total reward = 26.06
2022-01-26 14:18:32.269 | DEBUG    | __main__:trials:24 - Trial = 25910/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.270 | DEBUG    | __main__:trials:29 - Trial = 25910/30000 | Total reward = 45.62
2022-01-26 14:18:32.274 | DEBUG    | __main__:trials:24 - Trial = 25911/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.276 | DEBUG    | __main__:trials:29 - Trial = 25911/30000 | Total reward = 55.15
2022-01-26 14:18:32.280 | DEBUG    | __main__:trials:24 - Trial = 25912/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.281 | DEBUG    | __main__:trials:29 - Trial = 25912/30000 | Total reward = 42.61
2022-01-26 14:18:32.284 | DEBUG    | __main__:trials:24 - Trial = 25913/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.285 | DEBUG    | __main__:trials:29 - Trial = 25913/30000 | Total reward = 50.37
2022-01-26 14:18:32.288 | DEBUG    | __main__:trials:24 - Trial = 25914/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.289 | DEBUG    | __main__:trials:29 - Trial = 25914/30000 | Total reward = 31.40
2022-01-26 14:18:32.292 | DEBUG    | __main__:trials:24 - Trial = 25915/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.293 | DEBUG    | __main__:trials:29 - Trial = 25915/30000 | Total reward = 35.54
2022-01-26 14:18:32.296 | DEBUG    | __main__:trials:24 - Trial = 25916/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.299 | DEBUG    | __main__:trials:29 - Trial = 25916/30000 | Total reward = 32.29
2022-01-26 14:18:32.301 | DEBUG    | __main__:trials:24 - Trial = 25917/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.304 | DEBUG    | __main__:trials:29 - Trial = 25917/30000 | Total reward = 47.84
2022-01-26 14:18:32.307 | DEBUG    | __main__:trials:24 - Trial = 25918/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.308 | DEBUG    | __main__:trials:29 - Trial = 25918/30000 | Total reward = 44.39
2022-01-26 14:18:32.312 | DEBUG    | __main__:trials:24 - Trial = 25919/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.314 | DEBUG    | __main__:trials:29 - Trial = 25919/30000 | Total reward = 45.34
2022-01-26 14:18:32.317 | DEBUG    | __main__:trials:24 - Trial = 25920/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.319 | DEBUG    | __main__:trials:29 - Trial = 25920/30000 | Total reward = 45.54
2022-01-26 14:18:32.322 | DEBUG    | __main__:trials:24 - Trial = 25921/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.323 | DEBUG    | __main__:trials:29 - Trial = 25921/30000 | Total reward = 44.21
2022-01-26 14:18:32.326 | DEBUG    | __main__:trials:24 - Trial = 25922/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.328 | DEBUG    | __main__:trials:29 - Trial = 25922/30000 | Total reward = 44.21
2022-01-26 14:18:32.331 | DEBUG    | __main__:trials:24 - Trial = 25923/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.332 | DEBUG    | __main__:trials:29 - Trial = 25923/30000 | Total reward = 45.76
2022-01-26 14:18:32.335 | DEBUG    | __main__:trials:24 - Trial = 25924/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.336 | DEBUG    | __main__:trials:29 - Trial = 25924/30000 | Total reward = 46.72
2022-01-26 14:18:32.339 | DEBUG    | __main__:trials:24 - Trial = 25925/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.341 | DEBUG    | __main__:trials:29 - Trial = 25925/30000 | Total reward = 42.66
2022-01-26 14:18:32.344 | DEBUG    | __main__:trials:24 - Trial = 25926/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.344 | DEBUG    | __main__:trials:29 - Trial = 25926/30000 | Total reward = 32.91
2022-01-26 14:18:32.348 | DEBUG    | __main__:trials:24 - Trial = 25927/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.349 | DEBUG    | __main__:trials:29 - Trial = 25927/30000 | Total reward = 24.66
2022-01-26 14:18:32.352 | DEBUG    | __main__:trials:24 - Trial = 25928/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.354 | DEBUG    | __main__:trials:29 - Trial = 25928/30000 | Total reward = 34.82
2022-01-26 14:18:32.358 | DEBUG    | __main__:trials:24 - Trial = 25929/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.358 | DEBUG    | __main__:trials:29 - Trial = 25929/30000 | Total reward = 42.39
2022-01-26 14:18:32.363 | DEBUG    | __main__:trials:24 - Trial = 25930/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.364 | DEBUG    | __main__:trials:29 - Trial = 25930/30000 | Total reward = 44.68
2022-01-26 14:18:32.368 | DEBUG    | __main__:trials:24 - Trial = 25931/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.369 | DEBUG    | __main__:trials:29 - Trial = 25931/30000 | Total reward = 45.62
2022-01-26 14:18:32.372 | DEBUG    | __main__:trials:24 - Trial = 25932/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.374 | DEBUG    | __main__:trials:29 - Trial = 25932/30000 | Total reward = 41.06
2022-01-26 14:18:32.377 | DEBUG    | __main__:trials:24 - Trial = 25933/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.378 | DEBUG    | __main__:trials:29 - Trial = 25933/30000 | Total reward = 36.32
2022-01-26 14:18:32.382 | DEBUG    | __main__:trials:24 - Trial = 25934/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.383 | DEBUG    | __main__:trials:29 - Trial = 25934/30000 | Total reward = 49.23
2022-01-26 14:18:32.386 | DEBUG    | __main__:trials:24 - Trial = 25935/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.387 | DEBUG    | __main__:trials:29 - Trial = 25935/30000 | Total reward = 45.41
2022-01-26 14:18:32.390 | DEBUG    | __main__:trials:26 - Trial = 25936/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.391 | DEBUG    | __main__:trials:29 - Trial = 25936/30000 | Total reward = 15.87
2022-01-26 14:18:32.395 | DEBUG    | __main__:trials:24 - Trial = 25937/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.396 | DEBUG    | __main__:trials:29 - Trial = 25937/30000 | Total reward = 41.10
2022-01-26 14:18:32.399 | DEBUG    | __main__:trials:24 - Trial = 25938/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.401 | DEBUG    | __main__:trials:29 - Trial = 25938/30000 | Total reward = 35.44
2022-01-26 14:18:32.404 | DEBUG    | __main__:trials:24 - Trial = 25939/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.406 | DEBUG    | __main__:trials:29 - Trial = 25939/30000 | Total reward = 37.98
2022-01-26 14:18:32.408 | DEBUG    | __main__:trials:26 - Trial = 25940/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.410 | DEBUG    | __main__:trials:29 - Trial = 25940/30000 | Total reward = 24.58
2022-01-26 14:18:32.413 | DEBUG    | __main__:trials:24 - Trial = 25941/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.414 | DEBUG    | __main__:trials:29 - Trial = 25941/30000 | Total reward = 31.78
2022-01-26 14:18:32.417 | DEBUG    | __main__:trials:24 - Trial = 25942/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.419 | DEBUG    | __main__:trials:29 - Trial = 25942/30000 | Total reward = 37.67
2022-01-26 14:18:32.422 | DEBUG    | __main__:trials:26 - Trial = 25943/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.422 | DEBUG    | __main__:trials:29 - Trial = 25943/30000 | Total reward = 17.90
2022-01-26 14:18:32.426 | DEBUG    | __main__:trials:24 - Trial = 25944/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.427 | DEBUG    | __main__:trials:29 - Trial = 25944/30000 | Total reward = 40.18
2022-01-26 14:18:32.431 | DEBUG    | __main__:trials:24 - Trial = 25945/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.431 | DEBUG    | __main__:trials:29 - Trial = 25945/30000 | Total reward = 39.40
2022-01-26 14:18:32.435 | DEBUG    | __main__:trials:24 - Trial = 25946/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.435 | DEBUG    | __main__:trials:29 - Trial = 25946/30000 | Total reward = 45.62
2022-01-26 14:18:32.439 | DEBUG    | __main__:trials:26 - Trial = 25947/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.439 | DEBUG    | __main__:trials:29 - Trial = 25947/30000 | Total reward = 23.89
2022-01-26 14:18:32.443 | DEBUG    | __main__:trials:24 - Trial = 25948/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.444 | DEBUG    | __main__:trials:29 - Trial = 25948/30000 | Total reward = 46.08
2022-01-26 14:18:32.447 | DEBUG    | __main__:trials:24 - Trial = 25949/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.448 | DEBUG    | __main__:trials:29 - Trial = 25949/30000 | Total reward = 43.38
2022-01-26 14:18:32.451 | DEBUG    | __main__:trials:24 - Trial = 25950/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.451 | DEBUG    | __main__:trials:29 - Trial = 25950/30000 | Total reward = 29.46
2022-01-26 14:18:32.455 | DEBUG    | __main__:trials:24 - Trial = 25951/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.455 | DEBUG    | __main__:trials:29 - Trial = 25951/30000 | Total reward = 34.87
2022-01-26 14:18:32.459 | DEBUG    | __main__:trials:24 - Trial = 25952/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.459 | DEBUG    | __main__:trials:29 - Trial = 25952/30000 | Total reward = 45.79
2022-01-26 14:18:32.463 | DEBUG    | __main__:trials:26 - Trial = 25953/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.464 | DEBUG    | __main__:trials:29 - Trial = 25953/30000 | Total reward = 14.61
2022-01-26 14:18:32.468 | DEBUG    | __main__:trials:26 - Trial = 25954/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.469 | DEBUG    | __main__:trials:29 - Trial = 25954/30000 | Total reward = 20.57
2022-01-26 14:18:32.472 | DEBUG    | __main__:trials:24 - Trial = 25955/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.473 | DEBUG    | __main__:trials:29 - Trial = 25955/30000 | Total reward = 28.13
2022-01-26 14:18:32.476 | DEBUG    | __main__:trials:24 - Trial = 25956/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.477 | DEBUG    | __main__:trials:29 - Trial = 25956/30000 | Total reward = 36.05
2022-01-26 14:18:32.481 | DEBUG    | __main__:trials:24 - Trial = 25957/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.481 | DEBUG    | __main__:trials:29 - Trial = 25957/30000 | Total reward = 41.02
2022-01-26 14:18:32.485 | DEBUG    | __main__:trials:24 - Trial = 25958/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.486 | DEBUG    | __main__:trials:29 - Trial = 25958/30000 | Total reward = 40.47
2022-01-26 14:18:32.490 | DEBUG    | __main__:trials:24 - Trial = 25959/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.491 | DEBUG    | __main__:trials:29 - Trial = 25959/30000 | Total reward = 39.31
2022-01-26 14:18:32.494 | DEBUG    | __main__:trials:24 - Trial = 25960/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.495 | DEBUG    | __main__:trials:29 - Trial = 25960/30000 | Total reward = 17.08
2022-01-26 14:18:32.498 | DEBUG    | __main__:trials:24 - Trial = 25961/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.499 | DEBUG    | __main__:trials:29 - Trial = 25961/30000 | Total reward = 41.66
2022-01-26 14:18:32.503 | DEBUG    | __main__:trials:24 - Trial = 25962/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.503 | DEBUG    | __main__:trials:29 - Trial = 25962/30000 | Total reward = 34.88
2022-01-26 14:18:32.507 | DEBUG    | __main__:trials:26 - Trial = 25963/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.507 | DEBUG    | __main__:trials:29 - Trial = 25963/30000 | Total reward = 23.52
2022-01-26 14:18:32.512 | DEBUG    | __main__:trials:24 - Trial = 25964/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.514 | DEBUG    | __main__:trials:29 - Trial = 25964/30000 | Total reward = 41.98
2022-01-26 14:18:32.517 | DEBUG    | __main__:trials:24 - Trial = 25965/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.517 | DEBUG    | __main__:trials:29 - Trial = 25965/30000 | Total reward = 44.16
2022-01-26 14:18:32.520 | DEBUG    | __main__:trials:24 - Trial = 25966/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.521 | DEBUG    | __main__:trials:29 - Trial = 25966/30000 | Total reward = 37.62
2022-01-26 14:18:32.524 | DEBUG    | __main__:trials:24 - Trial = 25967/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.525 | DEBUG    | __main__:trials:29 - Trial = 25967/30000 | Total reward = 44.32
2022-01-26 14:18:32.529 | DEBUG    | __main__:trials:24 - Trial = 25968/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.530 | DEBUG    | __main__:trials:29 - Trial = 25968/30000 | Total reward = 41.06
2022-01-26 14:18:32.533 | DEBUG    | __main__:trials:24 - Trial = 25969/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.534 | DEBUG    | __main__:trials:29 - Trial = 25969/30000 | Total reward = 46.03
2022-01-26 14:18:32.537 | DEBUG    | __main__:trials:24 - Trial = 25970/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.538 | DEBUG    | __main__:trials:29 - Trial = 25970/30000 | Total reward = 43.30
2022-01-26 14:18:32.541 | DEBUG    | __main__:trials:26 - Trial = 25971/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.542 | DEBUG    | __main__:trials:29 - Trial = 25971/30000 | Total reward = 23.42
2022-01-26 14:18:32.545 | DEBUG    | __main__:trials:24 - Trial = 25972/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.547 | DEBUG    | __main__:trials:29 - Trial = 25972/30000 | Total reward = 43.58
2022-01-26 14:18:32.550 | DEBUG    | __main__:trials:24 - Trial = 25973/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.550 | DEBUG    | __main__:trials:29 - Trial = 25973/30000 | Total reward = 41.36
2022-01-26 14:18:32.554 | DEBUG    | __main__:trials:24 - Trial = 25974/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.554 | DEBUG    | __main__:trials:29 - Trial = 25974/30000 | Total reward = 41.89
2022-01-26 14:18:32.558 | DEBUG    | __main__:trials:24 - Trial = 25975/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.560 | DEBUG    | __main__:trials:29 - Trial = 25975/30000 | Total reward = 61.34
2022-01-26 14:18:32.563 | DEBUG    | __main__:trials:24 - Trial = 25976/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.563 | DEBUG    | __main__:trials:29 - Trial = 25976/30000 | Total reward = 30.91
2022-01-26 14:18:32.566 | DEBUG    | __main__:trials:26 - Trial = 25977/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.567 | DEBUG    | __main__:trials:29 - Trial = 25977/30000 | Total reward = 17.11
2022-01-26 14:18:32.570 | DEBUG    | __main__:trials:24 - Trial = 25978/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.571 | DEBUG    | __main__:trials:29 - Trial = 25978/30000 | Total reward = 35.92
2022-01-26 14:18:32.574 | DEBUG    | __main__:trials:24 - Trial = 25979/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.575 | DEBUG    | __main__:trials:29 - Trial = 25979/30000 | Total reward = 37.10
2022-01-26 14:18:32.578 | DEBUG    | __main__:trials:24 - Trial = 25980/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.580 | DEBUG    | __main__:trials:29 - Trial = 25980/30000 | Total reward = 45.88
2022-01-26 14:18:32.583 | DEBUG    | __main__:trials:24 - Trial = 25981/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.584 | DEBUG    | __main__:trials:29 - Trial = 25981/30000 | Total reward = 41.30
2022-01-26 14:18:32.587 | DEBUG    | __main__:trials:26 - Trial = 25982/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.587 | DEBUG    | __main__:trials:29 - Trial = 25982/30000 | Total reward = 20.66
2022-01-26 14:18:32.591 | DEBUG    | __main__:trials:24 - Trial = 25983/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.592 | DEBUG    | __main__:trials:29 - Trial = 25983/30000 | Total reward = 46.45
2022-01-26 14:18:32.595 | DEBUG    | __main__:trials:24 - Trial = 25984/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.597 | DEBUG    | __main__:trials:29 - Trial = 25984/30000 | Total reward = 41.02
2022-01-26 14:18:32.599 | DEBUG    | __main__:trials:26 - Trial = 25985/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.601 | DEBUG    | __main__:trials:29 - Trial = 25985/30000 | Total reward = 28.00
2022-01-26 14:18:32.604 | DEBUG    | __main__:trials:26 - Trial = 25986/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.604 | DEBUG    | __main__:trials:29 - Trial = 25986/30000 | Total reward = 27.65
2022-01-26 14:18:32.608 | DEBUG    | __main__:trials:24 - Trial = 25987/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.609 | DEBUG    | __main__:trials:29 - Trial = 25987/30000 | Total reward = 52.40
2022-01-26 14:18:32.612 | DEBUG    | __main__:trials:24 - Trial = 25988/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.613 | DEBUG    | __main__:trials:29 - Trial = 25988/30000 | Total reward = 44.57
2022-01-26 14:18:32.616 | DEBUG    | __main__:trials:24 - Trial = 25989/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.617 | DEBUG    | __main__:trials:29 - Trial = 25989/30000 | Total reward = 27.15
2022-01-26 14:18:32.620 | DEBUG    | __main__:trials:24 - Trial = 25990/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.621 | DEBUG    | __main__:trials:29 - Trial = 25990/30000 | Total reward = 41.09
2022-01-26 14:18:32.624 | DEBUG    | __main__:trials:24 - Trial = 25991/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.625 | DEBUG    | __main__:trials:29 - Trial = 25991/30000 | Total reward = 31.57
2022-01-26 14:18:32.628 | DEBUG    | __main__:trials:24 - Trial = 25992/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.630 | DEBUG    | __main__:trials:29 - Trial = 25992/30000 | Total reward = 41.62
2022-01-26 14:18:32.634 | DEBUG    | __main__:trials:26 - Trial = 25993/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.634 | DEBUG    | __main__:trials:29 - Trial = 25993/30000 | Total reward = 26.70
2022-01-26 14:18:32.637 | DEBUG    | __main__:trials:26 - Trial = 25994/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.638 | DEBUG    | __main__:trials:29 - Trial = 25994/30000 | Total reward = 11.06
2022-01-26 14:18:32.641 | DEBUG    | __main__:trials:24 - Trial = 25995/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.642 | DEBUG    | __main__:trials:29 - Trial = 25995/30000 | Total reward = 38.71
2022-01-26 14:18:32.645 | DEBUG    | __main__:trials:24 - Trial = 25996/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.646 | DEBUG    | __main__:trials:29 - Trial = 25996/30000 | Total reward = 37.93
2022-01-26 14:18:32.650 | DEBUG    | __main__:trials:24 - Trial = 25997/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.650 | DEBUG    | __main__:trials:29 - Trial = 25997/30000 | Total reward = 47.22
2022-01-26 14:18:32.654 | DEBUG    | __main__:trials:24 - Trial = 25998/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.655 | DEBUG    | __main__:trials:29 - Trial = 25998/30000 | Total reward = 41.09
2022-01-26 14:18:32.657 | DEBUG    | __main__:trials:26 - Trial = 25999/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.658 | DEBUG    | __main__:trials:29 - Trial = 25999/30000 | Total reward = 14.19
2022-01-26 14:18:32.661 | DEBUG    | __main__:trials:26 - Trial = 26000/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.662 | DEBUG    | __main__:trials:29 - Trial = 26000/30000 | Total reward = 23.01
2022-01-26 14:18:32.666 | DEBUG    | __main__:trials:24 - Trial = 26001/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.666 | DEBUG    | __main__:trials:29 - Trial = 26001/30000 | Total reward = 41.76
2022-01-26 14:18:32.669 | DEBUG    | __main__:trials:24 - Trial = 26002/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.671 | DEBUG    | __main__:trials:29 - Trial = 26002/30000 | Total reward = 44.05
2022-01-26 14:18:32.674 | DEBUG    | __main__:trials:24 - Trial = 26003/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.676 | DEBUG    | __main__:trials:29 - Trial = 26003/30000 | Total reward = 34.94
2022-01-26 14:18:32.679 | DEBUG    | __main__:trials:24 - Trial = 26004/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.680 | DEBUG    | __main__:trials:29 - Trial = 26004/30000 | Total reward = 46.14
2022-01-26 14:18:32.683 | DEBUG    | __main__:trials:24 - Trial = 26005/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.685 | DEBUG    | __main__:trials:29 - Trial = 26005/30000 | Total reward = 45.45
2022-01-26 14:18:32.688 | DEBUG    | __main__:trials:24 - Trial = 26006/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.688 | DEBUG    | __main__:trials:29 - Trial = 26006/30000 | Total reward = 36.60
2022-01-26 14:18:32.692 | DEBUG    | __main__:trials:24 - Trial = 26007/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.692 | DEBUG    | __main__:trials:29 - Trial = 26007/30000 | Total reward = 39.57
2022-01-26 14:18:32.695 | DEBUG    | __main__:trials:26 - Trial = 26008/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.696 | DEBUG    | __main__:trials:29 - Trial = 26008/30000 | Total reward = 23.42
2022-01-26 14:18:32.699 | DEBUG    | __main__:trials:24 - Trial = 26009/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.700 | DEBUG    | __main__:trials:29 - Trial = 26009/30000 | Total reward = 31.65
2022-01-26 14:18:32.704 | DEBUG    | __main__:trials:24 - Trial = 26010/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.706 | DEBUG    | __main__:trials:29 - Trial = 26010/30000 | Total reward = 33.44
2022-01-26 14:18:32.708 | DEBUG    | __main__:trials:24 - Trial = 26011/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.709 | DEBUG    | __main__:trials:29 - Trial = 26011/30000 | Total reward = 32.31
2022-01-26 14:18:32.713 | DEBUG    | __main__:trials:24 - Trial = 26012/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.714 | DEBUG    | __main__:trials:29 - Trial = 26012/30000 | Total reward = 34.47
2022-01-26 14:18:32.717 | DEBUG    | __main__:trials:24 - Trial = 26013/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.718 | DEBUG    | __main__:trials:29 - Trial = 26013/30000 | Total reward = 36.72
2022-01-26 14:18:32.721 | DEBUG    | __main__:trials:26 - Trial = 26014/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.721 | DEBUG    | __main__:trials:29 - Trial = 26014/30000 | Total reward = 24.87
2022-01-26 14:18:32.725 | DEBUG    | __main__:trials:24 - Trial = 26015/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.727 | DEBUG    | __main__:trials:29 - Trial = 26015/30000 | Total reward = 31.93
2022-01-26 14:18:32.729 | DEBUG    | __main__:trials:26 - Trial = 26016/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.730 | DEBUG    | __main__:trials:29 - Trial = 26016/30000 | Total reward = 18.00
2022-01-26 14:18:32.733 | DEBUG    | __main__:trials:26 - Trial = 26017/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.733 | DEBUG    | __main__:trials:29 - Trial = 26017/30000 | Total reward = 20.31
2022-01-26 14:18:32.737 | DEBUG    | __main__:trials:24 - Trial = 26018/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.737 | DEBUG    | __main__:trials:29 - Trial = 26018/30000 | Total reward = 33.75
2022-01-26 14:18:32.741 | DEBUG    | __main__:trials:24 - Trial = 26019/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.741 | DEBUG    | __main__:trials:29 - Trial = 26019/30000 | Total reward = 41.01
2022-01-26 14:18:32.744 | DEBUG    | __main__:trials:26 - Trial = 26020/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.744 | DEBUG    | __main__:trials:29 - Trial = 26020/30000 | Total reward = 17.03
2022-01-26 14:18:32.748 | DEBUG    | __main__:trials:24 - Trial = 26021/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.748 | DEBUG    | __main__:trials:29 - Trial = 26021/30000 | Total reward = 39.76
2022-01-26 14:18:32.752 | DEBUG    | __main__:trials:24 - Trial = 26022/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.752 | DEBUG    | __main__:trials:29 - Trial = 26022/30000 | Total reward = 35.65
2022-01-26 14:18:32.757 | DEBUG    | __main__:trials:24 - Trial = 26023/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.759 | DEBUG    | __main__:trials:29 - Trial = 26023/30000 | Total reward = 35.57
2022-01-26 14:18:32.762 | DEBUG    | __main__:trials:24 - Trial = 26024/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.764 | DEBUG    | __main__:trials:29 - Trial = 26024/30000 | Total reward = 39.51
2022-01-26 14:18:32.767 | DEBUG    | __main__:trials:26 - Trial = 26025/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.768 | DEBUG    | __main__:trials:29 - Trial = 26025/30000 | Total reward = 23.42
2022-01-26 14:18:32.771 | DEBUG    | __main__:trials:24 - Trial = 26026/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.773 | DEBUG    | __main__:trials:29 - Trial = 26026/30000 | Total reward = 36.44
2022-01-26 14:18:32.776 | DEBUG    | __main__:trials:24 - Trial = 26027/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.777 | DEBUG    | __main__:trials:29 - Trial = 26027/30000 | Total reward = 39.49
2022-01-26 14:18:32.781 | DEBUG    | __main__:trials:24 - Trial = 26028/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.782 | DEBUG    | __main__:trials:29 - Trial = 26028/30000 | Total reward = 42.78
2022-01-26 14:18:32.786 | DEBUG    | __main__:trials:24 - Trial = 26029/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.787 | DEBUG    | __main__:trials:29 - Trial = 26029/30000 | Total reward = 44.92
2022-01-26 14:18:32.790 | DEBUG    | __main__:trials:26 - Trial = 26030/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.792 | DEBUG    | __main__:trials:29 - Trial = 26030/30000 | Total reward = 25.09
2022-01-26 14:18:32.795 | DEBUG    | __main__:trials:24 - Trial = 26031/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.796 | DEBUG    | __main__:trials:29 - Trial = 26031/30000 | Total reward = 36.34
2022-01-26 14:18:32.799 | DEBUG    | __main__:trials:24 - Trial = 26032/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.801 | DEBUG    | __main__:trials:29 - Trial = 26032/30000 | Total reward = 47.02
2022-01-26 14:18:32.804 | DEBUG    | __main__:trials:24 - Trial = 26033/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.805 | DEBUG    | __main__:trials:29 - Trial = 26033/30000 | Total reward = 45.79
2022-01-26 14:18:32.809 | DEBUG    | __main__:trials:24 - Trial = 26034/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.809 | DEBUG    | __main__:trials:29 - Trial = 26034/30000 | Total reward = 52.27
2022-01-26 14:18:32.813 | DEBUG    | __main__:trials:24 - Trial = 26035/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.814 | DEBUG    | __main__:trials:29 - Trial = 26035/30000 | Total reward = 54.65
2022-01-26 14:18:32.817 | DEBUG    | __main__:trials:24 - Trial = 26036/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.818 | DEBUG    | __main__:trials:29 - Trial = 26036/30000 | Total reward = 31.75
2022-01-26 14:18:32.821 | DEBUG    | __main__:trials:24 - Trial = 26037/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.822 | DEBUG    | __main__:trials:29 - Trial = 26037/30000 | Total reward = 47.64
2022-01-26 14:18:32.825 | DEBUG    | __main__:trials:24 - Trial = 26038/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.826 | DEBUG    | __main__:trials:29 - Trial = 26038/30000 | Total reward = 43.38
2022-01-26 14:18:32.829 | DEBUG    | __main__:trials:24 - Trial = 26039/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.830 | DEBUG    | __main__:trials:29 - Trial = 26039/30000 | Total reward = 13.79
2022-01-26 14:18:32.833 | DEBUG    | __main__:trials:24 - Trial = 26040/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.834 | DEBUG    | __main__:trials:29 - Trial = 26040/30000 | Total reward = 19.19
2022-01-26 14:18:32.837 | DEBUG    | __main__:trials:24 - Trial = 26041/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.838 | DEBUG    | __main__:trials:29 - Trial = 26041/30000 | Total reward = 34.31
2022-01-26 14:18:32.841 | DEBUG    | __main__:trials:24 - Trial = 26042/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.843 | DEBUG    | __main__:trials:29 - Trial = 26042/30000 | Total reward = 37.56
2022-01-26 14:18:32.846 | DEBUG    | __main__:trials:24 - Trial = 26043/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.847 | DEBUG    | __main__:trials:29 - Trial = 26043/30000 | Total reward = 36.10
2022-01-26 14:18:32.850 | DEBUG    | __main__:trials:24 - Trial = 26044/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.851 | DEBUG    | __main__:trials:29 - Trial = 26044/30000 | Total reward = 49.77
2022-01-26 14:18:32.854 | DEBUG    | __main__:trials:24 - Trial = 26045/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.855 | DEBUG    | __main__:trials:29 - Trial = 26045/30000 | Total reward = 42.90
2022-01-26 14:18:32.859 | DEBUG    | __main__:trials:24 - Trial = 26046/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.860 | DEBUG    | __main__:trials:29 - Trial = 26046/30000 | Total reward = 34.79
2022-01-26 14:18:32.863 | DEBUG    | __main__:trials:24 - Trial = 26047/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.865 | DEBUG    | __main__:trials:29 - Trial = 26047/30000 | Total reward = 33.17
2022-01-26 14:18:32.868 | DEBUG    | __main__:trials:24 - Trial = 26048/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.869 | DEBUG    | __main__:trials:29 - Trial = 26048/30000 | Total reward = 46.68
2022-01-26 14:18:32.872 | DEBUG    | __main__:trials:26 - Trial = 26049/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.874 | DEBUG    | __main__:trials:29 - Trial = 26049/30000 | Total reward = 34.75
2022-01-26 14:18:32.877 | DEBUG    | __main__:trials:24 - Trial = 26050/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.877 | DEBUG    | __main__:trials:29 - Trial = 26050/30000 | Total reward = 36.25
2022-01-26 14:18:32.881 | DEBUG    | __main__:trials:24 - Trial = 26051/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.881 | DEBUG    | __main__:trials:29 - Trial = 26051/30000 | Total reward = 45.54
2022-01-26 14:18:32.885 | DEBUG    | __main__:trials:24 - Trial = 26052/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.886 | DEBUG    | __main__:trials:29 - Trial = 26052/30000 | Total reward = 34.03
2022-01-26 14:18:32.889 | DEBUG    | __main__:trials:24 - Trial = 26053/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.890 | DEBUG    | __main__:trials:29 - Trial = 26053/30000 | Total reward = 28.53
2022-01-26 14:18:32.893 | DEBUG    | __main__:trials:24 - Trial = 26054/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.894 | DEBUG    | __main__:trials:29 - Trial = 26054/30000 | Total reward = 32.84
2022-01-26 14:18:32.897 | DEBUG    | __main__:trials:24 - Trial = 26055/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.898 | DEBUG    | __main__:trials:29 - Trial = 26055/30000 | Total reward = 30.00
2022-01-26 14:18:32.901 | DEBUG    | __main__:trials:26 - Trial = 26056/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.902 | DEBUG    | __main__:trials:29 - Trial = 26056/30000 | Total reward = 14.92
2022-01-26 14:18:32.906 | DEBUG    | __main__:trials:24 - Trial = 26057/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.907 | DEBUG    | __main__:trials:29 - Trial = 26057/30000 | Total reward = 18.97
2022-01-26 14:18:32.910 | DEBUG    | __main__:trials:24 - Trial = 26058/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.911 | DEBUG    | __main__:trials:29 - Trial = 26058/30000 | Total reward = 36.69
2022-01-26 14:18:32.915 | DEBUG    | __main__:trials:24 - Trial = 26059/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.915 | DEBUG    | __main__:trials:29 - Trial = 26059/30000 | Total reward = 44.16
2022-01-26 14:18:32.919 | DEBUG    | __main__:trials:24 - Trial = 26060/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.920 | DEBUG    | __main__:trials:29 - Trial = 26060/30000 | Total reward = 41.48
2022-01-26 14:18:32.923 | DEBUG    | __main__:trials:24 - Trial = 26061/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.925 | DEBUG    | __main__:trials:29 - Trial = 26061/30000 | Total reward = 26.95
2022-01-26 14:18:32.927 | DEBUG    | __main__:trials:26 - Trial = 26062/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.928 | DEBUG    | __main__:trials:29 - Trial = 26062/30000 | Total reward = 14.73
2022-01-26 14:18:32.931 | DEBUG    | __main__:trials:24 - Trial = 26063/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.932 | DEBUG    | __main__:trials:29 - Trial = 26063/30000 | Total reward = 36.42
2022-01-26 14:18:32.935 | DEBUG    | __main__:trials:24 - Trial = 26064/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.936 | DEBUG    | __main__:trials:29 - Trial = 26064/30000 | Total reward = 15.86
2022-01-26 14:18:32.939 | DEBUG    | __main__:trials:24 - Trial = 26065/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.940 | DEBUG    | __main__:trials:29 - Trial = 26065/30000 | Total reward = 40.28
2022-01-26 14:18:32.943 | DEBUG    | __main__:trials:24 - Trial = 26066/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.945 | DEBUG    | __main__:trials:29 - Trial = 26066/30000 | Total reward = 42.70
2022-01-26 14:18:32.948 | DEBUG    | __main__:trials:26 - Trial = 26067/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.948 | DEBUG    | __main__:trials:29 - Trial = 26067/30000 | Total reward = 14.61
2022-01-26 14:18:32.952 | DEBUG    | __main__:trials:26 - Trial = 26068/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.954 | DEBUG    | __main__:trials:29 - Trial = 26068/30000 | Total reward = 30.77
2022-01-26 14:18:32.957 | DEBUG    | __main__:trials:24 - Trial = 26069/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.959 | DEBUG    | __main__:trials:29 - Trial = 26069/30000 | Total reward = 34.82
2022-01-26 14:18:32.962 | DEBUG    | __main__:trials:24 - Trial = 26070/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.964 | DEBUG    | __main__:trials:29 - Trial = 26070/30000 | Total reward = 35.96
2022-01-26 14:18:32.968 | DEBUG    | __main__:trials:24 - Trial = 26071/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.969 | DEBUG    | __main__:trials:29 - Trial = 26071/30000 | Total reward = 35.98
2022-01-26 14:18:32.972 | DEBUG    | __main__:trials:24 - Trial = 26072/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.974 | DEBUG    | __main__:trials:29 - Trial = 26072/30000 | Total reward = 36.31
2022-01-26 14:18:32.977 | DEBUG    | __main__:trials:26 - Trial = 26073/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.978 | DEBUG    | __main__:trials:29 - Trial = 26073/30000 | Total reward = 22.42
2022-01-26 14:18:32.982 | DEBUG    | __main__:trials:24 - Trial = 26074/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.983 | DEBUG    | __main__:trials:29 - Trial = 26074/30000 | Total reward = 38.66
2022-01-26 14:18:32.985 | DEBUG    | __main__:trials:26 - Trial = 26075/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.987 | DEBUG    | __main__:trials:29 - Trial = 26075/30000 | Total reward = 17.40
2022-01-26 14:18:32.991 | DEBUG    | __main__:trials:24 - Trial = 26076/30000 | Max number of steps (20) reached
2022-01-26 14:18:32.992 | DEBUG    | __main__:trials:29 - Trial = 26076/30000 | Total reward = 36.76
2022-01-26 14:18:32.996 | DEBUG    | __main__:trials:26 - Trial = 26077/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:32.997 | DEBUG    | __main__:trials:29 - Trial = 26077/30000 | Total reward = 24.61
2022-01-26 14:18:33.001 | DEBUG    | __main__:trials:24 - Trial = 26078/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.002 | DEBUG    | __main__:trials:29 - Trial = 26078/30000 | Total reward = 37.66
2022-01-26 14:18:33.006 | DEBUG    | __main__:trials:26 - Trial = 26079/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.007 | DEBUG    | __main__:trials:29 - Trial = 26079/30000 | Total reward = 23.42
2022-01-26 14:18:33.011 | DEBUG    | __main__:trials:24 - Trial = 26080/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.012 | DEBUG    | __main__:trials:29 - Trial = 26080/30000 | Total reward = 25.89
2022-01-26 14:18:33.016 | DEBUG    | __main__:trials:24 - Trial = 26081/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.017 | DEBUG    | __main__:trials:29 - Trial = 26081/30000 | Total reward = 26.95
2022-01-26 14:18:33.021 | DEBUG    | __main__:trials:24 - Trial = 26082/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.022 | DEBUG    | __main__:trials:29 - Trial = 26082/30000 | Total reward = 30.53
2022-01-26 14:18:33.025 | DEBUG    | __main__:trials:24 - Trial = 26083/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.027 | DEBUG    | __main__:trials:29 - Trial = 26083/30000 | Total reward = 36.71
2022-01-26 14:18:33.030 | DEBUG    | __main__:trials:24 - Trial = 26084/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.032 | DEBUG    | __main__:trials:29 - Trial = 26084/30000 | Total reward = 35.46
2022-01-26 14:18:33.035 | DEBUG    | __main__:trials:24 - Trial = 26085/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.037 | DEBUG    | __main__:trials:29 - Trial = 26085/30000 | Total reward = 39.59
2022-01-26 14:18:33.040 | DEBUG    | __main__:trials:24 - Trial = 26086/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.041 | DEBUG    | __main__:trials:29 - Trial = 26086/30000 | Total reward = 37.62
2022-01-26 14:18:33.045 | DEBUG    | __main__:trials:24 - Trial = 26087/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.047 | DEBUG    | __main__:trials:29 - Trial = 26087/30000 | Total reward = 30.12
2022-01-26 14:18:33.051 | DEBUG    | __main__:trials:24 - Trial = 26088/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.053 | DEBUG    | __main__:trials:29 - Trial = 26088/30000 | Total reward = 37.84
2022-01-26 14:18:33.056 | DEBUG    | __main__:trials:24 - Trial = 26089/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.058 | DEBUG    | __main__:trials:29 - Trial = 26089/30000 | Total reward = 43.78
2022-01-26 14:18:33.061 | DEBUG    | __main__:trials:24 - Trial = 26090/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.063 | DEBUG    | __main__:trials:29 - Trial = 26090/30000 | Total reward = 23.02
2022-01-26 14:18:33.066 | DEBUG    | __main__:trials:24 - Trial = 26091/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.068 | DEBUG    | __main__:trials:29 - Trial = 26091/30000 | Total reward = 43.20
2022-01-26 14:18:33.071 | DEBUG    | __main__:trials:24 - Trial = 26092/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.072 | DEBUG    | __main__:trials:29 - Trial = 26092/30000 | Total reward = 35.36
2022-01-26 14:18:33.076 | DEBUG    | __main__:trials:24 - Trial = 26093/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.077 | DEBUG    | __main__:trials:29 - Trial = 26093/30000 | Total reward = 39.85
2022-01-26 14:18:33.081 | DEBUG    | __main__:trials:24 - Trial = 26094/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.082 | DEBUG    | __main__:trials:29 - Trial = 26094/30000 | Total reward = 41.49
2022-01-26 14:18:33.087 | DEBUG    | __main__:trials:24 - Trial = 26095/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.087 | DEBUG    | __main__:trials:29 - Trial = 26095/30000 | Total reward = 29.88
2022-01-26 14:18:33.091 | DEBUG    | __main__:trials:24 - Trial = 26096/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.093 | DEBUG    | __main__:trials:29 - Trial = 26096/30000 | Total reward = 35.01
2022-01-26 14:18:33.096 | DEBUG    | __main__:trials:24 - Trial = 26097/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.097 | DEBUG    | __main__:trials:29 - Trial = 26097/30000 | Total reward = 37.58
2022-01-26 14:18:33.102 | DEBUG    | __main__:trials:24 - Trial = 26098/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.102 | DEBUG    | __main__:trials:29 - Trial = 26098/30000 | Total reward = 31.30
2022-01-26 14:18:33.106 | DEBUG    | __main__:trials:24 - Trial = 26099/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.107 | DEBUG    | __main__:trials:29 - Trial = 26099/30000 | Total reward = 27.86
2022-01-26 14:18:33.112 | DEBUG    | __main__:trials:24 - Trial = 26100/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.112 | DEBUG    | __main__:trials:29 - Trial = 26100/30000 | Total reward = 37.07
2022-01-26 14:18:33.117 | DEBUG    | __main__:trials:24 - Trial = 26101/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.117 | DEBUG    | __main__:trials:29 - Trial = 26101/30000 | Total reward = 45.03
2022-01-26 14:18:33.122 | DEBUG    | __main__:trials:24 - Trial = 26102/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.124 | DEBUG    | __main__:trials:29 - Trial = 26102/30000 | Total reward = 47.70
2022-01-26 14:18:33.127 | DEBUG    | __main__:trials:24 - Trial = 26103/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.129 | DEBUG    | __main__:trials:29 - Trial = 26103/30000 | Total reward = 47.89
2022-01-26 14:18:33.132 | DEBUG    | __main__:trials:24 - Trial = 26104/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.133 | DEBUG    | __main__:trials:29 - Trial = 26104/30000 | Total reward = 32.50
2022-01-26 14:18:33.137 | DEBUG    | __main__:trials:24 - Trial = 26105/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.137 | DEBUG    | __main__:trials:29 - Trial = 26105/30000 | Total reward = 36.12
2022-01-26 14:18:33.141 | DEBUG    | __main__:trials:24 - Trial = 26106/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.142 | DEBUG    | __main__:trials:29 - Trial = 26106/30000 | Total reward = 21.42
2022-01-26 14:18:33.146 | DEBUG    | __main__:trials:24 - Trial = 26107/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.148 | DEBUG    | __main__:trials:29 - Trial = 26107/30000 | Total reward = 41.75
2022-01-26 14:18:33.151 | DEBUG    | __main__:trials:24 - Trial = 26108/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.152 | DEBUG    | __main__:trials:29 - Trial = 26108/30000 | Total reward = 35.46
2022-01-26 14:18:33.156 | DEBUG    | __main__:trials:24 - Trial = 26109/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.158 | DEBUG    | __main__:trials:29 - Trial = 26109/30000 | Total reward = 37.05
2022-01-26 14:18:33.162 | DEBUG    | __main__:trials:24 - Trial = 26110/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.163 | DEBUG    | __main__:trials:29 - Trial = 26110/30000 | Total reward = 27.79
2022-01-26 14:18:33.167 | DEBUG    | __main__:trials:24 - Trial = 26111/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.167 | DEBUG    | __main__:trials:29 - Trial = 26111/30000 | Total reward = 29.16
2022-01-26 14:18:33.172 | DEBUG    | __main__:trials:24 - Trial = 26112/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.173 | DEBUG    | __main__:trials:29 - Trial = 26112/30000 | Total reward = 29.78
2022-01-26 14:18:33.177 | DEBUG    | __main__:trials:24 - Trial = 26113/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.178 | DEBUG    | __main__:trials:29 - Trial = 26113/30000 | Total reward = 31.05
2022-01-26 14:18:33.182 | DEBUG    | __main__:trials:24 - Trial = 26114/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.182 | DEBUG    | __main__:trials:29 - Trial = 26114/30000 | Total reward = 29.11
2022-01-26 14:18:33.187 | DEBUG    | __main__:trials:24 - Trial = 26115/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.188 | DEBUG    | __main__:trials:29 - Trial = 26115/30000 | Total reward = 36.20
2022-01-26 14:18:33.192 | DEBUG    | __main__:trials:24 - Trial = 26116/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.193 | DEBUG    | __main__:trials:29 - Trial = 26116/30000 | Total reward = 31.47
2022-01-26 14:18:33.196 | DEBUG    | __main__:trials:24 - Trial = 26117/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.197 | DEBUG    | __main__:trials:29 - Trial = 26117/30000 | Total reward = 38.36
2022-01-26 14:18:33.200 | DEBUG    | __main__:trials:26 - Trial = 26118/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.201 | DEBUG    | __main__:trials:29 - Trial = 26118/30000 | Total reward = 17.06
2022-01-26 14:18:33.204 | DEBUG    | __main__:trials:24 - Trial = 26119/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.205 | DEBUG    | __main__:trials:29 - Trial = 26119/30000 | Total reward = 24.93
2022-01-26 14:18:33.208 | DEBUG    | __main__:trials:24 - Trial = 26120/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.210 | DEBUG    | __main__:trials:29 - Trial = 26120/30000 | Total reward = 30.19
2022-01-26 14:18:33.213 | DEBUG    | __main__:trials:24 - Trial = 26121/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.214 | DEBUG    | __main__:trials:29 - Trial = 26121/30000 | Total reward = 39.72
2022-01-26 14:18:33.218 | DEBUG    | __main__:trials:24 - Trial = 26122/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.220 | DEBUG    | __main__:trials:29 - Trial = 26122/30000 | Total reward = 33.14
2022-01-26 14:18:33.223 | DEBUG    | __main__:trials:24 - Trial = 26123/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.224 | DEBUG    | __main__:trials:29 - Trial = 26123/30000 | Total reward = 41.71
2022-01-26 14:18:33.228 | DEBUG    | __main__:trials:24 - Trial = 26124/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.229 | DEBUG    | __main__:trials:29 - Trial = 26124/30000 | Total reward = 34.75
2022-01-26 14:18:33.232 | DEBUG    | __main__:trials:24 - Trial = 26125/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.234 | DEBUG    | __main__:trials:29 - Trial = 26125/30000 | Total reward = 57.95
2022-01-26 14:18:33.238 | DEBUG    | __main__:trials:24 - Trial = 26126/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.239 | DEBUG    | __main__:trials:29 - Trial = 26126/30000 | Total reward = 32.32
2022-01-26 14:18:33.242 | DEBUG    | __main__:trials:24 - Trial = 26127/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.244 | DEBUG    | __main__:trials:29 - Trial = 26127/30000 | Total reward = 38.12
2022-01-26 14:18:33.247 | DEBUG    | __main__:trials:24 - Trial = 26128/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.249 | DEBUG    | __main__:trials:29 - Trial = 26128/30000 | Total reward = 38.89
2022-01-26 14:18:33.252 | DEBUG    | __main__:trials:24 - Trial = 26129/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.254 | DEBUG    | __main__:trials:29 - Trial = 26129/30000 | Total reward = 35.74
2022-01-26 14:18:33.258 | DEBUG    | __main__:trials:24 - Trial = 26130/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.259 | DEBUG    | __main__:trials:29 - Trial = 26130/30000 | Total reward = 44.96
2022-01-26 14:18:33.263 | DEBUG    | __main__:trials:24 - Trial = 26131/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.265 | DEBUG    | __main__:trials:29 - Trial = 26131/30000 | Total reward = 31.01
2022-01-26 14:18:33.268 | DEBUG    | __main__:trials:24 - Trial = 26132/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.269 | DEBUG    | __main__:trials:29 - Trial = 26132/30000 | Total reward = 37.29
2022-01-26 14:18:33.272 | DEBUG    | __main__:trials:24 - Trial = 26133/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.274 | DEBUG    | __main__:trials:29 - Trial = 26133/30000 | Total reward = 36.31
2022-01-26 14:18:33.278 | DEBUG    | __main__:trials:24 - Trial = 26134/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.279 | DEBUG    | __main__:trials:29 - Trial = 26134/30000 | Total reward = 32.76
2022-01-26 14:18:33.283 | DEBUG    | __main__:trials:24 - Trial = 26135/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.285 | DEBUG    | __main__:trials:29 - Trial = 26135/30000 | Total reward = 35.12
2022-01-26 14:18:33.288 | DEBUG    | __main__:trials:24 - Trial = 26136/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.289 | DEBUG    | __main__:trials:29 - Trial = 26136/30000 | Total reward = 40.53
2022-01-26 14:18:33.292 | DEBUG    | __main__:trials:24 - Trial = 26137/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.294 | DEBUG    | __main__:trials:29 - Trial = 26137/30000 | Total reward = 53.95
2022-01-26 14:18:33.298 | DEBUG    | __main__:trials:24 - Trial = 26138/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.299 | DEBUG    | __main__:trials:29 - Trial = 26138/30000 | Total reward = 39.99
2022-01-26 14:18:33.302 | DEBUG    | __main__:trials:24 - Trial = 26139/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.304 | DEBUG    | __main__:trials:29 - Trial = 26139/30000 | Total reward = 27.96
2022-01-26 14:18:33.307 | DEBUG    | __main__:trials:24 - Trial = 26140/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.309 | DEBUG    | __main__:trials:29 - Trial = 26140/30000 | Total reward = 36.19
2022-01-26 14:18:33.312 | DEBUG    | __main__:trials:24 - Trial = 26141/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.314 | DEBUG    | __main__:trials:29 - Trial = 26141/30000 | Total reward = 36.48
2022-01-26 14:18:33.317 | DEBUG    | __main__:trials:24 - Trial = 26142/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.319 | DEBUG    | __main__:trials:29 - Trial = 26142/30000 | Total reward = 36.34
2022-01-26 14:18:33.323 | DEBUG    | __main__:trials:26 - Trial = 26143/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.323 | DEBUG    | __main__:trials:29 - Trial = 26143/30000 | Total reward = 26.67
2022-01-26 14:18:33.328 | DEBUG    | __main__:trials:24 - Trial = 26144/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.329 | DEBUG    | __main__:trials:29 - Trial = 26144/30000 | Total reward = 48.33
2022-01-26 14:18:33.332 | DEBUG    | __main__:trials:24 - Trial = 26145/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.334 | DEBUG    | __main__:trials:29 - Trial = 26145/30000 | Total reward = 35.30
2022-01-26 14:18:33.337 | DEBUG    | __main__:trials:26 - Trial = 26146/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.339 | DEBUG    | __main__:trials:29 - Trial = 26146/30000 | Total reward = 16.76
2022-01-26 14:18:33.342 | DEBUG    | __main__:trials:24 - Trial = 26147/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.343 | DEBUG    | __main__:trials:29 - Trial = 26147/30000 | Total reward = 34.77
2022-01-26 14:18:33.347 | DEBUG    | __main__:trials:24 - Trial = 26148/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.348 | DEBUG    | __main__:trials:29 - Trial = 26148/30000 | Total reward = 32.91
2022-01-26 14:18:33.351 | DEBUG    | __main__:trials:26 - Trial = 26149/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.352 | DEBUG    | __main__:trials:29 - Trial = 26149/30000 | Total reward = 14.76
2022-01-26 14:18:33.355 | DEBUG    | __main__:trials:24 - Trial = 26150/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.357 | DEBUG    | __main__:trials:29 - Trial = 26150/30000 | Total reward = 28.70
2022-01-26 14:18:33.360 | DEBUG    | __main__:trials:24 - Trial = 26151/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.362 | DEBUG    | __main__:trials:29 - Trial = 26151/30000 | Total reward = 35.39
2022-01-26 14:18:33.365 | DEBUG    | __main__:trials:24 - Trial = 26152/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.365 | DEBUG    | __main__:trials:29 - Trial = 26152/30000 | Total reward = 21.61
2022-01-26 14:18:33.369 | DEBUG    | __main__:trials:24 - Trial = 26153/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.370 | DEBUG    | __main__:trials:29 - Trial = 26153/30000 | Total reward = 29.59
2022-01-26 14:18:33.373 | DEBUG    | __main__:trials:24 - Trial = 26154/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.374 | DEBUG    | __main__:trials:29 - Trial = 26154/30000 | Total reward = 28.45
2022-01-26 14:18:33.377 | DEBUG    | __main__:trials:24 - Trial = 26155/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.378 | DEBUG    | __main__:trials:29 - Trial = 26155/30000 | Total reward = 48.20
2022-01-26 14:18:33.381 | DEBUG    | __main__:trials:24 - Trial = 26156/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.382 | DEBUG    | __main__:trials:29 - Trial = 26156/30000 | Total reward = 36.94
2022-01-26 14:18:33.385 | DEBUG    | __main__:trials:24 - Trial = 26157/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.386 | DEBUG    | __main__:trials:29 - Trial = 26157/30000 | Total reward = 35.22
2022-01-26 14:18:33.389 | DEBUG    | __main__:trials:24 - Trial = 26158/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.391 | DEBUG    | __main__:trials:29 - Trial = 26158/30000 | Total reward = 29.43
2022-01-26 14:18:33.394 | DEBUG    | __main__:trials:24 - Trial = 26159/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.396 | DEBUG    | __main__:trials:29 - Trial = 26159/30000 | Total reward = 52.29
2022-01-26 14:18:33.399 | DEBUG    | __main__:trials:26 - Trial = 26160/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.400 | DEBUG    | __main__:trials:29 - Trial = 26160/30000 | Total reward = 26.67
2022-01-26 14:18:33.403 | DEBUG    | __main__:trials:24 - Trial = 26161/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.405 | DEBUG    | __main__:trials:29 - Trial = 26161/30000 | Total reward = 34.79
2022-01-26 14:18:33.407 | DEBUG    | __main__:trials:24 - Trial = 26162/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.409 | DEBUG    | __main__:trials:29 - Trial = 26162/30000 | Total reward = 35.79
2022-01-26 14:18:33.412 | DEBUG    | __main__:trials:24 - Trial = 26163/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.413 | DEBUG    | __main__:trials:29 - Trial = 26163/30000 | Total reward = 27.75
2022-01-26 14:18:33.416 | DEBUG    | __main__:trials:24 - Trial = 26164/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.417 | DEBUG    | __main__:trials:29 - Trial = 26164/30000 | Total reward = 27.50
2022-01-26 14:18:33.420 | DEBUG    | __main__:trials:24 - Trial = 26165/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.421 | DEBUG    | __main__:trials:29 - Trial = 26165/30000 | Total reward = 27.25
2022-01-26 14:18:33.424 | DEBUG    | __main__:trials:24 - Trial = 26166/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.426 | DEBUG    | __main__:trials:29 - Trial = 26166/30000 | Total reward = 36.20
2022-01-26 14:18:33.429 | DEBUG    | __main__:trials:24 - Trial = 26167/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.429 | DEBUG    | __main__:trials:29 - Trial = 26167/30000 | Total reward = 41.92
2022-01-26 14:18:33.433 | DEBUG    | __main__:trials:24 - Trial = 26168/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.433 | DEBUG    | __main__:trials:29 - Trial = 26168/30000 | Total reward = 37.83
2022-01-26 14:18:33.437 | DEBUG    | __main__:trials:26 - Trial = 26169/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.439 | DEBUG    | __main__:trials:29 - Trial = 26169/30000 | Total reward = 28.11
2022-01-26 14:18:33.442 | DEBUG    | __main__:trials:24 - Trial = 26170/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.443 | DEBUG    | __main__:trials:29 - Trial = 26170/30000 | Total reward = 34.06
2022-01-26 14:18:33.446 | DEBUG    | __main__:trials:24 - Trial = 26171/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.447 | DEBUG    | __main__:trials:29 - Trial = 26171/30000 | Total reward = 38.31
2022-01-26 14:18:33.450 | DEBUG    | __main__:trials:24 - Trial = 26172/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.452 | DEBUG    | __main__:trials:29 - Trial = 26172/30000 | Total reward = 46.71
2022-01-26 14:18:33.455 | DEBUG    | __main__:trials:24 - Trial = 26173/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.456 | DEBUG    | __main__:trials:29 - Trial = 26173/30000 | Total reward = 20.93
2022-01-26 14:18:33.459 | DEBUG    | __main__:trials:24 - Trial = 26174/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.461 | DEBUG    | __main__:trials:29 - Trial = 26174/30000 | Total reward = 37.36
2022-01-26 14:18:33.464 | DEBUG    | __main__:trials:24 - Trial = 26175/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.465 | DEBUG    | __main__:trials:29 - Trial = 26175/30000 | Total reward = 44.66
2022-01-26 14:18:33.468 | DEBUG    | __main__:trials:24 - Trial = 26176/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.469 | DEBUG    | __main__:trials:29 - Trial = 26176/30000 | Total reward = 44.14
2022-01-26 14:18:33.472 | DEBUG    | __main__:trials:24 - Trial = 26177/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.474 | DEBUG    | __main__:trials:29 - Trial = 26177/30000 | Total reward = 30.34
2022-01-26 14:18:33.477 | DEBUG    | __main__:trials:24 - Trial = 26178/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.478 | DEBUG    | __main__:trials:29 - Trial = 26178/30000 | Total reward = 34.44
2022-01-26 14:18:33.481 | DEBUG    | __main__:trials:24 - Trial = 26179/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.482 | DEBUG    | __main__:trials:29 - Trial = 26179/30000 | Total reward = 57.40
2022-01-26 14:18:33.485 | DEBUG    | __main__:trials:24 - Trial = 26180/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.486 | DEBUG    | __main__:trials:29 - Trial = 26180/30000 | Total reward = 34.61
2022-01-26 14:18:33.490 | DEBUG    | __main__:trials:24 - Trial = 26181/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.490 | DEBUG    | __main__:trials:29 - Trial = 26181/30000 | Total reward = 51.47
2022-01-26 14:18:33.494 | DEBUG    | __main__:trials:24 - Trial = 26182/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.495 | DEBUG    | __main__:trials:29 - Trial = 26182/30000 | Total reward = 33.75
2022-01-26 14:18:33.498 | DEBUG    | __main__:trials:24 - Trial = 26183/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.499 | DEBUG    | __main__:trials:29 - Trial = 26183/30000 | Total reward = 43.03
2022-01-26 14:18:33.503 | DEBUG    | __main__:trials:24 - Trial = 26184/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.504 | DEBUG    | __main__:trials:29 - Trial = 26184/30000 | Total reward = 45.15
2022-01-26 14:18:33.508 | DEBUG    | __main__:trials:24 - Trial = 26185/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.509 | DEBUG    | __main__:trials:29 - Trial = 26185/30000 | Total reward = 30.57
2022-01-26 14:18:33.513 | DEBUG    | __main__:trials:24 - Trial = 26186/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.513 | DEBUG    | __main__:trials:29 - Trial = 26186/30000 | Total reward = 42.55
2022-01-26 14:18:33.517 | DEBUG    | __main__:trials:24 - Trial = 26187/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.518 | DEBUG    | __main__:trials:29 - Trial = 26187/30000 | Total reward = 43.03
2022-01-26 14:18:33.521 | DEBUG    | __main__:trials:24 - Trial = 26188/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.522 | DEBUG    | __main__:trials:29 - Trial = 26188/30000 | Total reward = 47.45
2022-01-26 14:18:33.525 | DEBUG    | __main__:trials:24 - Trial = 26189/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.526 | DEBUG    | __main__:trials:29 - Trial = 26189/30000 | Total reward = 44.56
2022-01-26 14:18:33.530 | DEBUG    | __main__:trials:24 - Trial = 26190/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.531 | DEBUG    | __main__:trials:29 - Trial = 26190/30000 | Total reward = 38.51
2022-01-26 14:18:33.533 | DEBUG    | __main__:trials:26 - Trial = 26191/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.534 | DEBUG    | __main__:trials:29 - Trial = 26191/30000 | Total reward = 21.69
2022-01-26 14:18:33.538 | DEBUG    | __main__:trials:24 - Trial = 26192/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.539 | DEBUG    | __main__:trials:29 - Trial = 26192/30000 | Total reward = 43.80
2022-01-26 14:18:33.542 | DEBUG    | __main__:trials:24 - Trial = 26193/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.544 | DEBUG    | __main__:trials:29 - Trial = 26193/30000 | Total reward = 39.12
2022-01-26 14:18:33.547 | DEBUG    | __main__:trials:24 - Trial = 26194/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.549 | DEBUG    | __main__:trials:29 - Trial = 26194/30000 | Total reward = 32.73
2022-01-26 14:18:33.552 | DEBUG    | __main__:trials:24 - Trial = 26195/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.554 | DEBUG    | __main__:trials:29 - Trial = 26195/30000 | Total reward = 29.60
2022-01-26 14:18:33.557 | DEBUG    | __main__:trials:24 - Trial = 26196/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.558 | DEBUG    | __main__:trials:29 - Trial = 26196/30000 | Total reward = 42.03
2022-01-26 14:18:33.561 | DEBUG    | __main__:trials:26 - Trial = 26197/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.562 | DEBUG    | __main__:trials:29 - Trial = 26197/30000 | Total reward = 23.25
2022-01-26 14:18:33.566 | DEBUG    | __main__:trials:24 - Trial = 26198/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.568 | DEBUG    | __main__:trials:29 - Trial = 26198/30000 | Total reward = 36.10
2022-01-26 14:18:33.570 | DEBUG    | __main__:trials:26 - Trial = 26199/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.572 | DEBUG    | __main__:trials:29 - Trial = 26199/30000 | Total reward = 22.01
2022-01-26 14:18:33.575 | DEBUG    | __main__:trials:24 - Trial = 26200/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.576 | DEBUG    | __main__:trials:29 - Trial = 26200/30000 | Total reward = 45.28
2022-01-26 14:18:33.578 | DEBUG    | __main__:trials:26 - Trial = 26201/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.580 | DEBUG    | __main__:trials:29 - Trial = 26201/30000 | Total reward = 15.20
2022-01-26 14:18:33.583 | DEBUG    | __main__:trials:24 - Trial = 26202/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.583 | DEBUG    | __main__:trials:29 - Trial = 26202/30000 | Total reward = 37.48
2022-01-26 14:18:33.587 | DEBUG    | __main__:trials:24 - Trial = 26203/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.587 | DEBUG    | __main__:trials:29 - Trial = 26203/30000 | Total reward = 36.19
2022-01-26 14:18:33.591 | DEBUG    | __main__:trials:26 - Trial = 26204/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.592 | DEBUG    | __main__:trials:29 - Trial = 26204/30000 | Total reward = 24.27
2022-01-26 14:18:33.594 | DEBUG    | __main__:trials:26 - Trial = 26205/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.595 | DEBUG    | __main__:trials:29 - Trial = 26205/30000 | Total reward = 17.58
2022-01-26 14:18:33.599 | DEBUG    | __main__:trials:24 - Trial = 26206/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.600 | DEBUG    | __main__:trials:29 - Trial = 26206/30000 | Total reward = 36.53
2022-01-26 14:18:33.603 | DEBUG    | __main__:trials:24 - Trial = 26207/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.604 | DEBUG    | __main__:trials:29 - Trial = 26207/30000 | Total reward = 34.89
2022-01-26 14:18:33.607 | DEBUG    | __main__:trials:24 - Trial = 26208/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.608 | DEBUG    | __main__:trials:29 - Trial = 26208/30000 | Total reward = 30.28
2022-01-26 14:18:33.612 | DEBUG    | __main__:trials:24 - Trial = 26209/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.614 | DEBUG    | __main__:trials:29 - Trial = 26209/30000 | Total reward = 35.31
2022-01-26 14:18:33.617 | DEBUG    | __main__:trials:24 - Trial = 26210/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.617 | DEBUG    | __main__:trials:29 - Trial = 26210/30000 | Total reward = 47.69
2022-01-26 14:18:33.621 | DEBUG    | __main__:trials:24 - Trial = 26211/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.621 | DEBUG    | __main__:trials:29 - Trial = 26211/30000 | Total reward = 34.71
2022-01-26 14:18:33.624 | DEBUG    | __main__:trials:26 - Trial = 26212/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.625 | DEBUG    | __main__:trials:29 - Trial = 26212/30000 | Total reward = 34.82
2022-01-26 14:18:33.628 | DEBUG    | __main__:trials:24 - Trial = 26213/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.630 | DEBUG    | __main__:trials:29 - Trial = 26213/30000 | Total reward = 44.41
2022-01-26 14:18:33.633 | DEBUG    | __main__:trials:24 - Trial = 26214/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.635 | DEBUG    | __main__:trials:29 - Trial = 26214/30000 | Total reward = 35.63
2022-01-26 14:18:33.638 | DEBUG    | __main__:trials:24 - Trial = 26215/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.639 | DEBUG    | __main__:trials:29 - Trial = 26215/30000 | Total reward = 43.73
2022-01-26 14:18:33.642 | DEBUG    | __main__:trials:24 - Trial = 26216/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.643 | DEBUG    | __main__:trials:29 - Trial = 26216/30000 | Total reward = 41.68
2022-01-26 14:18:33.646 | DEBUG    | __main__:trials:24 - Trial = 26217/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.647 | DEBUG    | __main__:trials:29 - Trial = 26217/30000 | Total reward = 20.06
2022-01-26 14:18:33.651 | DEBUG    | __main__:trials:24 - Trial = 26218/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.651 | DEBUG    | __main__:trials:29 - Trial = 26218/30000 | Total reward = 34.20
2022-01-26 14:18:33.655 | DEBUG    | __main__:trials:24 - Trial = 26219/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.655 | DEBUG    | __main__:trials:29 - Trial = 26219/30000 | Total reward = 39.58
2022-01-26 14:18:33.660 | DEBUG    | __main__:trials:24 - Trial = 26220/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.661 | DEBUG    | __main__:trials:29 - Trial = 26220/30000 | Total reward = 39.58
2022-01-26 14:18:33.664 | DEBUG    | __main__:trials:24 - Trial = 26221/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.665 | DEBUG    | __main__:trials:29 - Trial = 26221/30000 | Total reward = 46.34
2022-01-26 14:18:33.668 | DEBUG    | __main__:trials:24 - Trial = 26222/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.670 | DEBUG    | __main__:trials:29 - Trial = 26222/30000 | Total reward = 45.81
2022-01-26 14:18:33.673 | DEBUG    | __main__:trials:24 - Trial = 26223/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.674 | DEBUG    | __main__:trials:29 - Trial = 26223/30000 | Total reward = 42.02
2022-01-26 14:18:33.676 | DEBUG    | __main__:trials:26 - Trial = 26224/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.677 | DEBUG    | __main__:trials:29 - Trial = 26224/30000 | Total reward = 10.00
2022-01-26 14:18:33.681 | DEBUG    | __main__:trials:24 - Trial = 26225/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.682 | DEBUG    | __main__:trials:29 - Trial = 26225/30000 | Total reward = 34.38
2022-01-26 14:18:33.685 | DEBUG    | __main__:trials:24 - Trial = 26226/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.686 | DEBUG    | __main__:trials:29 - Trial = 26226/30000 | Total reward = 39.64
2022-01-26 14:18:33.690 | DEBUG    | __main__:trials:24 - Trial = 26227/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.690 | DEBUG    | __main__:trials:29 - Trial = 26227/30000 | Total reward = 27.36
2022-01-26 14:18:33.694 | DEBUG    | __main__:trials:24 - Trial = 26228/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.695 | DEBUG    | __main__:trials:29 - Trial = 26228/30000 | Total reward = 41.15
2022-01-26 14:18:33.698 | DEBUG    | __main__:trials:24 - Trial = 26229/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.699 | DEBUG    | __main__:trials:29 - Trial = 26229/30000 | Total reward = 27.39
2022-01-26 14:18:33.703 | DEBUG    | __main__:trials:24 - Trial = 26230/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.703 | DEBUG    | __main__:trials:29 - Trial = 26230/30000 | Total reward = 46.85
2022-01-26 14:18:33.707 | DEBUG    | __main__:trials:24 - Trial = 26231/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.708 | DEBUG    | __main__:trials:29 - Trial = 26231/30000 | Total reward = 53.60
2022-01-26 14:18:33.711 | DEBUG    | __main__:trials:24 - Trial = 26232/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.713 | DEBUG    | __main__:trials:29 - Trial = 26232/30000 | Total reward = 43.47
2022-01-26 14:18:33.716 | DEBUG    | __main__:trials:24 - Trial = 26233/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.717 | DEBUG    | __main__:trials:29 - Trial = 26233/30000 | Total reward = 38.23
2022-01-26 14:18:33.721 | DEBUG    | __main__:trials:24 - Trial = 26234/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.721 | DEBUG    | __main__:trials:29 - Trial = 26234/30000 | Total reward = 40.48
2022-01-26 14:18:33.725 | DEBUG    | __main__:trials:24 - Trial = 26235/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.726 | DEBUG    | __main__:trials:29 - Trial = 26235/30000 | Total reward = 45.99
2022-01-26 14:18:33.729 | DEBUG    | __main__:trials:26 - Trial = 26236/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.730 | DEBUG    | __main__:trials:29 - Trial = 26236/30000 | Total reward = 28.54
2022-01-26 14:18:33.733 | DEBUG    | __main__:trials:24 - Trial = 26237/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.734 | DEBUG    | __main__:trials:29 - Trial = 26237/30000 | Total reward = 45.41
2022-01-26 14:18:33.737 | DEBUG    | __main__:trials:24 - Trial = 26238/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.738 | DEBUG    | __main__:trials:29 - Trial = 26238/30000 | Total reward = 32.30
2022-01-26 14:18:33.741 | DEBUG    | __main__:trials:24 - Trial = 26239/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.742 | DEBUG    | __main__:trials:29 - Trial = 26239/30000 | Total reward = 30.62
2022-01-26 14:18:33.745 | DEBUG    | __main__:trials:26 - Trial = 26240/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.746 | DEBUG    | __main__:trials:29 - Trial = 26240/30000 | Total reward = 17.30
2022-01-26 14:18:33.749 | DEBUG    | __main__:trials:24 - Trial = 26241/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.750 | DEBUG    | __main__:trials:29 - Trial = 26241/30000 | Total reward = 44.66
2022-01-26 14:18:33.754 | DEBUG    | __main__:trials:24 - Trial = 26242/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.755 | DEBUG    | __main__:trials:29 - Trial = 26242/30000 | Total reward = 46.40
2022-01-26 14:18:33.758 | DEBUG    | __main__:trials:24 - Trial = 26243/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.759 | DEBUG    | __main__:trials:29 - Trial = 26243/30000 | Total reward = 45.62
2022-01-26 14:18:33.762 | DEBUG    | __main__:trials:26 - Trial = 26244/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.763 | DEBUG    | __main__:trials:29 - Trial = 26244/30000 | Total reward = 24.93
2022-01-26 14:18:33.766 | DEBUG    | __main__:trials:24 - Trial = 26245/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.767 | DEBUG    | __main__:trials:29 - Trial = 26245/30000 | Total reward = 50.45
2022-01-26 14:18:33.771 | DEBUG    | __main__:trials:24 - Trial = 26246/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.773 | DEBUG    | __main__:trials:29 - Trial = 26246/30000 | Total reward = 43.25
2022-01-26 14:18:33.775 | DEBUG    | __main__:trials:24 - Trial = 26247/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.776 | DEBUG    | __main__:trials:29 - Trial = 26247/30000 | Total reward = 42.81
2022-01-26 14:18:33.780 | DEBUG    | __main__:trials:24 - Trial = 26248/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.781 | DEBUG    | __main__:trials:29 - Trial = 26248/30000 | Total reward = 33.71
2022-01-26 14:18:33.784 | DEBUG    | __main__:trials:24 - Trial = 26249/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.785 | DEBUG    | __main__:trials:29 - Trial = 26249/30000 | Total reward = 44.45
2022-01-26 14:18:33.789 | DEBUG    | __main__:trials:24 - Trial = 26250/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.789 | DEBUG    | __main__:trials:29 - Trial = 26250/30000 | Total reward = 36.98
2022-01-26 14:18:33.793 | DEBUG    | __main__:trials:24 - Trial = 26251/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.794 | DEBUG    | __main__:trials:29 - Trial = 26251/30000 | Total reward = 43.73
2022-01-26 14:18:33.797 | DEBUG    | __main__:trials:24 - Trial = 26252/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.797 | DEBUG    | __main__:trials:29 - Trial = 26252/30000 | Total reward = 38.17
2022-01-26 14:18:33.802 | DEBUG    | __main__:trials:24 - Trial = 26253/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.803 | DEBUG    | __main__:trials:29 - Trial = 26253/30000 | Total reward = 46.15
2022-01-26 14:18:33.806 | DEBUG    | __main__:trials:24 - Trial = 26254/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.807 | DEBUG    | __main__:trials:29 - Trial = 26254/30000 | Total reward = 40.35
2022-01-26 14:18:33.810 | DEBUG    | __main__:trials:24 - Trial = 26255/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.811 | DEBUG    | __main__:trials:29 - Trial = 26255/30000 | Total reward = 33.90
2022-01-26 14:18:33.814 | DEBUG    | __main__:trials:24 - Trial = 26256/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.816 | DEBUG    | __main__:trials:29 - Trial = 26256/30000 | Total reward = 39.82
2022-01-26 14:18:33.819 | DEBUG    | __main__:trials:24 - Trial = 26257/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.820 | DEBUG    | __main__:trials:29 - Trial = 26257/30000 | Total reward = 44.57
2022-01-26 14:18:33.823 | DEBUG    | __main__:trials:24 - Trial = 26258/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.825 | DEBUG    | __main__:trials:29 - Trial = 26258/30000 | Total reward = 42.10
2022-01-26 14:18:33.829 | DEBUG    | __main__:trials:24 - Trial = 26259/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.829 | DEBUG    | __main__:trials:29 - Trial = 26259/30000 | Total reward = 46.17
2022-01-26 14:18:33.833 | DEBUG    | __main__:trials:24 - Trial = 26260/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.834 | DEBUG    | __main__:trials:29 - Trial = 26260/30000 | Total reward = 24.33
2022-01-26 14:18:33.838 | DEBUG    | __main__:trials:24 - Trial = 26261/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.839 | DEBUG    | __main__:trials:29 - Trial = 26261/30000 | Total reward = 26.67
2022-01-26 14:18:33.842 | DEBUG    | __main__:trials:24 - Trial = 26262/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.844 | DEBUG    | __main__:trials:29 - Trial = 26262/30000 | Total reward = 45.62
2022-01-26 14:18:33.847 | DEBUG    | __main__:trials:24 - Trial = 26263/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.848 | DEBUG    | __main__:trials:29 - Trial = 26263/30000 | Total reward = 30.30
2022-01-26 14:18:33.851 | DEBUG    | __main__:trials:24 - Trial = 26264/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.852 | DEBUG    | __main__:trials:29 - Trial = 26264/30000 | Total reward = 40.08
2022-01-26 14:18:33.856 | DEBUG    | __main__:trials:24 - Trial = 26265/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.857 | DEBUG    | __main__:trials:29 - Trial = 26265/30000 | Total reward = 37.48
2022-01-26 14:18:33.860 | DEBUG    | __main__:trials:24 - Trial = 26266/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.861 | DEBUG    | __main__:trials:29 - Trial = 26266/30000 | Total reward = 33.41
2022-01-26 14:18:33.864 | DEBUG    | __main__:trials:24 - Trial = 26267/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.865 | DEBUG    | __main__:trials:29 - Trial = 26267/30000 | Total reward = 40.58
2022-01-26 14:18:33.868 | DEBUG    | __main__:trials:24 - Trial = 26268/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.870 | DEBUG    | __main__:trials:29 - Trial = 26268/30000 | Total reward = 32.13
2022-01-26 14:18:33.873 | DEBUG    | __main__:trials:26 - Trial = 26269/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:33.874 | DEBUG    | __main__:trials:29 - Trial = 26269/30000 | Total reward = 25.93
2022-01-26 14:18:33.877 | DEBUG    | __main__:trials:24 - Trial = 26270/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.878 | DEBUG    | __main__:trials:29 - Trial = 26270/30000 | Total reward = 31.06
2022-01-26 14:18:33.881 | DEBUG    | __main__:trials:24 - Trial = 26271/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.882 | DEBUG    | __main__:trials:29 - Trial = 26271/30000 | Total reward = 49.47
2022-01-26 14:18:33.885 | DEBUG    | __main__:trials:24 - Trial = 26272/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.886 | DEBUG    | __main__:trials:29 - Trial = 26272/30000 | Total reward = 45.71
2022-01-26 14:18:33.889 | DEBUG    | __main__:trials:24 - Trial = 26273/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.889 | DEBUG    | __main__:trials:29 - Trial = 26273/30000 | Total reward = 45.46
2022-01-26 14:18:33.893 | DEBUG    | __main__:trials:24 - Trial = 26274/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.894 | DEBUG    | __main__:trials:29 - Trial = 26274/30000 | Total reward = 45.07
2022-01-26 14:18:33.898 | DEBUG    | __main__:trials:24 - Trial = 26275/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.898 | DEBUG    | __main__:trials:29 - Trial = 26275/30000 | Total reward = 45.03
2022-01-26 14:18:33.902 | DEBUG    | __main__:trials:24 - Trial = 26276/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.903 | DEBUG    | __main__:trials:29 - Trial = 26276/30000 | Total reward = 43.48
2022-01-26 14:18:33.906 | DEBUG    | __main__:trials:24 - Trial = 26277/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.907 | DEBUG    | __main__:trials:29 - Trial = 26277/30000 | Total reward = 44.95
2022-01-26 14:18:33.911 | DEBUG    | __main__:trials:24 - Trial = 26278/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.911 | DEBUG    | __main__:trials:29 - Trial = 26278/30000 | Total reward = 43.98
2022-01-26 14:18:33.915 | DEBUG    | __main__:trials:24 - Trial = 26279/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.916 | DEBUG    | __main__:trials:29 - Trial = 26279/30000 | Total reward = 45.62
2022-01-26 14:18:33.919 | DEBUG    | __main__:trials:24 - Trial = 26280/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.920 | DEBUG    | __main__:trials:29 - Trial = 26280/30000 | Total reward = 45.09
2022-01-26 14:18:33.923 | DEBUG    | __main__:trials:24 - Trial = 26281/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.924 | DEBUG    | __main__:trials:29 - Trial = 26281/30000 | Total reward = 43.32
2022-01-26 14:18:33.927 | DEBUG    | __main__:trials:24 - Trial = 26282/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.928 | DEBUG    | __main__:trials:29 - Trial = 26282/30000 | Total reward = 43.73
2022-01-26 14:18:33.931 | DEBUG    | __main__:trials:24 - Trial = 26283/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.932 | DEBUG    | __main__:trials:29 - Trial = 26283/30000 | Total reward = 44.39
2022-01-26 14:18:33.936 | DEBUG    | __main__:trials:24 - Trial = 26284/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.936 | DEBUG    | __main__:trials:29 - Trial = 26284/30000 | Total reward = 34.66
2022-01-26 14:18:33.940 | DEBUG    | __main__:trials:24 - Trial = 26285/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.940 | DEBUG    | __main__:trials:29 - Trial = 26285/30000 | Total reward = 34.90
2022-01-26 14:18:33.944 | DEBUG    | __main__:trials:24 - Trial = 26286/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.946 | DEBUG    | __main__:trials:29 - Trial = 26286/30000 | Total reward = 29.83
2022-01-26 14:18:33.949 | DEBUG    | __main__:trials:24 - Trial = 26287/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.950 | DEBUG    | __main__:trials:29 - Trial = 26287/30000 | Total reward = 32.50
2022-01-26 14:18:33.953 | DEBUG    | __main__:trials:24 - Trial = 26288/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.955 | DEBUG    | __main__:trials:29 - Trial = 26288/30000 | Total reward = 39.49
2022-01-26 14:18:33.958 | DEBUG    | __main__:trials:24 - Trial = 26289/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.958 | DEBUG    | __main__:trials:29 - Trial = 26289/30000 | Total reward = 43.45
2022-01-26 14:18:33.961 | DEBUG    | __main__:trials:24 - Trial = 26290/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.962 | DEBUG    | __main__:trials:29 - Trial = 26290/30000 | Total reward = 33.17
2022-01-26 14:18:33.965 | DEBUG    | __main__:trials:24 - Trial = 26291/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.966 | DEBUG    | __main__:trials:29 - Trial = 26291/30000 | Total reward = 34.75
2022-01-26 14:18:33.969 | DEBUG    | __main__:trials:24 - Trial = 26292/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.971 | DEBUG    | __main__:trials:29 - Trial = 26292/30000 | Total reward = 47.45
2022-01-26 14:18:33.974 | DEBUG    | __main__:trials:24 - Trial = 26293/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.976 | DEBUG    | __main__:trials:29 - Trial = 26293/30000 | Total reward = 41.62
2022-01-26 14:18:33.980 | DEBUG    | __main__:trials:24 - Trial = 26294/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.980 | DEBUG    | __main__:trials:29 - Trial = 26294/30000 | Total reward = 30.14
2022-01-26 14:18:33.984 | DEBUG    | __main__:trials:24 - Trial = 26295/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.985 | DEBUG    | __main__:trials:29 - Trial = 26295/30000 | Total reward = 45.84
2022-01-26 14:18:33.988 | DEBUG    | __main__:trials:24 - Trial = 26296/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.989 | DEBUG    | __main__:trials:29 - Trial = 26296/30000 | Total reward = 39.38
2022-01-26 14:18:33.992 | DEBUG    | __main__:trials:24 - Trial = 26297/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.993 | DEBUG    | __main__:trials:29 - Trial = 26297/30000 | Total reward = 45.62
2022-01-26 14:18:33.996 | DEBUG    | __main__:trials:24 - Trial = 26298/30000 | Max number of steps (20) reached
2022-01-26 14:18:33.997 | DEBUG    | __main__:trials:29 - Trial = 26298/30000 | Total reward = 44.14
2022-01-26 14:18:33.999 | DEBUG    | __main__:trials:26 - Trial = 26299/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.000 | DEBUG    | __main__:trials:29 - Trial = 26299/30000 | Total reward = 19.68
2022-01-26 14:18:34.003 | DEBUG    | __main__:trials:24 - Trial = 26300/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.005 | DEBUG    | __main__:trials:29 - Trial = 26300/30000 | Total reward = 44.07
2022-01-26 14:18:34.009 | DEBUG    | __main__:trials:24 - Trial = 26301/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.010 | DEBUG    | __main__:trials:29 - Trial = 26301/30000 | Total reward = 34.93
2022-01-26 14:18:34.013 | DEBUG    | __main__:trials:24 - Trial = 26302/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.014 | DEBUG    | __main__:trials:29 - Trial = 26302/30000 | Total reward = 34.03
2022-01-26 14:18:34.017 | DEBUG    | __main__:trials:24 - Trial = 26303/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.018 | DEBUG    | __main__:trials:29 - Trial = 26303/30000 | Total reward = 36.16
2022-01-26 14:18:34.021 | DEBUG    | __main__:trials:24 - Trial = 26304/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.022 | DEBUG    | __main__:trials:29 - Trial = 26304/30000 | Total reward = 44.13
2022-01-26 14:18:34.025 | DEBUG    | __main__:trials:24 - Trial = 26305/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.026 | DEBUG    | __main__:trials:29 - Trial = 26305/30000 | Total reward = 30.92
2022-01-26 14:18:34.029 | DEBUG    | __main__:trials:26 - Trial = 26306/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.030 | DEBUG    | __main__:trials:29 - Trial = 26306/30000 | Total reward = 22.91
2022-01-26 14:18:34.033 | DEBUG    | __main__:trials:24 - Trial = 26307/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.035 | DEBUG    | __main__:trials:29 - Trial = 26307/30000 | Total reward = 32.32
2022-01-26 14:18:34.037 | DEBUG    | __main__:trials:26 - Trial = 26308/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.039 | DEBUG    | __main__:trials:29 - Trial = 26308/30000 | Total reward = 17.94
2022-01-26 14:18:34.043 | DEBUG    | __main__:trials:24 - Trial = 26309/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.043 | DEBUG    | __main__:trials:29 - Trial = 26309/30000 | Total reward = 41.69
2022-01-26 14:18:34.048 | DEBUG    | __main__:trials:24 - Trial = 26310/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.049 | DEBUG    | __main__:trials:29 - Trial = 26310/30000 | Total reward = 38.80
2022-01-26 14:18:34.053 | DEBUG    | __main__:trials:24 - Trial = 26311/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.054 | DEBUG    | __main__:trials:29 - Trial = 26311/30000 | Total reward = 33.02
2022-01-26 14:18:34.058 | DEBUG    | __main__:trials:24 - Trial = 26312/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.059 | DEBUG    | __main__:trials:29 - Trial = 26312/30000 | Total reward = 39.11
2022-01-26 14:18:34.063 | DEBUG    | __main__:trials:26 - Trial = 26313/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.064 | DEBUG    | __main__:trials:29 - Trial = 26313/30000 | Total reward = 22.64
2022-01-26 14:18:34.068 | DEBUG    | __main__:trials:24 - Trial = 26314/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.070 | DEBUG    | __main__:trials:29 - Trial = 26314/30000 | Total reward = 35.28
2022-01-26 14:18:34.073 | DEBUG    | __main__:trials:26 - Trial = 26315/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.074 | DEBUG    | __main__:trials:29 - Trial = 26315/30000 | Total reward = 23.24
2022-01-26 14:18:34.077 | DEBUG    | __main__:trials:24 - Trial = 26316/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.079 | DEBUG    | __main__:trials:29 - Trial = 26316/30000 | Total reward = 23.66
2022-01-26 14:18:34.082 | DEBUG    | __main__:trials:24 - Trial = 26317/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.084 | DEBUG    | __main__:trials:29 - Trial = 26317/30000 | Total reward = 28.35
2022-01-26 14:18:34.087 | DEBUG    | __main__:trials:24 - Trial = 26318/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.089 | DEBUG    | __main__:trials:29 - Trial = 26318/30000 | Total reward = 45.15
2022-01-26 14:18:34.092 | DEBUG    | __main__:trials:24 - Trial = 26319/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.094 | DEBUG    | __main__:trials:29 - Trial = 26319/30000 | Total reward = 44.41
2022-01-26 14:18:34.098 | DEBUG    | __main__:trials:24 - Trial = 26320/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.099 | DEBUG    | __main__:trials:29 - Trial = 26320/30000 | Total reward = 36.72
2022-01-26 14:18:34.102 | DEBUG    | __main__:trials:26 - Trial = 26321/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.104 | DEBUG    | __main__:trials:29 - Trial = 26321/30000 | Total reward = 22.01
2022-01-26 14:18:34.107 | DEBUG    | __main__:trials:24 - Trial = 26322/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.109 | DEBUG    | __main__:trials:29 - Trial = 26322/30000 | Total reward = 35.83
2022-01-26 14:18:34.113 | DEBUG    | __main__:trials:24 - Trial = 26323/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.114 | DEBUG    | __main__:trials:29 - Trial = 26323/30000 | Total reward = 31.38
2022-01-26 14:18:34.118 | DEBUG    | __main__:trials:24 - Trial = 26324/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.118 | DEBUG    | __main__:trials:29 - Trial = 26324/30000 | Total reward = 30.68
2022-01-26 14:18:34.122 | DEBUG    | __main__:trials:24 - Trial = 26325/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.124 | DEBUG    | __main__:trials:29 - Trial = 26325/30000 | Total reward = 39.03
2022-01-26 14:18:34.127 | DEBUG    | __main__:trials:26 - Trial = 26326/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.128 | DEBUG    | __main__:trials:29 - Trial = 26326/30000 | Total reward = 24.98
2022-01-26 14:18:34.132 | DEBUG    | __main__:trials:24 - Trial = 26327/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.133 | DEBUG    | __main__:trials:29 - Trial = 26327/30000 | Total reward = 42.15
2022-01-26 14:18:34.136 | DEBUG    | __main__:trials:24 - Trial = 26328/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.138 | DEBUG    | __main__:trials:29 - Trial = 26328/30000 | Total reward = 34.90
2022-01-26 14:18:34.141 | DEBUG    | __main__:trials:24 - Trial = 26329/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.143 | DEBUG    | __main__:trials:29 - Trial = 26329/30000 | Total reward = 39.29
2022-01-26 14:18:34.147 | DEBUG    | __main__:trials:24 - Trial = 26330/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.148 | DEBUG    | __main__:trials:29 - Trial = 26330/30000 | Total reward = 42.22
2022-01-26 14:18:34.152 | DEBUG    | __main__:trials:24 - Trial = 26331/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.153 | DEBUG    | __main__:trials:29 - Trial = 26331/30000 | Total reward = 23.74
2022-01-26 14:18:34.156 | DEBUG    | __main__:trials:24 - Trial = 26332/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.157 | DEBUG    | __main__:trials:29 - Trial = 26332/30000 | Total reward = 31.26
2022-01-26 14:18:34.161 | DEBUG    | __main__:trials:26 - Trial = 26333/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.162 | DEBUG    | __main__:trials:29 - Trial = 26333/30000 | Total reward = 28.91
2022-01-26 14:18:34.165 | DEBUG    | __main__:trials:24 - Trial = 26334/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.167 | DEBUG    | __main__:trials:29 - Trial = 26334/30000 | Total reward = 39.99
2022-01-26 14:18:34.170 | DEBUG    | __main__:trials:24 - Trial = 26335/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.171 | DEBUG    | __main__:trials:29 - Trial = 26335/30000 | Total reward = 25.56
2022-01-26 14:18:34.175 | DEBUG    | __main__:trials:24 - Trial = 26336/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.175 | DEBUG    | __main__:trials:29 - Trial = 26336/30000 | Total reward = 42.15
2022-01-26 14:18:34.179 | DEBUG    | __main__:trials:24 - Trial = 26337/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.181 | DEBUG    | __main__:trials:29 - Trial = 26337/30000 | Total reward = 35.20
2022-01-26 14:18:34.184 | DEBUG    | __main__:trials:24 - Trial = 26338/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.185 | DEBUG    | __main__:trials:29 - Trial = 26338/30000 | Total reward = 34.67
2022-01-26 14:18:34.190 | DEBUG    | __main__:trials:24 - Trial = 26339/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.191 | DEBUG    | __main__:trials:29 - Trial = 26339/30000 | Total reward = 37.19
2022-01-26 14:18:34.194 | DEBUG    | __main__:trials:26 - Trial = 26340/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.195 | DEBUG    | __main__:trials:29 - Trial = 26340/30000 | Total reward = 13.55
2022-01-26 14:18:34.199 | DEBUG    | __main__:trials:24 - Trial = 26341/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.201 | DEBUG    | __main__:trials:29 - Trial = 26341/30000 | Total reward = 22.50
2022-01-26 14:18:34.204 | DEBUG    | __main__:trials:24 - Trial = 26342/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.206 | DEBUG    | __main__:trials:29 - Trial = 26342/30000 | Total reward = 27.19
2022-01-26 14:18:34.209 | DEBUG    | __main__:trials:24 - Trial = 26343/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.211 | DEBUG    | __main__:trials:29 - Trial = 26343/30000 | Total reward = 29.84
2022-01-26 14:18:34.214 | DEBUG    | __main__:trials:24 - Trial = 26344/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.216 | DEBUG    | __main__:trials:29 - Trial = 26344/30000 | Total reward = 33.19
2022-01-26 14:18:34.219 | DEBUG    | __main__:trials:24 - Trial = 26345/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.221 | DEBUG    | __main__:trials:29 - Trial = 26345/30000 | Total reward = 25.13
2022-01-26 14:18:34.224 | DEBUG    | __main__:trials:24 - Trial = 26346/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.226 | DEBUG    | __main__:trials:29 - Trial = 26346/30000 | Total reward = 38.05
2022-01-26 14:18:34.230 | DEBUG    | __main__:trials:24 - Trial = 26347/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.231 | DEBUG    | __main__:trials:29 - Trial = 26347/30000 | Total reward = 31.94
2022-01-26 14:18:34.235 | DEBUG    | __main__:trials:24 - Trial = 26348/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.235 | DEBUG    | __main__:trials:29 - Trial = 26348/30000 | Total reward = 41.81
2022-01-26 14:18:34.240 | DEBUG    | __main__:trials:24 - Trial = 26349/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.242 | DEBUG    | __main__:trials:29 - Trial = 26349/30000 | Total reward = 12.98
2022-01-26 14:18:34.245 | DEBUG    | __main__:trials:24 - Trial = 26350/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.246 | DEBUG    | __main__:trials:29 - Trial = 26350/30000 | Total reward = 45.79
2022-01-26 14:18:34.250 | DEBUG    | __main__:trials:24 - Trial = 26351/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.252 | DEBUG    | __main__:trials:29 - Trial = 26351/30000 | Total reward = 41.53
2022-01-26 14:18:34.255 | DEBUG    | __main__:trials:24 - Trial = 26352/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.257 | DEBUG    | __main__:trials:29 - Trial = 26352/30000 | Total reward = 39.58
2022-01-26 14:18:34.260 | DEBUG    | __main__:trials:24 - Trial = 26353/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.262 | DEBUG    | __main__:trials:29 - Trial = 26353/30000 | Total reward = 36.34
2022-01-26 14:18:34.265 | DEBUG    | __main__:trials:24 - Trial = 26354/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.266 | DEBUG    | __main__:trials:29 - Trial = 26354/30000 | Total reward = 36.15
2022-01-26 14:18:34.269 | DEBUG    | __main__:trials:24 - Trial = 26355/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.270 | DEBUG    | __main__:trials:29 - Trial = 26355/30000 | Total reward = 30.58
2022-01-26 14:18:34.274 | DEBUG    | __main__:trials:24 - Trial = 26356/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.275 | DEBUG    | __main__:trials:29 - Trial = 26356/30000 | Total reward = 41.44
2022-01-26 14:18:34.278 | DEBUG    | __main__:trials:26 - Trial = 26357/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.279 | DEBUG    | __main__:trials:29 - Trial = 26357/30000 | Total reward = 20.40
2022-01-26 14:18:34.282 | DEBUG    | __main__:trials:26 - Trial = 26358/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.284 | DEBUG    | __main__:trials:29 - Trial = 26358/30000 | Total reward = 26.17
2022-01-26 14:18:34.288 | DEBUG    | __main__:trials:24 - Trial = 26359/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.288 | DEBUG    | __main__:trials:29 - Trial = 26359/30000 | Total reward = 58.09
2022-01-26 14:18:34.293 | DEBUG    | __main__:trials:24 - Trial = 26360/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.294 | DEBUG    | __main__:trials:29 - Trial = 26360/30000 | Total reward = 54.58
2022-01-26 14:18:34.298 | DEBUG    | __main__:trials:24 - Trial = 26361/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.299 | DEBUG    | __main__:trials:29 - Trial = 26361/30000 | Total reward = 30.40
2022-01-26 14:18:34.303 | DEBUG    | __main__:trials:24 - Trial = 26362/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.304 | DEBUG    | __main__:trials:29 - Trial = 26362/30000 | Total reward = 27.21
2022-01-26 14:18:34.308 | DEBUG    | __main__:trials:24 - Trial = 26363/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.310 | DEBUG    | __main__:trials:29 - Trial = 26363/30000 | Total reward = 39.19
2022-01-26 14:18:34.313 | DEBUG    | __main__:trials:24 - Trial = 26364/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.315 | DEBUG    | __main__:trials:29 - Trial = 26364/30000 | Total reward = 37.81
2022-01-26 14:18:34.319 | DEBUG    | __main__:trials:24 - Trial = 26365/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.319 | DEBUG    | __main__:trials:29 - Trial = 26365/30000 | Total reward = 34.58
2022-01-26 14:18:34.324 | DEBUG    | __main__:trials:24 - Trial = 26366/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.325 | DEBUG    | __main__:trials:29 - Trial = 26366/30000 | Total reward = 36.03
2022-01-26 14:18:34.328 | DEBUG    | __main__:trials:24 - Trial = 26367/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.330 | DEBUG    | __main__:trials:29 - Trial = 26367/30000 | Total reward = 44.16
2022-01-26 14:18:34.334 | DEBUG    | __main__:trials:24 - Trial = 26368/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.335 | DEBUG    | __main__:trials:29 - Trial = 26368/30000 | Total reward = 28.93
2022-01-26 14:18:34.338 | DEBUG    | __main__:trials:24 - Trial = 26369/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.340 | DEBUG    | __main__:trials:29 - Trial = 26369/30000 | Total reward = 21.54
2022-01-26 14:18:34.343 | DEBUG    | __main__:trials:24 - Trial = 26370/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.345 | DEBUG    | __main__:trials:29 - Trial = 26370/30000 | Total reward = 36.15
2022-01-26 14:18:34.347 | DEBUG    | __main__:trials:24 - Trial = 26371/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.349 | DEBUG    | __main__:trials:29 - Trial = 26371/30000 | Total reward = 51.50
2022-01-26 14:18:34.352 | DEBUG    | __main__:trials:24 - Trial = 26372/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.353 | DEBUG    | __main__:trials:29 - Trial = 26372/30000 | Total reward = 46.22
2022-01-26 14:18:34.356 | DEBUG    | __main__:trials:24 - Trial = 26373/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.358 | DEBUG    | __main__:trials:29 - Trial = 26373/30000 | Total reward = 30.92
2022-01-26 14:18:34.361 | DEBUG    | __main__:trials:26 - Trial = 26374/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.362 | DEBUG    | __main__:trials:29 - Trial = 26374/30000 | Total reward = 19.71
2022-01-26 14:18:34.366 | DEBUG    | __main__:trials:24 - Trial = 26375/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.366 | DEBUG    | __main__:trials:29 - Trial = 26375/30000 | Total reward = 26.71
2022-01-26 14:18:34.371 | DEBUG    | __main__:trials:24 - Trial = 26376/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.372 | DEBUG    | __main__:trials:29 - Trial = 26376/30000 | Total reward = 17.11
2022-01-26 14:18:34.376 | DEBUG    | __main__:trials:24 - Trial = 26377/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.377 | DEBUG    | __main__:trials:29 - Trial = 26377/30000 | Total reward = 31.09
2022-01-26 14:18:34.381 | DEBUG    | __main__:trials:24 - Trial = 26378/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.383 | DEBUG    | __main__:trials:29 - Trial = 26378/30000 | Total reward = 31.21
2022-01-26 14:18:34.386 | DEBUG    | __main__:trials:24 - Trial = 26379/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.388 | DEBUG    | __main__:trials:29 - Trial = 26379/30000 | Total reward = 41.54
2022-01-26 14:18:34.392 | DEBUG    | __main__:trials:24 - Trial = 26380/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.392 | DEBUG    | __main__:trials:29 - Trial = 26380/30000 | Total reward = 32.76
2022-01-26 14:18:34.396 | DEBUG    | __main__:trials:24 - Trial = 26381/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.397 | DEBUG    | __main__:trials:29 - Trial = 26381/30000 | Total reward = 37.41
2022-01-26 14:18:34.401 | DEBUG    | __main__:trials:24 - Trial = 26382/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.403 | DEBUG    | __main__:trials:29 - Trial = 26382/30000 | Total reward = 36.15
2022-01-26 14:18:34.407 | DEBUG    | __main__:trials:24 - Trial = 26383/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.408 | DEBUG    | __main__:trials:29 - Trial = 26383/30000 | Total reward = 44.06
2022-01-26 14:18:34.411 | DEBUG    | __main__:trials:26 - Trial = 26384/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.413 | DEBUG    | __main__:trials:29 - Trial = 26384/30000 | Total reward = 12.86
2022-01-26 14:18:34.416 | DEBUG    | __main__:trials:24 - Trial = 26385/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.417 | DEBUG    | __main__:trials:29 - Trial = 26385/30000 | Total reward = 36.37
2022-01-26 14:18:34.421 | DEBUG    | __main__:trials:26 - Trial = 26386/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.422 | DEBUG    | __main__:trials:29 - Trial = 26386/30000 | Total reward = 33.04
2022-01-26 14:18:34.425 | DEBUG    | __main__:trials:24 - Trial = 26387/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.426 | DEBUG    | __main__:trials:29 - Trial = 26387/30000 | Total reward = 18.56
2022-01-26 14:18:34.431 | DEBUG    | __main__:trials:24 - Trial = 26388/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.432 | DEBUG    | __main__:trials:29 - Trial = 26388/30000 | Total reward = 30.26
2022-01-26 14:18:34.436 | DEBUG    | __main__:trials:24 - Trial = 26389/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.437 | DEBUG    | __main__:trials:29 - Trial = 26389/30000 | Total reward = 26.07
2022-01-26 14:18:34.440 | DEBUG    | __main__:trials:24 - Trial = 26390/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.442 | DEBUG    | __main__:trials:29 - Trial = 26390/30000 | Total reward = 27.73
2022-01-26 14:18:34.445 | DEBUG    | __main__:trials:26 - Trial = 26391/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.445 | DEBUG    | __main__:trials:29 - Trial = 26391/30000 | Total reward = 13.65
2022-01-26 14:18:34.448 | DEBUG    | __main__:trials:24 - Trial = 26392/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.450 | DEBUG    | __main__:trials:29 - Trial = 26392/30000 | Total reward = 29.08
2022-01-26 14:18:34.453 | DEBUG    | __main__:trials:24 - Trial = 26393/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.453 | DEBUG    | __main__:trials:29 - Trial = 26393/30000 | Total reward = 23.99
2022-01-26 14:18:34.457 | DEBUG    | __main__:trials:26 - Trial = 26394/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.457 | DEBUG    | __main__:trials:29 - Trial = 26394/30000 | Total reward = 20.51
2022-01-26 14:18:34.461 | DEBUG    | __main__:trials:24 - Trial = 26395/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.461 | DEBUG    | __main__:trials:29 - Trial = 26395/30000 | Total reward = 26.70
2022-01-26 14:18:34.466 | DEBUG    | __main__:trials:24 - Trial = 26396/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.467 | DEBUG    | __main__:trials:29 - Trial = 26396/30000 | Total reward = 21.24
2022-01-26 14:18:34.470 | DEBUG    | __main__:trials:24 - Trial = 26397/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.472 | DEBUG    | __main__:trials:29 - Trial = 26397/30000 | Total reward = 28.92
2022-01-26 14:18:34.475 | DEBUG    | __main__:trials:24 - Trial = 26398/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.477 | DEBUG    | __main__:trials:29 - Trial = 26398/30000 | Total reward = 26.21
2022-01-26 14:18:34.480 | DEBUG    | __main__:trials:24 - Trial = 26399/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.481 | DEBUG    | __main__:trials:29 - Trial = 26399/30000 | Total reward = 19.37
2022-01-26 14:18:34.484 | DEBUG    | __main__:trials:24 - Trial = 26400/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.485 | DEBUG    | __main__:trials:29 - Trial = 26400/30000 | Total reward = 26.17
2022-01-26 14:18:34.489 | DEBUG    | __main__:trials:24 - Trial = 26401/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.489 | DEBUG    | __main__:trials:29 - Trial = 26401/30000 | Total reward = 25.93
2022-01-26 14:18:34.493 | DEBUG    | __main__:trials:24 - Trial = 26402/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.494 | DEBUG    | __main__:trials:29 - Trial = 26402/30000 | Total reward = 18.35
2022-01-26 14:18:34.498 | DEBUG    | __main__:trials:24 - Trial = 26403/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.499 | DEBUG    | __main__:trials:29 - Trial = 26403/30000 | Total reward = 31.60
2022-01-26 14:18:34.503 | DEBUG    | __main__:trials:24 - Trial = 26404/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.504 | DEBUG    | __main__:trials:29 - Trial = 26404/30000 | Total reward = 26.99
2022-01-26 14:18:34.507 | DEBUG    | __main__:trials:24 - Trial = 26405/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.509 | DEBUG    | __main__:trials:29 - Trial = 26405/30000 | Total reward = 31.94
2022-01-26 14:18:34.513 | DEBUG    | __main__:trials:24 - Trial = 26406/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.513 | DEBUG    | __main__:trials:29 - Trial = 26406/30000 | Total reward = 27.95
2022-01-26 14:18:34.517 | DEBUG    | __main__:trials:24 - Trial = 26407/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.518 | DEBUG    | __main__:trials:29 - Trial = 26407/30000 | Total reward = 27.19
2022-01-26 14:18:34.522 | DEBUG    | __main__:trials:24 - Trial = 26408/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.524 | DEBUG    | __main__:trials:29 - Trial = 26408/30000 | Total reward = 34.93
2022-01-26 14:18:34.527 | DEBUG    | __main__:trials:24 - Trial = 26409/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.527 | DEBUG    | __main__:trials:29 - Trial = 26409/30000 | Total reward = 32.03
2022-01-26 14:18:34.531 | DEBUG    | __main__:trials:24 - Trial = 26410/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.532 | DEBUG    | __main__:trials:29 - Trial = 26410/30000 | Total reward = 27.05
2022-01-26 14:18:34.535 | DEBUG    | __main__:trials:26 - Trial = 26411/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.536 | DEBUG    | __main__:trials:29 - Trial = 26411/30000 | Total reward = 17.46
2022-01-26 14:18:34.539 | DEBUG    | __main__:trials:24 - Trial = 26412/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.541 | DEBUG    | __main__:trials:29 - Trial = 26412/30000 | Total reward = 27.04
2022-01-26 14:18:34.544 | DEBUG    | __main__:trials:24 - Trial = 26413/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.546 | DEBUG    | __main__:trials:29 - Trial = 26413/30000 | Total reward = 32.80
2022-01-26 14:18:34.550 | DEBUG    | __main__:trials:24 - Trial = 26414/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.552 | DEBUG    | __main__:trials:29 - Trial = 26414/30000 | Total reward = 28.25
2022-01-26 14:18:34.554 | DEBUG    | __main__:trials:26 - Trial = 26415/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.556 | DEBUG    | __main__:trials:29 - Trial = 26415/30000 | Total reward = 23.08
2022-01-26 14:18:34.560 | DEBUG    | __main__:trials:24 - Trial = 26416/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.560 | DEBUG    | __main__:trials:29 - Trial = 26416/30000 | Total reward = 24.74
2022-01-26 14:18:34.565 | DEBUG    | __main__:trials:24 - Trial = 26417/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.566 | DEBUG    | __main__:trials:29 - Trial = 26417/30000 | Total reward = 17.73
2022-01-26 14:18:34.569 | DEBUG    | __main__:trials:26 - Trial = 26418/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.570 | DEBUG    | __main__:trials:29 - Trial = 26418/30000 | Total reward = 15.26
2022-01-26 14:18:34.573 | DEBUG    | __main__:trials:24 - Trial = 26419/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.573 | DEBUG    | __main__:trials:29 - Trial = 26419/30000 | Total reward = 11.24
2022-01-26 14:18:34.578 | DEBUG    | __main__:trials:24 - Trial = 26420/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.578 | DEBUG    | __main__:trials:29 - Trial = 26420/30000 | Total reward = 38.98
2022-01-26 14:18:34.583 | DEBUG    | __main__:trials:24 - Trial = 26421/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.583 | DEBUG    | __main__:trials:29 - Trial = 26421/30000 | Total reward = 33.01
2022-01-26 14:18:34.588 | DEBUG    | __main__:trials:24 - Trial = 26422/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.588 | DEBUG    | __main__:trials:29 - Trial = 26422/30000 | Total reward = 44.32
2022-01-26 14:18:34.593 | DEBUG    | __main__:trials:24 - Trial = 26423/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.595 | DEBUG    | __main__:trials:29 - Trial = 26423/30000 | Total reward = 30.15
2022-01-26 14:18:34.598 | DEBUG    | __main__:trials:24 - Trial = 26424/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.599 | DEBUG    | __main__:trials:29 - Trial = 26424/30000 | Total reward = 29.16
2022-01-26 14:18:34.602 | DEBUG    | __main__:trials:26 - Trial = 26425/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.604 | DEBUG    | __main__:trials:29 - Trial = 26425/30000 | Total reward = 12.19
2022-01-26 14:18:34.607 | DEBUG    | __main__:trials:24 - Trial = 26426/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.609 | DEBUG    | __main__:trials:29 - Trial = 26426/30000 | Total reward = 28.15
2022-01-26 14:18:34.612 | DEBUG    | __main__:trials:26 - Trial = 26427/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.613 | DEBUG    | __main__:trials:29 - Trial = 26427/30000 | Total reward = 17.07
2022-01-26 14:18:34.617 | DEBUG    | __main__:trials:24 - Trial = 26428/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.618 | DEBUG    | __main__:trials:29 - Trial = 26428/30000 | Total reward = 16.50
2022-01-26 14:18:34.622 | DEBUG    | __main__:trials:24 - Trial = 26429/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.623 | DEBUG    | __main__:trials:29 - Trial = 26429/30000 | Total reward = 15.86
2022-01-26 14:18:34.628 | DEBUG    | __main__:trials:24 - Trial = 26430/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.629 | DEBUG    | __main__:trials:29 - Trial = 26430/30000 | Total reward = 51.47
2022-01-26 14:18:34.633 | DEBUG    | __main__:trials:24 - Trial = 26431/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.634 | DEBUG    | __main__:trials:29 - Trial = 26431/30000 | Total reward = 43.43
2022-01-26 14:18:34.638 | DEBUG    | __main__:trials:24 - Trial = 26432/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.639 | DEBUG    | __main__:trials:29 - Trial = 26432/30000 | Total reward = 37.73
2022-01-26 14:18:34.642 | DEBUG    | __main__:trials:24 - Trial = 26433/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.643 | DEBUG    | __main__:trials:29 - Trial = 26433/30000 | Total reward = 26.09
2022-01-26 14:18:34.646 | DEBUG    | __main__:trials:24 - Trial = 26434/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.648 | DEBUG    | __main__:trials:29 - Trial = 26434/30000 | Total reward = 42.21
2022-01-26 14:18:34.652 | DEBUG    | __main__:trials:24 - Trial = 26435/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.653 | DEBUG    | __main__:trials:29 - Trial = 26435/30000 | Total reward = 34.98
2022-01-26 14:18:34.657 | DEBUG    | __main__:trials:24 - Trial = 26436/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.659 | DEBUG    | __main__:trials:29 - Trial = 26436/30000 | Total reward = 25.87
2022-01-26 14:18:34.662 | DEBUG    | __main__:trials:24 - Trial = 26437/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.663 | DEBUG    | __main__:trials:29 - Trial = 26437/30000 | Total reward = 36.80
2022-01-26 14:18:34.666 | DEBUG    | __main__:trials:26 - Trial = 26438/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.667 | DEBUG    | __main__:trials:29 - Trial = 26438/30000 | Total reward = 15.35
2022-01-26 14:18:34.671 | DEBUG    | __main__:trials:24 - Trial = 26439/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.672 | DEBUG    | __main__:trials:29 - Trial = 26439/30000 | Total reward = 33.43
2022-01-26 14:18:34.676 | DEBUG    | __main__:trials:24 - Trial = 26440/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.678 | DEBUG    | __main__:trials:29 - Trial = 26440/30000 | Total reward = 34.85
2022-01-26 14:18:34.681 | DEBUG    | __main__:trials:24 - Trial = 26441/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.683 | DEBUG    | __main__:trials:29 - Trial = 26441/30000 | Total reward = 43.19
2022-01-26 14:18:34.687 | DEBUG    | __main__:trials:24 - Trial = 26442/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.688 | DEBUG    | __main__:trials:29 - Trial = 26442/30000 | Total reward = 36.36
2022-01-26 14:18:34.692 | DEBUG    | __main__:trials:24 - Trial = 26443/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.692 | DEBUG    | __main__:trials:29 - Trial = 26443/30000 | Total reward = 44.31
2022-01-26 14:18:34.697 | DEBUG    | __main__:trials:24 - Trial = 26444/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.698 | DEBUG    | __main__:trials:29 - Trial = 26444/30000 | Total reward = 47.73
2022-01-26 14:18:34.702 | DEBUG    | __main__:trials:24 - Trial = 26445/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.703 | DEBUG    | __main__:trials:29 - Trial = 26445/30000 | Total reward = 33.09
2022-01-26 14:18:34.707 | DEBUG    | __main__:trials:24 - Trial = 26446/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.708 | DEBUG    | __main__:trials:29 - Trial = 26446/30000 | Total reward = 30.17
2022-01-26 14:18:34.712 | DEBUG    | __main__:trials:24 - Trial = 26447/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.713 | DEBUG    | __main__:trials:29 - Trial = 26447/30000 | Total reward = 31.61
2022-01-26 14:18:34.716 | DEBUG    | __main__:trials:24 - Trial = 26448/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.718 | DEBUG    | __main__:trials:29 - Trial = 26448/30000 | Total reward = 43.71
2022-01-26 14:18:34.722 | DEBUG    | __main__:trials:24 - Trial = 26449/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.722 | DEBUG    | __main__:trials:29 - Trial = 26449/30000 | Total reward = 38.58
2022-01-26 14:18:34.727 | DEBUG    | __main__:trials:24 - Trial = 26450/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.728 | DEBUG    | __main__:trials:29 - Trial = 26450/30000 | Total reward = 35.17
2022-01-26 14:18:34.732 | DEBUG    | __main__:trials:24 - Trial = 26451/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.734 | DEBUG    | __main__:trials:29 - Trial = 26451/30000 | Total reward = 32.51
2022-01-26 14:18:34.737 | DEBUG    | __main__:trials:24 - Trial = 26452/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.739 | DEBUG    | __main__:trials:29 - Trial = 26452/30000 | Total reward = 43.83
2022-01-26 14:18:34.743 | DEBUG    | __main__:trials:24 - Trial = 26453/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.744 | DEBUG    | __main__:trials:29 - Trial = 26453/30000 | Total reward = 43.83
2022-01-26 14:18:34.747 | DEBUG    | __main__:trials:24 - Trial = 26454/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.749 | DEBUG    | __main__:trials:29 - Trial = 26454/30000 | Total reward = 45.76
2022-01-26 14:18:34.752 | DEBUG    | __main__:trials:24 - Trial = 26455/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.753 | DEBUG    | __main__:trials:29 - Trial = 26455/30000 | Total reward = 23.22
2022-01-26 14:18:34.756 | DEBUG    | __main__:trials:24 - Trial = 26456/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.758 | DEBUG    | __main__:trials:29 - Trial = 26456/30000 | Total reward = 37.74
2022-01-26 14:18:34.761 | DEBUG    | __main__:trials:24 - Trial = 26457/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.761 | DEBUG    | __main__:trials:29 - Trial = 26457/30000 | Total reward = 43.22
2022-01-26 14:18:34.766 | DEBUG    | __main__:trials:24 - Trial = 26458/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.767 | DEBUG    | __main__:trials:29 - Trial = 26458/30000 | Total reward = 26.72
2022-01-26 14:18:34.771 | DEBUG    | __main__:trials:24 - Trial = 26459/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.773 | DEBUG    | __main__:trials:29 - Trial = 26459/30000 | Total reward = 37.19
2022-01-26 14:18:34.775 | DEBUG    | __main__:trials:24 - Trial = 26460/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.777 | DEBUG    | __main__:trials:29 - Trial = 26460/30000 | Total reward = 34.67
2022-01-26 14:18:34.781 | DEBUG    | __main__:trials:24 - Trial = 26461/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.782 | DEBUG    | __main__:trials:29 - Trial = 26461/30000 | Total reward = 39.03
2022-01-26 14:18:34.785 | DEBUG    | __main__:trials:24 - Trial = 26462/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.786 | DEBUG    | __main__:trials:29 - Trial = 26462/30000 | Total reward = 39.18
2022-01-26 14:18:34.789 | DEBUG    | __main__:trials:24 - Trial = 26463/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.791 | DEBUG    | __main__:trials:29 - Trial = 26463/30000 | Total reward = 41.39
2022-01-26 14:18:34.794 | DEBUG    | __main__:trials:24 - Trial = 26464/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.796 | DEBUG    | __main__:trials:29 - Trial = 26464/30000 | Total reward = 48.72
2022-01-26 14:18:34.799 | DEBUG    | __main__:trials:24 - Trial = 26465/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.800 | DEBUG    | __main__:trials:29 - Trial = 26465/30000 | Total reward = 36.01
2022-01-26 14:18:34.804 | DEBUG    | __main__:trials:24 - Trial = 26466/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.806 | DEBUG    | __main__:trials:29 - Trial = 26466/30000 | Total reward = 37.13
2022-01-26 14:18:34.810 | DEBUG    | __main__:trials:24 - Trial = 26467/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.810 | DEBUG    | __main__:trials:29 - Trial = 26467/30000 | Total reward = 29.57
2022-01-26 14:18:34.815 | DEBUG    | __main__:trials:24 - Trial = 26468/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.815 | DEBUG    | __main__:trials:29 - Trial = 26468/30000 | Total reward = 44.56
2022-01-26 14:18:34.820 | DEBUG    | __main__:trials:24 - Trial = 26469/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.821 | DEBUG    | __main__:trials:29 - Trial = 26469/30000 | Total reward = 49.26
2022-01-26 14:18:34.825 | DEBUG    | __main__:trials:24 - Trial = 26470/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.826 | DEBUG    | __main__:trials:29 - Trial = 26470/30000 | Total reward = 25.85
2022-01-26 14:18:34.830 | DEBUG    | __main__:trials:24 - Trial = 26471/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.831 | DEBUG    | __main__:trials:29 - Trial = 26471/30000 | Total reward = 27.64
2022-01-26 14:18:34.835 | DEBUG    | __main__:trials:24 - Trial = 26472/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.836 | DEBUG    | __main__:trials:29 - Trial = 26472/30000 | Total reward = 39.63
2022-01-26 14:18:34.840 | DEBUG    | __main__:trials:24 - Trial = 26473/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.842 | DEBUG    | __main__:trials:29 - Trial = 26473/30000 | Total reward = 29.98
2022-01-26 14:18:34.846 | DEBUG    | __main__:trials:24 - Trial = 26474/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.847 | DEBUG    | __main__:trials:29 - Trial = 26474/30000 | Total reward = 34.30
2022-01-26 14:18:34.851 | DEBUG    | __main__:trials:24 - Trial = 26475/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.853 | DEBUG    | __main__:trials:29 - Trial = 26475/30000 | Total reward = 40.20
2022-01-26 14:18:34.856 | DEBUG    | __main__:trials:24 - Trial = 26476/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.858 | DEBUG    | __main__:trials:29 - Trial = 26476/30000 | Total reward = 30.62
2022-01-26 14:18:34.861 | DEBUG    | __main__:trials:24 - Trial = 26477/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.863 | DEBUG    | __main__:trials:29 - Trial = 26477/30000 | Total reward = 30.24
2022-01-26 14:18:34.866 | DEBUG    | __main__:trials:24 - Trial = 26478/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.867 | DEBUG    | __main__:trials:29 - Trial = 26478/30000 | Total reward = 34.65
2022-01-26 14:18:34.870 | DEBUG    | __main__:trials:24 - Trial = 26479/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.872 | DEBUG    | __main__:trials:29 - Trial = 26479/30000 | Total reward = 48.33
2022-01-26 14:18:34.876 | DEBUG    | __main__:trials:24 - Trial = 26480/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.877 | DEBUG    | __main__:trials:29 - Trial = 26480/30000 | Total reward = 35.21
2022-01-26 14:18:34.881 | DEBUG    | __main__:trials:24 - Trial = 26481/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.882 | DEBUG    | __main__:trials:29 - Trial = 26481/30000 | Total reward = 38.84
2022-01-26 14:18:34.886 | DEBUG    | __main__:trials:24 - Trial = 26482/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.886 | DEBUG    | __main__:trials:29 - Trial = 26482/30000 | Total reward = 36.72
2022-01-26 14:18:34.890 | DEBUG    | __main__:trials:24 - Trial = 26483/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.892 | DEBUG    | __main__:trials:29 - Trial = 26483/30000 | Total reward = 30.99
2022-01-26 14:18:34.896 | DEBUG    | __main__:trials:24 - Trial = 26484/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.896 | DEBUG    | __main__:trials:29 - Trial = 26484/30000 | Total reward = 26.61
2022-01-26 14:18:34.899 | DEBUG    | __main__:trials:26 - Trial = 26485/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.901 | DEBUG    | __main__:trials:29 - Trial = 26485/30000 | Total reward = 11.11
2022-01-26 14:18:34.904 | DEBUG    | __main__:trials:24 - Trial = 26486/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.906 | DEBUG    | __main__:trials:29 - Trial = 26486/30000 | Total reward = 37.80
2022-01-26 14:18:34.908 | DEBUG    | __main__:trials:24 - Trial = 26487/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.910 | DEBUG    | __main__:trials:29 - Trial = 26487/30000 | Total reward = 42.19
2022-01-26 14:18:34.914 | DEBUG    | __main__:trials:24 - Trial = 26488/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.915 | DEBUG    | __main__:trials:29 - Trial = 26488/30000 | Total reward = 30.49
2022-01-26 14:18:34.917 | DEBUG    | __main__:trials:26 - Trial = 26489/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.918 | DEBUG    | __main__:trials:29 - Trial = 26489/30000 | Total reward = 10.21
2022-01-26 14:18:34.921 | DEBUG    | __main__:trials:24 - Trial = 26490/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.923 | DEBUG    | __main__:trials:29 - Trial = 26490/30000 | Total reward = 38.43
2022-01-26 14:18:34.925 | DEBUG    | __main__:trials:24 - Trial = 26491/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.927 | DEBUG    | __main__:trials:29 - Trial = 26491/30000 | Total reward = 61.21
2022-01-26 14:18:34.930 | DEBUG    | __main__:trials:24 - Trial = 26492/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.932 | DEBUG    | __main__:trials:29 - Trial = 26492/30000 | Total reward = 35.60
2022-01-26 14:18:34.934 | DEBUG    | __main__:trials:24 - Trial = 26493/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.935 | DEBUG    | __main__:trials:29 - Trial = 26493/30000 | Total reward = 37.83
2022-01-26 14:18:34.939 | DEBUG    | __main__:trials:24 - Trial = 26494/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.940 | DEBUG    | __main__:trials:29 - Trial = 26494/30000 | Total reward = 50.59
2022-01-26 14:18:34.943 | DEBUG    | __main__:trials:24 - Trial = 26495/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.945 | DEBUG    | __main__:trials:29 - Trial = 26495/30000 | Total reward = 50.62
2022-01-26 14:18:34.948 | DEBUG    | __main__:trials:24 - Trial = 26496/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.950 | DEBUG    | __main__:trials:29 - Trial = 26496/30000 | Total reward = 36.40
2022-01-26 14:18:34.953 | DEBUG    | __main__:trials:24 - Trial = 26497/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.954 | DEBUG    | __main__:trials:29 - Trial = 26497/30000 | Total reward = 50.65
2022-01-26 14:18:34.958 | DEBUG    | __main__:trials:24 - Trial = 26498/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.958 | DEBUG    | __main__:trials:29 - Trial = 26498/30000 | Total reward = 35.78
2022-01-26 14:18:34.962 | DEBUG    | __main__:trials:24 - Trial = 26499/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.963 | DEBUG    | __main__:trials:29 - Trial = 26499/30000 | Total reward = 39.42
2022-01-26 14:18:34.967 | DEBUG    | __main__:trials:24 - Trial = 26500/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.968 | DEBUG    | __main__:trials:29 - Trial = 26500/30000 | Total reward = 40.98
2022-01-26 14:18:34.972 | DEBUG    | __main__:trials:24 - Trial = 26501/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.973 | DEBUG    | __main__:trials:29 - Trial = 26501/30000 | Total reward = 45.57
2022-01-26 14:18:34.976 | DEBUG    | __main__:trials:24 - Trial = 26502/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.978 | DEBUG    | __main__:trials:29 - Trial = 26502/30000 | Total reward = 40.38
2022-01-26 14:18:34.981 | DEBUG    | __main__:trials:24 - Trial = 26503/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.982 | DEBUG    | __main__:trials:29 - Trial = 26503/30000 | Total reward = 37.24
2022-01-26 14:18:34.987 | DEBUG    | __main__:trials:24 - Trial = 26504/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.988 | DEBUG    | __main__:trials:29 - Trial = 26504/30000 | Total reward = 36.15
2022-01-26 14:18:34.992 | DEBUG    | __main__:trials:24 - Trial = 26505/30000 | Max number of steps (20) reached
2022-01-26 14:18:34.992 | DEBUG    | __main__:trials:29 - Trial = 26505/30000 | Total reward = 34.88
2022-01-26 14:18:34.996 | DEBUG    | __main__:trials:26 - Trial = 26506/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:34.997 | DEBUG    | __main__:trials:29 - Trial = 26506/30000 | Total reward = 16.60
2022-01-26 14:18:35.000 | DEBUG    | __main__:trials:24 - Trial = 26507/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.001 | DEBUG    | __main__:trials:29 - Trial = 26507/30000 | Total reward = 49.97
2022-01-26 14:18:35.004 | DEBUG    | __main__:trials:26 - Trial = 26508/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.005 | DEBUG    | __main__:trials:29 - Trial = 26508/30000 | Total reward = 15.86
2022-01-26 14:18:35.009 | DEBUG    | __main__:trials:24 - Trial = 26509/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.010 | DEBUG    | __main__:trials:29 - Trial = 26509/30000 | Total reward = 42.48
2022-01-26 14:18:35.014 | DEBUG    | __main__:trials:24 - Trial = 26510/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.016 | DEBUG    | __main__:trials:29 - Trial = 26510/30000 | Total reward = 38.98
2022-01-26 14:18:35.019 | DEBUG    | __main__:trials:24 - Trial = 26511/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.020 | DEBUG    | __main__:trials:29 - Trial = 26511/30000 | Total reward = 38.10
2022-01-26 14:18:35.024 | DEBUG    | __main__:trials:24 - Trial = 26512/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.026 | DEBUG    | __main__:trials:29 - Trial = 26512/30000 | Total reward = 56.67
2022-01-26 14:18:35.029 | DEBUG    | __main__:trials:24 - Trial = 26513/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.030 | DEBUG    | __main__:trials:29 - Trial = 26513/30000 | Total reward = 51.92
2022-01-26 14:18:35.033 | DEBUG    | __main__:trials:26 - Trial = 26514/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.033 | DEBUG    | __main__:trials:29 - Trial = 26514/30000 | Total reward = 23.47
2022-01-26 14:18:35.037 | DEBUG    | __main__:trials:24 - Trial = 26515/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.039 | DEBUG    | __main__:trials:29 - Trial = 26515/30000 | Total reward = 26.74
2022-01-26 14:18:35.042 | DEBUG    | __main__:trials:24 - Trial = 26516/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.044 | DEBUG    | __main__:trials:29 - Trial = 26516/30000 | Total reward = 44.54
2022-01-26 14:18:35.047 | DEBUG    | __main__:trials:24 - Trial = 26517/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.048 | DEBUG    | __main__:trials:29 - Trial = 26517/30000 | Total reward = 36.12
2022-01-26 14:18:35.052 | DEBUG    | __main__:trials:24 - Trial = 26518/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.054 | DEBUG    | __main__:trials:29 - Trial = 26518/30000 | Total reward = 33.48
2022-01-26 14:18:35.057 | DEBUG    | __main__:trials:24 - Trial = 26519/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.058 | DEBUG    | __main__:trials:29 - Trial = 26519/30000 | Total reward = 41.16
2022-01-26 14:18:35.062 | DEBUG    | __main__:trials:24 - Trial = 26520/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.064 | DEBUG    | __main__:trials:29 - Trial = 26520/30000 | Total reward = 41.59
2022-01-26 14:18:35.067 | DEBUG    | __main__:trials:24 - Trial = 26521/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.068 | DEBUG    | __main__:trials:29 - Trial = 26521/30000 | Total reward = 41.81
2022-01-26 14:18:35.072 | DEBUG    | __main__:trials:24 - Trial = 26522/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.074 | DEBUG    | __main__:trials:29 - Trial = 26522/30000 | Total reward = 37.71
2022-01-26 14:18:35.077 | DEBUG    | __main__:trials:24 - Trial = 26523/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.079 | DEBUG    | __main__:trials:29 - Trial = 26523/30000 | Total reward = 30.82
2022-01-26 14:18:35.082 | DEBUG    | __main__:trials:24 - Trial = 26524/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.084 | DEBUG    | __main__:trials:29 - Trial = 26524/30000 | Total reward = 37.64
2022-01-26 14:18:35.087 | DEBUG    | __main__:trials:24 - Trial = 26525/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.089 | DEBUG    | __main__:trials:29 - Trial = 26525/30000 | Total reward = 32.36
2022-01-26 14:18:35.092 | DEBUG    | __main__:trials:24 - Trial = 26526/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.093 | DEBUG    | __main__:trials:29 - Trial = 26526/30000 | Total reward = 47.97
2022-01-26 14:18:35.097 | DEBUG    | __main__:trials:24 - Trial = 26527/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.099 | DEBUG    | __main__:trials:29 - Trial = 26527/30000 | Total reward = 49.15
2022-01-26 14:18:35.102 | DEBUG    | __main__:trials:24 - Trial = 26528/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.104 | DEBUG    | __main__:trials:29 - Trial = 26528/30000 | Total reward = 42.86
2022-01-26 14:18:35.107 | DEBUG    | __main__:trials:24 - Trial = 26529/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.108 | DEBUG    | __main__:trials:29 - Trial = 26529/30000 | Total reward = 15.11
2022-01-26 14:18:35.112 | DEBUG    | __main__:trials:24 - Trial = 26530/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.113 | DEBUG    | __main__:trials:29 - Trial = 26530/30000 | Total reward = 21.84
2022-01-26 14:18:35.115 | DEBUG    | __main__:trials:26 - Trial = 26531/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.117 | DEBUG    | __main__:trials:29 - Trial = 26531/30000 | Total reward = 7.76
2022-01-26 14:18:35.120 | DEBUG    | __main__:trials:24 - Trial = 26532/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.122 | DEBUG    | __main__:trials:29 - Trial = 26532/30000 | Total reward = 50.15
2022-01-26 14:18:35.126 | DEBUG    | __main__:trials:24 - Trial = 26533/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.127 | DEBUG    | __main__:trials:29 - Trial = 26533/30000 | Total reward = 39.84
2022-01-26 14:18:35.130 | DEBUG    | __main__:trials:24 - Trial = 26534/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.132 | DEBUG    | __main__:trials:29 - Trial = 26534/30000 | Total reward = 36.15
2022-01-26 14:18:35.135 | DEBUG    | __main__:trials:24 - Trial = 26535/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.137 | DEBUG    | __main__:trials:29 - Trial = 26535/30000 | Total reward = 45.21
2022-01-26 14:18:35.140 | DEBUG    | __main__:trials:24 - Trial = 26536/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.141 | DEBUG    | __main__:trials:29 - Trial = 26536/30000 | Total reward = 38.04
2022-01-26 14:18:35.145 | DEBUG    | __main__:trials:24 - Trial = 26537/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.146 | DEBUG    | __main__:trials:29 - Trial = 26537/30000 | Total reward = 41.14
2022-01-26 14:18:35.150 | DEBUG    | __main__:trials:24 - Trial = 26538/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.151 | DEBUG    | __main__:trials:29 - Trial = 26538/30000 | Total reward = 48.08
2022-01-26 14:18:35.155 | DEBUG    | __main__:trials:24 - Trial = 26539/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.157 | DEBUG    | __main__:trials:29 - Trial = 26539/30000 | Total reward = 29.52
2022-01-26 14:18:35.160 | DEBUG    | __main__:trials:24 - Trial = 26540/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.162 | DEBUG    | __main__:trials:29 - Trial = 26540/30000 | Total reward = 33.51
2022-01-26 14:18:35.165 | DEBUG    | __main__:trials:24 - Trial = 26541/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.166 | DEBUG    | __main__:trials:29 - Trial = 26541/30000 | Total reward = 37.97
2022-01-26 14:18:35.170 | DEBUG    | __main__:trials:24 - Trial = 26542/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.172 | DEBUG    | __main__:trials:29 - Trial = 26542/30000 | Total reward = 25.59
2022-01-26 14:18:35.175 | DEBUG    | __main__:trials:24 - Trial = 26543/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.176 | DEBUG    | __main__:trials:29 - Trial = 26543/30000 | Total reward = 32.11
2022-01-26 14:18:35.179 | DEBUG    | __main__:trials:24 - Trial = 26544/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.181 | DEBUG    | __main__:trials:29 - Trial = 26544/30000 | Total reward = 41.66
2022-01-26 14:18:35.185 | DEBUG    | __main__:trials:24 - Trial = 26545/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.185 | DEBUG    | __main__:trials:29 - Trial = 26545/30000 | Total reward = 43.71
2022-01-26 14:18:35.190 | DEBUG    | __main__:trials:24 - Trial = 26546/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.191 | DEBUG    | __main__:trials:29 - Trial = 26546/30000 | Total reward = 42.01
2022-01-26 14:18:35.194 | DEBUG    | __main__:trials:24 - Trial = 26547/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.196 | DEBUG    | __main__:trials:29 - Trial = 26547/30000 | Total reward = 23.34
2022-01-26 14:18:35.199 | DEBUG    | __main__:trials:24 - Trial = 26548/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.199 | DEBUG    | __main__:trials:29 - Trial = 26548/30000 | Total reward = 50.32
2022-01-26 14:18:35.203 | DEBUG    | __main__:trials:24 - Trial = 26549/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.205 | DEBUG    | __main__:trials:29 - Trial = 26549/30000 | Total reward = 41.82
2022-01-26 14:18:35.207 | DEBUG    | __main__:trials:24 - Trial = 26550/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.209 | DEBUG    | __main__:trials:29 - Trial = 26550/30000 | Total reward = 25.96
2022-01-26 14:18:35.212 | DEBUG    | __main__:trials:24 - Trial = 26551/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.212 | DEBUG    | __main__:trials:29 - Trial = 26551/30000 | Total reward = 40.56
2022-01-26 14:18:35.216 | DEBUG    | __main__:trials:24 - Trial = 26552/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.217 | DEBUG    | __main__:trials:29 - Trial = 26552/30000 | Total reward = 39.85
2022-01-26 14:18:35.221 | DEBUG    | __main__:trials:24 - Trial = 26553/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.222 | DEBUG    | __main__:trials:29 - Trial = 26553/30000 | Total reward = 24.15
2022-01-26 14:18:35.225 | DEBUG    | __main__:trials:24 - Trial = 26554/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.227 | DEBUG    | __main__:trials:29 - Trial = 26554/30000 | Total reward = 34.44
2022-01-26 14:18:35.230 | DEBUG    | __main__:trials:24 - Trial = 26555/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.232 | DEBUG    | __main__:trials:29 - Trial = 26555/30000 | Total reward = 43.83
2022-01-26 14:18:35.234 | DEBUG    | __main__:trials:24 - Trial = 26556/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.236 | DEBUG    | __main__:trials:29 - Trial = 26556/30000 | Total reward = 51.47
2022-01-26 14:18:35.239 | DEBUG    | __main__:trials:24 - Trial = 26557/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.241 | DEBUG    | __main__:trials:29 - Trial = 26557/30000 | Total reward = 23.23
2022-01-26 14:18:35.244 | DEBUG    | __main__:trials:24 - Trial = 26558/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.245 | DEBUG    | __main__:trials:29 - Trial = 26558/30000 | Total reward = 33.72
2022-01-26 14:18:35.248 | DEBUG    | __main__:trials:24 - Trial = 26559/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.250 | DEBUG    | __main__:trials:29 - Trial = 26559/30000 | Total reward = 41.46
2022-01-26 14:18:35.253 | DEBUG    | __main__:trials:24 - Trial = 26560/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.254 | DEBUG    | __main__:trials:29 - Trial = 26560/30000 | Total reward = 46.25
2022-01-26 14:18:35.258 | DEBUG    | __main__:trials:24 - Trial = 26561/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.259 | DEBUG    | __main__:trials:29 - Trial = 26561/30000 | Total reward = 35.81
2022-01-26 14:18:35.263 | DEBUG    | __main__:trials:24 - Trial = 26562/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.263 | DEBUG    | __main__:trials:29 - Trial = 26562/30000 | Total reward = 47.66
2022-01-26 14:18:35.267 | DEBUG    | __main__:trials:24 - Trial = 26563/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.269 | DEBUG    | __main__:trials:29 - Trial = 26563/30000 | Total reward = 30.82
2022-01-26 14:18:35.272 | DEBUG    | __main__:trials:24 - Trial = 26564/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.273 | DEBUG    | __main__:trials:29 - Trial = 26564/30000 | Total reward = 43.65
2022-01-26 14:18:35.276 | DEBUG    | __main__:trials:24 - Trial = 26565/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.278 | DEBUG    | __main__:trials:29 - Trial = 26565/30000 | Total reward = 37.05
2022-01-26 14:18:35.282 | DEBUG    | __main__:trials:24 - Trial = 26566/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.282 | DEBUG    | __main__:trials:29 - Trial = 26566/30000 | Total reward = 44.64
2022-01-26 14:18:35.286 | DEBUG    | __main__:trials:24 - Trial = 26567/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.286 | DEBUG    | __main__:trials:29 - Trial = 26567/30000 | Total reward = 37.51
2022-01-26 14:18:35.290 | DEBUG    | __main__:trials:24 - Trial = 26568/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.291 | DEBUG    | __main__:trials:29 - Trial = 26568/30000 | Total reward = 29.46
2022-01-26 14:18:35.295 | DEBUG    | __main__:trials:24 - Trial = 26569/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.296 | DEBUG    | __main__:trials:29 - Trial = 26569/30000 | Total reward = 45.03
2022-01-26 14:18:35.300 | DEBUG    | __main__:trials:24 - Trial = 26570/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.302 | DEBUG    | __main__:trials:29 - Trial = 26570/30000 | Total reward = 45.37
2022-01-26 14:18:35.306 | DEBUG    | __main__:trials:24 - Trial = 26571/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.307 | DEBUG    | __main__:trials:29 - Trial = 26571/30000 | Total reward = 28.46
2022-01-26 14:18:35.311 | DEBUG    | __main__:trials:24 - Trial = 26572/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.312 | DEBUG    | __main__:trials:29 - Trial = 26572/30000 | Total reward = 41.37
2022-01-26 14:18:35.316 | DEBUG    | __main__:trials:26 - Trial = 26573/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.317 | DEBUG    | __main__:trials:29 - Trial = 26573/30000 | Total reward = 26.08
2022-01-26 14:18:35.321 | DEBUG    | __main__:trials:24 - Trial = 26574/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.322 | DEBUG    | __main__:trials:29 - Trial = 26574/30000 | Total reward = 45.86
2022-01-26 14:18:35.326 | DEBUG    | __main__:trials:24 - Trial = 26575/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.327 | DEBUG    | __main__:trials:29 - Trial = 26575/30000 | Total reward = 37.61
2022-01-26 14:18:35.331 | DEBUG    | __main__:trials:24 - Trial = 26576/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.332 | DEBUG    | __main__:trials:29 - Trial = 26576/30000 | Total reward = 31.34
2022-01-26 14:18:35.336 | DEBUG    | __main__:trials:24 - Trial = 26577/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.337 | DEBUG    | __main__:trials:29 - Trial = 26577/30000 | Total reward = 42.48
2022-01-26 14:18:35.340 | DEBUG    | __main__:trials:24 - Trial = 26578/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.342 | DEBUG    | __main__:trials:29 - Trial = 26578/30000 | Total reward = 29.16
2022-01-26 14:18:35.346 | DEBUG    | __main__:trials:24 - Trial = 26579/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.346 | DEBUG    | __main__:trials:29 - Trial = 26579/30000 | Total reward = 38.42
2022-01-26 14:18:35.350 | DEBUG    | __main__:trials:24 - Trial = 26580/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.352 | DEBUG    | __main__:trials:29 - Trial = 26580/30000 | Total reward = 42.15
2022-01-26 14:18:35.355 | DEBUG    | __main__:trials:24 - Trial = 26581/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.356 | DEBUG    | __main__:trials:29 - Trial = 26581/30000 | Total reward = 25.70
2022-01-26 14:18:35.359 | DEBUG    | __main__:trials:24 - Trial = 26582/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.361 | DEBUG    | __main__:trials:29 - Trial = 26582/30000 | Total reward = 46.17
2022-01-26 14:18:35.365 | DEBUG    | __main__:trials:24 - Trial = 26583/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.365 | DEBUG    | __main__:trials:29 - Trial = 26583/30000 | Total reward = 37.96
2022-01-26 14:18:35.370 | DEBUG    | __main__:trials:24 - Trial = 26584/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.371 | DEBUG    | __main__:trials:29 - Trial = 26584/30000 | Total reward = 47.54
2022-01-26 14:18:35.375 | DEBUG    | __main__:trials:24 - Trial = 26585/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.376 | DEBUG    | __main__:trials:29 - Trial = 26585/30000 | Total reward = 42.15
2022-01-26 14:18:35.380 | DEBUG    | __main__:trials:24 - Trial = 26586/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.381 | DEBUG    | __main__:trials:29 - Trial = 26586/30000 | Total reward = 28.18
2022-01-26 14:18:35.384 | DEBUG    | __main__:trials:26 - Trial = 26587/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.384 | DEBUG    | __main__:trials:29 - Trial = 26587/30000 | Total reward = 15.55
2022-01-26 14:18:35.388 | DEBUG    | __main__:trials:24 - Trial = 26588/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.390 | DEBUG    | __main__:trials:29 - Trial = 26588/30000 | Total reward = 38.33
2022-01-26 14:18:35.392 | DEBUG    | __main__:trials:26 - Trial = 26589/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.393 | DEBUG    | __main__:trials:29 - Trial = 26589/30000 | Total reward = 15.15
2022-01-26 14:18:35.396 | DEBUG    | __main__:trials:24 - Trial = 26590/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.398 | DEBUG    | __main__:trials:29 - Trial = 26590/30000 | Total reward = 25.24
2022-01-26 14:18:35.401 | DEBUG    | __main__:trials:24 - Trial = 26591/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.403 | DEBUG    | __main__:trials:29 - Trial = 26591/30000 | Total reward = 36.35
2022-01-26 14:18:35.407 | DEBUG    | __main__:trials:24 - Trial = 26592/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.408 | DEBUG    | __main__:trials:29 - Trial = 26592/30000 | Total reward = 36.15
2022-01-26 14:18:35.412 | DEBUG    | __main__:trials:24 - Trial = 26593/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.413 | DEBUG    | __main__:trials:29 - Trial = 26593/30000 | Total reward = 52.50
2022-01-26 14:18:35.416 | DEBUG    | __main__:trials:24 - Trial = 26594/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.418 | DEBUG    | __main__:trials:29 - Trial = 26594/30000 | Total reward = 44.90
2022-01-26 14:18:35.422 | DEBUG    | __main__:trials:24 - Trial = 26595/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.422 | DEBUG    | __main__:trials:29 - Trial = 26595/30000 | Total reward = 43.75
2022-01-26 14:18:35.427 | DEBUG    | __main__:trials:24 - Trial = 26596/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.427 | DEBUG    | __main__:trials:29 - Trial = 26596/30000 | Total reward = 43.70
2022-01-26 14:18:35.432 | DEBUG    | __main__:trials:24 - Trial = 26597/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.433 | DEBUG    | __main__:trials:29 - Trial = 26597/30000 | Total reward = 43.54
2022-01-26 14:18:35.436 | DEBUG    | __main__:trials:24 - Trial = 26598/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.438 | DEBUG    | __main__:trials:29 - Trial = 26598/30000 | Total reward = 37.43
2022-01-26 14:18:35.441 | DEBUG    | __main__:trials:24 - Trial = 26599/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.442 | DEBUG    | __main__:trials:29 - Trial = 26599/30000 | Total reward = 43.85
2022-01-26 14:18:35.446 | DEBUG    | __main__:trials:24 - Trial = 26600/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.448 | DEBUG    | __main__:trials:29 - Trial = 26600/30000 | Total reward = 14.09
2022-01-26 14:18:35.451 | DEBUG    | __main__:trials:24 - Trial = 26601/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.453 | DEBUG    | __main__:trials:29 - Trial = 26601/30000 | Total reward = 36.13
2022-01-26 14:18:35.457 | DEBUG    | __main__:trials:24 - Trial = 26602/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.458 | DEBUG    | __main__:trials:29 - Trial = 26602/30000 | Total reward = 42.37
2022-01-26 14:18:35.462 | DEBUG    | __main__:trials:24 - Trial = 26603/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.463 | DEBUG    | __main__:trials:29 - Trial = 26603/30000 | Total reward = 26.99
2022-01-26 14:18:35.466 | DEBUG    | __main__:trials:24 - Trial = 26604/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.468 | DEBUG    | __main__:trials:29 - Trial = 26604/30000 | Total reward = 45.87
2022-01-26 14:18:35.472 | DEBUG    | __main__:trials:24 - Trial = 26605/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.472 | DEBUG    | __main__:trials:29 - Trial = 26605/30000 | Total reward = 29.06
2022-01-26 14:18:35.476 | DEBUG    | __main__:trials:24 - Trial = 26606/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.478 | DEBUG    | __main__:trials:29 - Trial = 26606/30000 | Total reward = 19.56
2022-01-26 14:18:35.481 | DEBUG    | __main__:trials:24 - Trial = 26607/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.483 | DEBUG    | __main__:trials:29 - Trial = 26607/30000 | Total reward = 19.51
2022-01-26 14:18:35.486 | DEBUG    | __main__:trials:24 - Trial = 26608/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.487 | DEBUG    | __main__:trials:29 - Trial = 26608/30000 | Total reward = 38.39
2022-01-26 14:18:35.491 | DEBUG    | __main__:trials:24 - Trial = 26609/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.491 | DEBUG    | __main__:trials:29 - Trial = 26609/30000 | Total reward = 47.53
2022-01-26 14:18:35.495 | DEBUG    | __main__:trials:24 - Trial = 26610/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.496 | DEBUG    | __main__:trials:29 - Trial = 26610/30000 | Total reward = 41.30
2022-01-26 14:18:35.500 | DEBUG    | __main__:trials:24 - Trial = 26611/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.501 | DEBUG    | __main__:trials:29 - Trial = 26611/30000 | Total reward = 31.03
2022-01-26 14:18:35.504 | DEBUG    | __main__:trials:24 - Trial = 26612/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.505 | DEBUG    | __main__:trials:29 - Trial = 26612/30000 | Total reward = 25.34
2022-01-26 14:18:35.509 | DEBUG    | __main__:trials:24 - Trial = 26613/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.509 | DEBUG    | __main__:trials:29 - Trial = 26613/30000 | Total reward = 31.27
2022-01-26 14:18:35.513 | DEBUG    | __main__:trials:24 - Trial = 26614/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.514 | DEBUG    | __main__:trials:29 - Trial = 26614/30000 | Total reward = 40.77
2022-01-26 14:18:35.516 | DEBUG    | __main__:trials:26 - Trial = 26615/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.518 | DEBUG    | __main__:trials:29 - Trial = 26615/30000 | Total reward = 9.39
2022-01-26 14:18:35.521 | DEBUG    | __main__:trials:24 - Trial = 26616/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.523 | DEBUG    | __main__:trials:29 - Trial = 26616/30000 | Total reward = 22.23
2022-01-26 14:18:35.526 | DEBUG    | __main__:trials:24 - Trial = 26617/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.527 | DEBUG    | __main__:trials:29 - Trial = 26617/30000 | Total reward = 29.42
2022-01-26 14:18:35.531 | DEBUG    | __main__:trials:24 - Trial = 26618/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.532 | DEBUG    | __main__:trials:29 - Trial = 26618/30000 | Total reward = 32.32
2022-01-26 14:18:35.536 | DEBUG    | __main__:trials:24 - Trial = 26619/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.537 | DEBUG    | __main__:trials:29 - Trial = 26619/30000 | Total reward = 24.40
2022-01-26 14:18:35.541 | DEBUG    | __main__:trials:24 - Trial = 26620/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.543 | DEBUG    | __main__:trials:29 - Trial = 26620/30000 | Total reward = 41.46
2022-01-26 14:18:35.546 | DEBUG    | __main__:trials:24 - Trial = 26621/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.548 | DEBUG    | __main__:trials:29 - Trial = 26621/30000 | Total reward = 35.73
2022-01-26 14:18:35.551 | DEBUG    | __main__:trials:24 - Trial = 26622/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.552 | DEBUG    | __main__:trials:29 - Trial = 26622/30000 | Total reward = 30.88
2022-01-26 14:18:35.556 | DEBUG    | __main__:trials:24 - Trial = 26623/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.557 | DEBUG    | __main__:trials:29 - Trial = 26623/30000 | Total reward = 37.11
2022-01-26 14:18:35.561 | DEBUG    | __main__:trials:24 - Trial = 26624/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.562 | DEBUG    | __main__:trials:29 - Trial = 26624/30000 | Total reward = 46.45
2022-01-26 14:18:35.566 | DEBUG    | __main__:trials:24 - Trial = 26625/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.567 | DEBUG    | __main__:trials:29 - Trial = 26625/30000 | Total reward = 35.41
2022-01-26 14:18:35.571 | DEBUG    | __main__:trials:24 - Trial = 26626/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.573 | DEBUG    | __main__:trials:29 - Trial = 26626/30000 | Total reward = 37.64
2022-01-26 14:18:35.576 | DEBUG    | __main__:trials:24 - Trial = 26627/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.578 | DEBUG    | __main__:trials:29 - Trial = 26627/30000 | Total reward = 42.17
2022-01-26 14:18:35.582 | DEBUG    | __main__:trials:24 - Trial = 26628/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.582 | DEBUG    | __main__:trials:29 - Trial = 26628/30000 | Total reward = 34.42
2022-01-26 14:18:35.587 | DEBUG    | __main__:trials:24 - Trial = 26629/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.587 | DEBUG    | __main__:trials:29 - Trial = 26629/30000 | Total reward = 42.38
2022-01-26 14:18:35.592 | DEBUG    | __main__:trials:24 - Trial = 26630/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.593 | DEBUG    | __main__:trials:29 - Trial = 26630/30000 | Total reward = 29.88
2022-01-26 14:18:35.597 | DEBUG    | __main__:trials:24 - Trial = 26631/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.597 | DEBUG    | __main__:trials:29 - Trial = 26631/30000 | Total reward = 40.59
2022-01-26 14:18:35.601 | DEBUG    | __main__:trials:24 - Trial = 26632/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.602 | DEBUG    | __main__:trials:29 - Trial = 26632/30000 | Total reward = 43.38
2022-01-26 14:18:35.606 | DEBUG    | __main__:trials:24 - Trial = 26633/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.606 | DEBUG    | __main__:trials:29 - Trial = 26633/30000 | Total reward = 35.65
2022-01-26 14:18:35.611 | DEBUG    | __main__:trials:24 - Trial = 26634/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.612 | DEBUG    | __main__:trials:29 - Trial = 26634/30000 | Total reward = 41.74
2022-01-26 14:18:35.616 | DEBUG    | __main__:trials:24 - Trial = 26635/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.617 | DEBUG    | __main__:trials:29 - Trial = 26635/30000 | Total reward = 35.83
2022-01-26 14:18:35.621 | DEBUG    | __main__:trials:24 - Trial = 26636/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.622 | DEBUG    | __main__:trials:29 - Trial = 26636/30000 | Total reward = 29.01
2022-01-26 14:18:35.626 | DEBUG    | __main__:trials:24 - Trial = 26637/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.627 | DEBUG    | __main__:trials:29 - Trial = 26637/30000 | Total reward = 45.53
2022-01-26 14:18:35.631 | DEBUG    | __main__:trials:24 - Trial = 26638/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.633 | DEBUG    | __main__:trials:29 - Trial = 26638/30000 | Total reward = 40.28
2022-01-26 14:18:35.636 | DEBUG    | __main__:trials:24 - Trial = 26639/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.637 | DEBUG    | __main__:trials:29 - Trial = 26639/30000 | Total reward = 43.94
2022-01-26 14:18:35.641 | DEBUG    | __main__:trials:24 - Trial = 26640/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.642 | DEBUG    | __main__:trials:29 - Trial = 26640/30000 | Total reward = 29.82
2022-01-26 14:18:35.647 | DEBUG    | __main__:trials:24 - Trial = 26641/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.647 | DEBUG    | __main__:trials:29 - Trial = 26641/30000 | Total reward = 32.76
2022-01-26 14:18:35.652 | DEBUG    | __main__:trials:24 - Trial = 26642/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.653 | DEBUG    | __main__:trials:29 - Trial = 26642/30000 | Total reward = 47.01
2022-01-26 14:18:35.656 | DEBUG    | __main__:trials:26 - Trial = 26643/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.657 | DEBUG    | __main__:trials:29 - Trial = 26643/30000 | Total reward = 15.09
2022-01-26 14:18:35.660 | DEBUG    | __main__:trials:24 - Trial = 26644/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.662 | DEBUG    | __main__:trials:29 - Trial = 26644/30000 | Total reward = 31.40
2022-01-26 14:18:35.666 | DEBUG    | __main__:trials:24 - Trial = 26645/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.666 | DEBUG    | __main__:trials:29 - Trial = 26645/30000 | Total reward = 35.60
2022-01-26 14:18:35.670 | DEBUG    | __main__:trials:24 - Trial = 26646/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.671 | DEBUG    | __main__:trials:29 - Trial = 26646/30000 | Total reward = 36.36
2022-01-26 14:18:35.675 | DEBUG    | __main__:trials:24 - Trial = 26647/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.677 | DEBUG    | __main__:trials:29 - Trial = 26647/30000 | Total reward = 35.74
2022-01-26 14:18:35.680 | DEBUG    | __main__:trials:24 - Trial = 26648/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.682 | DEBUG    | __main__:trials:29 - Trial = 26648/30000 | Total reward = 41.80
2022-01-26 14:18:35.685 | DEBUG    | __main__:trials:24 - Trial = 26649/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.686 | DEBUG    | __main__:trials:29 - Trial = 26649/30000 | Total reward = 41.28
2022-01-26 14:18:35.691 | DEBUG    | __main__:trials:24 - Trial = 26650/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.691 | DEBUG    | __main__:trials:29 - Trial = 26650/30000 | Total reward = 36.56
2022-01-26 14:18:35.696 | DEBUG    | __main__:trials:24 - Trial = 26651/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.697 | DEBUG    | __main__:trials:29 - Trial = 26651/30000 | Total reward = 37.70
2022-01-26 14:18:35.701 | DEBUG    | __main__:trials:24 - Trial = 26652/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.702 | DEBUG    | __main__:trials:29 - Trial = 26652/30000 | Total reward = 34.80
2022-01-26 14:18:35.705 | DEBUG    | __main__:trials:24 - Trial = 26653/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.707 | DEBUG    | __main__:trials:29 - Trial = 26653/30000 | Total reward = 30.17
2022-01-26 14:18:35.710 | DEBUG    | __main__:trials:26 - Trial = 26654/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.711 | DEBUG    | __main__:trials:29 - Trial = 26654/30000 | Total reward = 13.14
2022-01-26 14:18:35.715 | DEBUG    | __main__:trials:24 - Trial = 26655/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.717 | DEBUG    | __main__:trials:29 - Trial = 26655/30000 | Total reward = 25.60
2022-01-26 14:18:35.720 | DEBUG    | __main__:trials:24 - Trial = 26656/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.721 | DEBUG    | __main__:trials:29 - Trial = 26656/30000 | Total reward = 26.72
2022-01-26 14:18:35.726 | DEBUG    | __main__:trials:24 - Trial = 26657/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.726 | DEBUG    | __main__:trials:29 - Trial = 26657/30000 | Total reward = 15.66
2022-01-26 14:18:35.730 | DEBUG    | __main__:trials:26 - Trial = 26658/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.731 | DEBUG    | __main__:trials:29 - Trial = 26658/30000 | Total reward = 13.92
2022-01-26 14:18:35.736 | DEBUG    | __main__:trials:24 - Trial = 26659/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.737 | DEBUG    | __main__:trials:29 - Trial = 26659/30000 | Total reward = 38.15
2022-01-26 14:18:35.740 | DEBUG    | __main__:trials:24 - Trial = 26660/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.742 | DEBUG    | __main__:trials:29 - Trial = 26660/30000 | Total reward = 42.94
2022-01-26 14:18:35.746 | DEBUG    | __main__:trials:24 - Trial = 26661/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.746 | DEBUG    | __main__:trials:29 - Trial = 26661/30000 | Total reward = 46.43
2022-01-26 14:18:35.750 | DEBUG    | __main__:trials:26 - Trial = 26662/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.751 | DEBUG    | __main__:trials:29 - Trial = 26662/30000 | Total reward = 11.81
2022-01-26 14:18:35.755 | DEBUG    | __main__:trials:24 - Trial = 26663/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.756 | DEBUG    | __main__:trials:29 - Trial = 26663/30000 | Total reward = 27.37
2022-01-26 14:18:35.759 | DEBUG    | __main__:trials:24 - Trial = 26664/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.761 | DEBUG    | __main__:trials:29 - Trial = 26664/30000 | Total reward = 25.94
2022-01-26 14:18:35.764 | DEBUG    | __main__:trials:24 - Trial = 26665/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.765 | DEBUG    | __main__:trials:29 - Trial = 26665/30000 | Total reward = 28.25
2022-01-26 14:18:35.769 | DEBUG    | __main__:trials:24 - Trial = 26666/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.770 | DEBUG    | __main__:trials:29 - Trial = 26666/30000 | Total reward = 27.29
2022-01-26 14:18:35.773 | DEBUG    | __main__:trials:26 - Trial = 26667/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.775 | DEBUG    | __main__:trials:29 - Trial = 26667/30000 | Total reward = 13.33
2022-01-26 14:18:35.778 | DEBUG    | __main__:trials:24 - Trial = 26668/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.779 | DEBUG    | __main__:trials:29 - Trial = 26668/30000 | Total reward = 36.15
2022-01-26 14:18:35.782 | DEBUG    | __main__:trials:26 - Trial = 26669/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.783 | DEBUG    | __main__:trials:29 - Trial = 26669/30000 | Total reward = 18.20
2022-01-26 14:18:35.787 | DEBUG    | __main__:trials:26 - Trial = 26670/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.788 | DEBUG    | __main__:trials:29 - Trial = 26670/30000 | Total reward = 17.49
2022-01-26 14:18:35.792 | DEBUG    | __main__:trials:24 - Trial = 26671/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.793 | DEBUG    | __main__:trials:29 - Trial = 26671/30000 | Total reward = 29.36
2022-01-26 14:18:35.797 | DEBUG    | __main__:trials:24 - Trial = 26672/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.797 | DEBUG    | __main__:trials:29 - Trial = 26672/30000 | Total reward = 20.94
2022-01-26 14:18:35.801 | DEBUG    | __main__:trials:24 - Trial = 26673/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.803 | DEBUG    | __main__:trials:29 - Trial = 26673/30000 | Total reward = 29.70
2022-01-26 14:18:35.806 | DEBUG    | __main__:trials:24 - Trial = 26674/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.808 | DEBUG    | __main__:trials:29 - Trial = 26674/30000 | Total reward = 15.25
2022-01-26 14:18:35.811 | DEBUG    | __main__:trials:24 - Trial = 26675/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.813 | DEBUG    | __main__:trials:29 - Trial = 26675/30000 | Total reward = 25.88
2022-01-26 14:18:35.816 | DEBUG    | __main__:trials:24 - Trial = 26676/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.817 | DEBUG    | __main__:trials:29 - Trial = 26676/30000 | Total reward = 25.21
2022-01-26 14:18:35.820 | DEBUG    | __main__:trials:24 - Trial = 26677/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.821 | DEBUG    | __main__:trials:29 - Trial = 26677/30000 | Total reward = 23.44
2022-01-26 14:18:35.825 | DEBUG    | __main__:trials:24 - Trial = 26678/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.826 | DEBUG    | __main__:trials:29 - Trial = 26678/30000 | Total reward = 34.56
2022-01-26 14:18:35.830 | DEBUG    | __main__:trials:24 - Trial = 26679/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.831 | DEBUG    | __main__:trials:29 - Trial = 26679/30000 | Total reward = 25.19
2022-01-26 14:18:35.834 | DEBUG    | __main__:trials:24 - Trial = 26680/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.836 | DEBUG    | __main__:trials:29 - Trial = 26680/30000 | Total reward = 27.13
2022-01-26 14:18:35.839 | DEBUG    | __main__:trials:26 - Trial = 26681/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.841 | DEBUG    | __main__:trials:29 - Trial = 26681/30000 | Total reward = 20.39
2022-01-26 14:18:35.844 | DEBUG    | __main__:trials:26 - Trial = 26682/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.845 | DEBUG    | __main__:trials:29 - Trial = 26682/30000 | Total reward = 18.69
2022-01-26 14:18:35.849 | DEBUG    | __main__:trials:24 - Trial = 26683/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.850 | DEBUG    | __main__:trials:29 - Trial = 26683/30000 | Total reward = 17.95
2022-01-26 14:18:35.853 | DEBUG    | __main__:trials:24 - Trial = 26684/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.855 | DEBUG    | __main__:trials:29 - Trial = 26684/30000 | Total reward = 25.72
2022-01-26 14:18:35.858 | DEBUG    | __main__:trials:24 - Trial = 26685/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.860 | DEBUG    | __main__:trials:29 - Trial = 26685/30000 | Total reward = 41.05
2022-01-26 14:18:35.863 | DEBUG    | __main__:trials:24 - Trial = 26686/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.865 | DEBUG    | __main__:trials:29 - Trial = 26686/30000 | Total reward = 18.39
2022-01-26 14:18:35.868 | DEBUG    | __main__:trials:24 - Trial = 26687/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.870 | DEBUG    | __main__:trials:29 - Trial = 26687/30000 | Total reward = 24.34
2022-01-26 14:18:35.873 | DEBUG    | __main__:trials:24 - Trial = 26688/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.874 | DEBUG    | __main__:trials:29 - Trial = 26688/30000 | Total reward = 20.30
2022-01-26 14:18:35.877 | DEBUG    | __main__:trials:26 - Trial = 26689/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.877 | DEBUG    | __main__:trials:29 - Trial = 26689/30000 | Total reward = 26.81
2022-01-26 14:18:35.881 | DEBUG    | __main__:trials:24 - Trial = 26690/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.883 | DEBUG    | __main__:trials:29 - Trial = 26690/30000 | Total reward = 47.09
2022-01-26 14:18:35.886 | DEBUG    | __main__:trials:24 - Trial = 26691/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.887 | DEBUG    | __main__:trials:29 - Trial = 26691/30000 | Total reward = 25.44
2022-01-26 14:18:35.890 | DEBUG    | __main__:trials:24 - Trial = 26692/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.892 | DEBUG    | __main__:trials:29 - Trial = 26692/30000 | Total reward = 24.97
2022-01-26 14:18:35.895 | DEBUG    | __main__:trials:24 - Trial = 26693/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.896 | DEBUG    | __main__:trials:29 - Trial = 26693/30000 | Total reward = 30.45
2022-01-26 14:18:35.900 | DEBUG    | __main__:trials:24 - Trial = 26694/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.901 | DEBUG    | __main__:trials:29 - Trial = 26694/30000 | Total reward = 25.02
2022-01-26 14:18:35.904 | DEBUG    | __main__:trials:24 - Trial = 26695/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.906 | DEBUG    | __main__:trials:29 - Trial = 26695/30000 | Total reward = 25.49
2022-01-26 14:18:35.909 | DEBUG    | __main__:trials:26 - Trial = 26696/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.910 | DEBUG    | __main__:trials:29 - Trial = 26696/30000 | Total reward = 20.81
2022-01-26 14:18:35.913 | DEBUG    | __main__:trials:24 - Trial = 26697/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.915 | DEBUG    | __main__:trials:29 - Trial = 26697/30000 | Total reward = 26.72
2022-01-26 14:18:35.918 | DEBUG    | __main__:trials:26 - Trial = 26698/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.918 | DEBUG    | __main__:trials:29 - Trial = 26698/30000 | Total reward = 16.20
2022-01-26 14:18:35.922 | DEBUG    | __main__:trials:24 - Trial = 26699/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.923 | DEBUG    | __main__:trials:29 - Trial = 26699/30000 | Total reward = 44.82
2022-01-26 14:18:35.927 | DEBUG    | __main__:trials:24 - Trial = 26700/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.928 | DEBUG    | __main__:trials:29 - Trial = 26700/30000 | Total reward = 26.89
2022-01-26 14:18:35.932 | DEBUG    | __main__:trials:24 - Trial = 26701/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.933 | DEBUG    | __main__:trials:29 - Trial = 26701/30000 | Total reward = 25.94
2022-01-26 14:18:35.936 | DEBUG    | __main__:trials:24 - Trial = 26702/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.938 | DEBUG    | __main__:trials:29 - Trial = 26702/30000 | Total reward = 23.06
2022-01-26 14:18:35.941 | DEBUG    | __main__:trials:26 - Trial = 26703/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.942 | DEBUG    | __main__:trials:29 - Trial = 26703/30000 | Total reward = 18.04
2022-01-26 14:18:35.946 | DEBUG    | __main__:trials:26 - Trial = 26704/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.947 | DEBUG    | __main__:trials:29 - Trial = 26704/30000 | Total reward = 15.46
2022-01-26 14:18:35.949 | DEBUG    | __main__:trials:26 - Trial = 26705/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.951 | DEBUG    | __main__:trials:29 - Trial = 26705/30000 | Total reward = 12.87
2022-01-26 14:18:35.955 | DEBUG    | __main__:trials:24 - Trial = 26706/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.957 | DEBUG    | __main__:trials:29 - Trial = 26706/30000 | Total reward = 18.51
2022-01-26 14:18:35.959 | DEBUG    | __main__:trials:24 - Trial = 26707/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.961 | DEBUG    | __main__:trials:29 - Trial = 26707/30000 | Total reward = 20.52
2022-01-26 14:18:35.963 | DEBUG    | __main__:trials:26 - Trial = 26708/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.964 | DEBUG    | __main__:trials:29 - Trial = 26708/30000 | Total reward = 12.28
2022-01-26 14:18:35.968 | DEBUG    | __main__:trials:24 - Trial = 26709/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.970 | DEBUG    | __main__:trials:29 - Trial = 26709/30000 | Total reward = 32.43
2022-01-26 14:18:35.973 | DEBUG    | __main__:trials:26 - Trial = 26710/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:35.974 | DEBUG    | __main__:trials:29 - Trial = 26710/30000 | Total reward = 15.30
2022-01-26 14:18:35.978 | DEBUG    | __main__:trials:24 - Trial = 26711/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.980 | DEBUG    | __main__:trials:29 - Trial = 26711/30000 | Total reward = 34.47
2022-01-26 14:18:35.984 | DEBUG    | __main__:trials:24 - Trial = 26712/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.985 | DEBUG    | __main__:trials:29 - Trial = 26712/30000 | Total reward = 27.37
2022-01-26 14:18:35.989 | DEBUG    | __main__:trials:24 - Trial = 26713/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.991 | DEBUG    | __main__:trials:29 - Trial = 26713/30000 | Total reward = 49.87
2022-01-26 14:18:35.993 | DEBUG    | __main__:trials:24 - Trial = 26714/30000 | Max number of steps (20) reached
2022-01-26 14:18:35.995 | DEBUG    | __main__:trials:29 - Trial = 26714/30000 | Total reward = 37.25
2022-01-26 14:18:35.999 | DEBUG    | __main__:trials:24 - Trial = 26715/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.000 | DEBUG    | __main__:trials:29 - Trial = 26715/30000 | Total reward = 37.81
2022-01-26 14:18:36.004 | DEBUG    | __main__:trials:24 - Trial = 26716/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.005 | DEBUG    | __main__:trials:29 - Trial = 26716/30000 | Total reward = 41.12
2022-01-26 14:18:36.009 | DEBUG    | __main__:trials:24 - Trial = 26717/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.010 | DEBUG    | __main__:trials:29 - Trial = 26717/30000 | Total reward = 19.91
2022-01-26 14:18:36.013 | DEBUG    | __main__:trials:26 - Trial = 26718/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.014 | DEBUG    | __main__:trials:29 - Trial = 26718/30000 | Total reward = 15.50
2022-01-26 14:18:36.017 | DEBUG    | __main__:trials:24 - Trial = 26719/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.018 | DEBUG    | __main__:trials:29 - Trial = 26719/30000 | Total reward = 42.48
2022-01-26 14:18:36.022 | DEBUG    | __main__:trials:24 - Trial = 26720/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.024 | DEBUG    | __main__:trials:29 - Trial = 26720/30000 | Total reward = 30.24
2022-01-26 14:18:36.028 | DEBUG    | __main__:trials:24 - Trial = 26721/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.029 | DEBUG    | __main__:trials:29 - Trial = 26721/30000 | Total reward = 32.15
2022-01-26 14:18:36.032 | DEBUG    | __main__:trials:26 - Trial = 26722/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.034 | DEBUG    | __main__:trials:29 - Trial = 26722/30000 | Total reward = 14.41
2022-01-26 14:18:36.037 | DEBUG    | __main__:trials:26 - Trial = 26723/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.039 | DEBUG    | __main__:trials:29 - Trial = 26723/30000 | Total reward = 22.78
2022-01-26 14:18:36.043 | DEBUG    | __main__:trials:24 - Trial = 26724/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.044 | DEBUG    | __main__:trials:29 - Trial = 26724/30000 | Total reward = 48.90
2022-01-26 14:18:36.048 | DEBUG    | __main__:trials:24 - Trial = 26725/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.049 | DEBUG    | __main__:trials:29 - Trial = 26725/30000 | Total reward = 10.89
2022-01-26 14:18:36.053 | DEBUG    | __main__:trials:24 - Trial = 26726/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.055 | DEBUG    | __main__:trials:29 - Trial = 26726/30000 | Total reward = 36.80
2022-01-26 14:18:36.058 | DEBUG    | __main__:trials:26 - Trial = 26727/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.059 | DEBUG    | __main__:trials:29 - Trial = 26727/30000 | Total reward = 13.65
2022-01-26 14:18:36.063 | DEBUG    | __main__:trials:24 - Trial = 26728/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.064 | DEBUG    | __main__:trials:29 - Trial = 26728/30000 | Total reward = 20.33
2022-01-26 14:18:36.067 | DEBUG    | __main__:trials:24 - Trial = 26729/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.069 | DEBUG    | __main__:trials:29 - Trial = 26729/30000 | Total reward = 25.94
2022-01-26 14:18:36.073 | DEBUG    | __main__:trials:24 - Trial = 26730/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.074 | DEBUG    | __main__:trials:29 - Trial = 26730/30000 | Total reward = 48.74
2022-01-26 14:18:36.077 | DEBUG    | __main__:trials:24 - Trial = 26731/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.078 | DEBUG    | __main__:trials:29 - Trial = 26731/30000 | Total reward = 15.12
2022-01-26 14:18:36.082 | DEBUG    | __main__:trials:26 - Trial = 26732/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.083 | DEBUG    | __main__:trials:29 - Trial = 26732/30000 | Total reward = 14.95
2022-01-26 14:18:36.087 | DEBUG    | __main__:trials:24 - Trial = 26733/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.089 | DEBUG    | __main__:trials:29 - Trial = 26733/30000 | Total reward = 27.37
2022-01-26 14:18:36.092 | DEBUG    | __main__:trials:24 - Trial = 26734/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.093 | DEBUG    | __main__:trials:29 - Trial = 26734/30000 | Total reward = 29.43
2022-01-26 14:18:36.097 | DEBUG    | __main__:trials:26 - Trial = 26735/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.098 | DEBUG    | __main__:trials:29 - Trial = 26735/30000 | Total reward = 17.28
2022-01-26 14:18:36.101 | DEBUG    | __main__:trials:24 - Trial = 26736/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.102 | DEBUG    | __main__:trials:29 - Trial = 26736/30000 | Total reward = 25.72
2022-01-26 14:18:36.105 | DEBUG    | __main__:trials:26 - Trial = 26737/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.107 | DEBUG    | __main__:trials:29 - Trial = 26737/30000 | Total reward = 20.23
2022-01-26 14:18:36.110 | DEBUG    | __main__:trials:24 - Trial = 26738/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.112 | DEBUG    | __main__:trials:29 - Trial = 26738/30000 | Total reward = 27.06
2022-01-26 14:18:36.115 | DEBUG    | __main__:trials:26 - Trial = 26739/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.117 | DEBUG    | __main__:trials:29 - Trial = 26739/30000 | Total reward = 14.68
2022-01-26 14:18:36.120 | DEBUG    | __main__:trials:26 - Trial = 26740/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.121 | DEBUG    | __main__:trials:29 - Trial = 26740/30000 | Total reward = 19.29
2022-01-26 14:18:36.125 | DEBUG    | __main__:trials:24 - Trial = 26741/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.127 | DEBUG    | __main__:trials:29 - Trial = 26741/30000 | Total reward = 47.60
2022-01-26 14:18:36.131 | DEBUG    | __main__:trials:24 - Trial = 26742/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.132 | DEBUG    | __main__:trials:29 - Trial = 26742/30000 | Total reward = 40.99
2022-01-26 14:18:36.136 | DEBUG    | __main__:trials:26 - Trial = 26743/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.137 | DEBUG    | __main__:trials:29 - Trial = 26743/30000 | Total reward = 17.37
2022-01-26 14:18:36.141 | DEBUG    | __main__:trials:24 - Trial = 26744/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.142 | DEBUG    | __main__:trials:29 - Trial = 26744/30000 | Total reward = 28.16
2022-01-26 14:18:36.144 | DEBUG    | __main__:trials:26 - Trial = 26745/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.145 | DEBUG    | __main__:trials:29 - Trial = 26745/30000 | Total reward = 13.33
2022-01-26 14:18:36.148 | DEBUG    | __main__:trials:26 - Trial = 26746/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.149 | DEBUG    | __main__:trials:29 - Trial = 26746/30000 | Total reward = 18.43
2022-01-26 14:18:36.152 | DEBUG    | __main__:trials:24 - Trial = 26747/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.153 | DEBUG    | __main__:trials:29 - Trial = 26747/30000 | Total reward = 27.54
2022-01-26 14:18:36.156 | DEBUG    | __main__:trials:24 - Trial = 26748/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.157 | DEBUG    | __main__:trials:29 - Trial = 26748/30000 | Total reward = 28.66
2022-01-26 14:18:36.160 | DEBUG    | __main__:trials:24 - Trial = 26749/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.161 | DEBUG    | __main__:trials:29 - Trial = 26749/30000 | Total reward = 27.37
2022-01-26 14:18:36.164 | DEBUG    | __main__:trials:24 - Trial = 26750/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.166 | DEBUG    | __main__:trials:29 - Trial = 26750/30000 | Total reward = 13.17
2022-01-26 14:18:36.168 | DEBUG    | __main__:trials:26 - Trial = 26751/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.170 | DEBUG    | __main__:trials:29 - Trial = 26751/30000 | Total reward = 18.60
2022-01-26 14:18:36.173 | DEBUG    | __main__:trials:26 - Trial = 26752/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.175 | DEBUG    | __main__:trials:29 - Trial = 26752/30000 | Total reward = 20.37
2022-01-26 14:18:36.178 | DEBUG    | __main__:trials:24 - Trial = 26753/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.180 | DEBUG    | __main__:trials:29 - Trial = 26753/30000 | Total reward = 27.06
2022-01-26 14:18:36.183 | DEBUG    | __main__:trials:26 - Trial = 26754/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.184 | DEBUG    | __main__:trials:29 - Trial = 26754/30000 | Total reward = 11.79
2022-01-26 14:18:36.188 | DEBUG    | __main__:trials:24 - Trial = 26755/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.189 | DEBUG    | __main__:trials:29 - Trial = 26755/30000 | Total reward = 47.73
2022-01-26 14:18:36.193 | DEBUG    | __main__:trials:24 - Trial = 26756/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.194 | DEBUG    | __main__:trials:29 - Trial = 26756/30000 | Total reward = 18.30
2022-01-26 14:18:36.198 | DEBUG    | __main__:trials:24 - Trial = 26757/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.200 | DEBUG    | __main__:trials:29 - Trial = 26757/30000 | Total reward = 34.80
2022-01-26 14:18:36.203 | DEBUG    | __main__:trials:24 - Trial = 26758/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.205 | DEBUG    | __main__:trials:29 - Trial = 26758/30000 | Total reward = 27.08
2022-01-26 14:18:36.208 | DEBUG    | __main__:trials:24 - Trial = 26759/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.210 | DEBUG    | __main__:trials:29 - Trial = 26759/30000 | Total reward = 30.21
2022-01-26 14:18:36.213 | DEBUG    | __main__:trials:26 - Trial = 26760/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.215 | DEBUG    | __main__:trials:29 - Trial = 26760/30000 | Total reward = 21.84
2022-01-26 14:18:36.219 | DEBUG    | __main__:trials:24 - Trial = 26761/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.220 | DEBUG    | __main__:trials:29 - Trial = 26761/30000 | Total reward = 45.87
2022-01-26 14:18:36.223 | DEBUG    | __main__:trials:24 - Trial = 26762/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.225 | DEBUG    | __main__:trials:29 - Trial = 26762/30000 | Total reward = 31.56
2022-01-26 14:18:36.229 | DEBUG    | __main__:trials:24 - Trial = 26763/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.230 | DEBUG    | __main__:trials:29 - Trial = 26763/30000 | Total reward = 27.09
2022-01-26 14:18:36.234 | DEBUG    | __main__:trials:24 - Trial = 26764/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.235 | DEBUG    | __main__:trials:29 - Trial = 26764/30000 | Total reward = 27.02
2022-01-26 14:18:36.238 | DEBUG    | __main__:trials:24 - Trial = 26765/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.240 | DEBUG    | __main__:trials:29 - Trial = 26765/30000 | Total reward = 40.86
2022-01-26 14:18:36.244 | DEBUG    | __main__:trials:24 - Trial = 26766/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.245 | DEBUG    | __main__:trials:29 - Trial = 26766/30000 | Total reward = 22.65
2022-01-26 14:18:36.249 | DEBUG    | __main__:trials:24 - Trial = 26767/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.250 | DEBUG    | __main__:trials:29 - Trial = 26767/30000 | Total reward = 21.00
2022-01-26 14:18:36.253 | DEBUG    | __main__:trials:26 - Trial = 26768/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.255 | DEBUG    | __main__:trials:29 - Trial = 26768/30000 | Total reward = 15.48
2022-01-26 14:18:36.258 | DEBUG    | __main__:trials:24 - Trial = 26769/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.261 | DEBUG    | __main__:trials:29 - Trial = 26769/30000 | Total reward = 23.06
2022-01-26 14:18:36.265 | DEBUG    | __main__:trials:24 - Trial = 26770/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.267 | DEBUG    | __main__:trials:29 - Trial = 26770/30000 | Total reward = 18.74
2022-01-26 14:18:36.269 | DEBUG    | __main__:trials:24 - Trial = 26771/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.271 | DEBUG    | __main__:trials:29 - Trial = 26771/30000 | Total reward = 23.87
2022-01-26 14:18:36.275 | DEBUG    | __main__:trials:24 - Trial = 26772/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.277 | DEBUG    | __main__:trials:29 - Trial = 26772/30000 | Total reward = 38.73
2022-01-26 14:18:36.280 | DEBUG    | __main__:trials:26 - Trial = 26773/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.281 | DEBUG    | __main__:trials:29 - Trial = 26773/30000 | Total reward = 12.10
2022-01-26 14:18:36.284 | DEBUG    | __main__:trials:26 - Trial = 26774/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.286 | DEBUG    | __main__:trials:29 - Trial = 26774/30000 | Total reward = 14.44
2022-01-26 14:18:36.289 | DEBUG    | __main__:trials:24 - Trial = 26775/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.291 | DEBUG    | __main__:trials:29 - Trial = 26775/30000 | Total reward = 47.73
2022-01-26 14:18:36.295 | DEBUG    | __main__:trials:24 - Trial = 26776/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.296 | DEBUG    | __main__:trials:29 - Trial = 26776/30000 | Total reward = 23.00
2022-01-26 14:18:36.299 | DEBUG    | __main__:trials:24 - Trial = 26777/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.301 | DEBUG    | __main__:trials:29 - Trial = 26777/30000 | Total reward = 23.74
2022-01-26 14:18:36.305 | DEBUG    | __main__:trials:24 - Trial = 26778/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.306 | DEBUG    | __main__:trials:29 - Trial = 26778/30000 | Total reward = 40.44
2022-01-26 14:18:36.309 | DEBUG    | __main__:trials:24 - Trial = 26779/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.311 | DEBUG    | __main__:trials:29 - Trial = 26779/30000 | Total reward = 22.66
2022-01-26 14:18:36.315 | DEBUG    | __main__:trials:24 - Trial = 26780/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.317 | DEBUG    | __main__:trials:29 - Trial = 26780/30000 | Total reward = 25.94
2022-01-26 14:18:36.320 | DEBUG    | __main__:trials:24 - Trial = 26781/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.321 | DEBUG    | __main__:trials:29 - Trial = 26781/30000 | Total reward = 27.82
2022-01-26 14:18:36.325 | DEBUG    | __main__:trials:24 - Trial = 26782/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.327 | DEBUG    | __main__:trials:29 - Trial = 26782/30000 | Total reward = 27.22
2022-01-26 14:18:36.330 | DEBUG    | __main__:trials:24 - Trial = 26783/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.331 | DEBUG    | __main__:trials:29 - Trial = 26783/30000 | Total reward = 24.27
2022-01-26 14:18:36.335 | DEBUG    | __main__:trials:24 - Trial = 26784/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.337 | DEBUG    | __main__:trials:29 - Trial = 26784/30000 | Total reward = 50.85
2022-01-26 14:18:36.340 | DEBUG    | __main__:trials:24 - Trial = 26785/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.341 | DEBUG    | __main__:trials:29 - Trial = 26785/30000 | Total reward = 27.15
2022-01-26 14:18:36.345 | DEBUG    | __main__:trials:24 - Trial = 26786/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.346 | DEBUG    | __main__:trials:29 - Trial = 26786/30000 | Total reward = 24.89
2022-01-26 14:18:36.349 | DEBUG    | __main__:trials:24 - Trial = 26787/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.350 | DEBUG    | __main__:trials:29 - Trial = 26787/30000 | Total reward = 35.78
2022-01-26 14:18:36.352 | DEBUG    | __main__:trials:26 - Trial = 26788/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.354 | DEBUG    | __main__:trials:29 - Trial = 26788/30000 | Total reward = 17.59
2022-01-26 14:18:36.357 | DEBUG    | __main__:trials:26 - Trial = 26789/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.358 | DEBUG    | __main__:trials:29 - Trial = 26789/30000 | Total reward = 27.14
2022-01-26 14:18:36.362 | DEBUG    | __main__:trials:24 - Trial = 26790/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.364 | DEBUG    | __main__:trials:29 - Trial = 26790/30000 | Total reward = 35.42
2022-01-26 14:18:36.367 | DEBUG    | __main__:trials:24 - Trial = 26791/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.369 | DEBUG    | __main__:trials:29 - Trial = 26791/30000 | Total reward = 40.31
2022-01-26 14:18:36.372 | DEBUG    | __main__:trials:24 - Trial = 26792/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.374 | DEBUG    | __main__:trials:29 - Trial = 26792/30000 | Total reward = 47.36
2022-01-26 14:18:36.377 | DEBUG    | __main__:trials:24 - Trial = 26793/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.379 | DEBUG    | __main__:trials:29 - Trial = 26793/30000 | Total reward = 27.81
2022-01-26 14:18:36.382 | DEBUG    | __main__:trials:26 - Trial = 26794/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.384 | DEBUG    | __main__:trials:29 - Trial = 26794/30000 | Total reward = 29.46
2022-01-26 14:18:36.387 | DEBUG    | __main__:trials:24 - Trial = 26795/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.389 | DEBUG    | __main__:trials:29 - Trial = 26795/30000 | Total reward = 38.27
2022-01-26 14:18:36.393 | DEBUG    | __main__:trials:24 - Trial = 26796/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.394 | DEBUG    | __main__:trials:29 - Trial = 26796/30000 | Total reward = 43.52
2022-01-26 14:18:36.398 | DEBUG    | __main__:trials:24 - Trial = 26797/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.399 | DEBUG    | __main__:trials:29 - Trial = 26797/30000 | Total reward = 48.24
2022-01-26 14:18:36.402 | DEBUG    | __main__:trials:26 - Trial = 26798/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.404 | DEBUG    | __main__:trials:29 - Trial = 26798/30000 | Total reward = 18.36
2022-01-26 14:18:36.407 | DEBUG    | __main__:trials:26 - Trial = 26799/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.409 | DEBUG    | __main__:trials:29 - Trial = 26799/30000 | Total reward = 16.41
2022-01-26 14:18:36.412 | DEBUG    | __main__:trials:24 - Trial = 26800/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.414 | DEBUG    | __main__:trials:29 - Trial = 26800/30000 | Total reward = 22.47
2022-01-26 14:18:36.417 | DEBUG    | __main__:trials:24 - Trial = 26801/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.418 | DEBUG    | __main__:trials:29 - Trial = 26801/30000 | Total reward = 42.70
2022-01-26 14:18:36.422 | DEBUG    | __main__:trials:24 - Trial = 26802/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.424 | DEBUG    | __main__:trials:29 - Trial = 26802/30000 | Total reward = 26.42
2022-01-26 14:18:36.427 | DEBUG    | __main__:trials:24 - Trial = 26803/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.428 | DEBUG    | __main__:trials:29 - Trial = 26803/30000 | Total reward = 14.88
2022-01-26 14:18:36.432 | DEBUG    | __main__:trials:24 - Trial = 26804/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.434 | DEBUG    | __main__:trials:29 - Trial = 26804/30000 | Total reward = 54.15
2022-01-26 14:18:36.438 | DEBUG    | __main__:trials:24 - Trial = 26805/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.439 | DEBUG    | __main__:trials:29 - Trial = 26805/30000 | Total reward = 27.76
2022-01-26 14:18:36.443 | DEBUG    | __main__:trials:24 - Trial = 26806/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.445 | DEBUG    | __main__:trials:29 - Trial = 26806/30000 | Total reward = 23.86
2022-01-26 14:18:36.448 | DEBUG    | __main__:trials:24 - Trial = 26807/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.450 | DEBUG    | __main__:trials:29 - Trial = 26807/30000 | Total reward = 12.68
2022-01-26 14:18:36.452 | DEBUG    | __main__:trials:26 - Trial = 26808/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.454 | DEBUG    | __main__:trials:29 - Trial = 26808/30000 | Total reward = 15.58
2022-01-26 14:18:36.457 | DEBUG    | __main__:trials:24 - Trial = 26809/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.459 | DEBUG    | __main__:trials:29 - Trial = 26809/30000 | Total reward = 26.27
2022-01-26 14:18:36.462 | DEBUG    | __main__:trials:26 - Trial = 26810/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.463 | DEBUG    | __main__:trials:29 - Trial = 26810/30000 | Total reward = 12.94
2022-01-26 14:18:36.466 | DEBUG    | __main__:trials:24 - Trial = 26811/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.468 | DEBUG    | __main__:trials:29 - Trial = 26811/30000 | Total reward = 27.69
2022-01-26 14:18:36.472 | DEBUG    | __main__:trials:24 - Trial = 26812/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.472 | DEBUG    | __main__:trials:29 - Trial = 26812/30000 | Total reward = 35.25
2022-01-26 14:18:36.476 | DEBUG    | __main__:trials:24 - Trial = 26813/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.477 | DEBUG    | __main__:trials:29 - Trial = 26813/30000 | Total reward = 22.42
2022-01-26 14:18:36.481 | DEBUG    | __main__:trials:24 - Trial = 26814/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.482 | DEBUG    | __main__:trials:29 - Trial = 26814/30000 | Total reward = 51.33
2022-01-26 14:18:36.485 | DEBUG    | __main__:trials:24 - Trial = 26815/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.487 | DEBUG    | __main__:trials:29 - Trial = 26815/30000 | Total reward = 27.41
2022-01-26 14:18:36.489 | DEBUG    | __main__:trials:24 - Trial = 26816/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.490 | DEBUG    | __main__:trials:29 - Trial = 26816/30000 | Total reward = 29.42
2022-01-26 14:18:36.493 | DEBUG    | __main__:trials:26 - Trial = 26817/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.494 | DEBUG    | __main__:trials:29 - Trial = 26817/30000 | Total reward = 19.15
2022-01-26 14:18:36.497 | DEBUG    | __main__:trials:24 - Trial = 26818/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.499 | DEBUG    | __main__:trials:29 - Trial = 26818/30000 | Total reward = 30.89
2022-01-26 14:18:36.502 | DEBUG    | __main__:trials:26 - Trial = 26819/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.504 | DEBUG    | __main__:trials:29 - Trial = 26819/30000 | Total reward = 33.65
2022-01-26 14:18:36.508 | DEBUG    | __main__:trials:24 - Trial = 26820/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.510 | DEBUG    | __main__:trials:29 - Trial = 26820/30000 | Total reward = 34.67
2022-01-26 14:18:36.513 | DEBUG    | __main__:trials:26 - Trial = 26821/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.514 | DEBUG    | __main__:trials:29 - Trial = 26821/30000 | Total reward = 19.51
2022-01-26 14:18:36.517 | DEBUG    | __main__:trials:26 - Trial = 26822/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.518 | DEBUG    | __main__:trials:29 - Trial = 26822/30000 | Total reward = 11.82
2022-01-26 14:18:36.520 | DEBUG    | __main__:trials:26 - Trial = 26823/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.522 | DEBUG    | __main__:trials:29 - Trial = 26823/30000 | Total reward = 16.70
2022-01-26 14:18:36.526 | DEBUG    | __main__:trials:24 - Trial = 26824/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.528 | DEBUG    | __main__:trials:29 - Trial = 26824/30000 | Total reward = 24.72
2022-01-26 14:18:36.531 | DEBUG    | __main__:trials:26 - Trial = 26825/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.533 | DEBUG    | __main__:trials:29 - Trial = 26825/30000 | Total reward = 22.80
2022-01-26 14:18:36.536 | DEBUG    | __main__:trials:24 - Trial = 26826/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.538 | DEBUG    | __main__:trials:29 - Trial = 26826/30000 | Total reward = 25.98
2022-01-26 14:18:36.541 | DEBUG    | __main__:trials:24 - Trial = 26827/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.543 | DEBUG    | __main__:trials:29 - Trial = 26827/30000 | Total reward = 26.11
2022-01-26 14:18:36.546 | DEBUG    | __main__:trials:24 - Trial = 26828/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.548 | DEBUG    | __main__:trials:29 - Trial = 26828/30000 | Total reward = 42.84
2022-01-26 14:18:36.551 | DEBUG    | __main__:trials:24 - Trial = 26829/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.553 | DEBUG    | __main__:trials:29 - Trial = 26829/30000 | Total reward = 47.86
2022-01-26 14:18:36.556 | DEBUG    | __main__:trials:24 - Trial = 26830/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.558 | DEBUG    | __main__:trials:29 - Trial = 26830/30000 | Total reward = 27.56
2022-01-26 14:18:36.561 | DEBUG    | __main__:trials:26 - Trial = 26831/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.563 | DEBUG    | __main__:trials:29 - Trial = 26831/30000 | Total reward = 18.25
2022-01-26 14:18:36.565 | DEBUG    | __main__:trials:24 - Trial = 26832/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.567 | DEBUG    | __main__:trials:29 - Trial = 26832/30000 | Total reward = 30.57
2022-01-26 14:18:36.571 | DEBUG    | __main__:trials:24 - Trial = 26833/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.572 | DEBUG    | __main__:trials:29 - Trial = 26833/30000 | Total reward = 26.18
2022-01-26 14:18:36.576 | DEBUG    | __main__:trials:24 - Trial = 26834/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.578 | DEBUG    | __main__:trials:29 - Trial = 26834/30000 | Total reward = 25.31
2022-01-26 14:18:36.581 | DEBUG    | __main__:trials:24 - Trial = 26835/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.582 | DEBUG    | __main__:trials:29 - Trial = 26835/30000 | Total reward = 27.88
2022-01-26 14:18:36.585 | DEBUG    | __main__:trials:24 - Trial = 26836/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.587 | DEBUG    | __main__:trials:29 - Trial = 26836/30000 | Total reward = 28.64
2022-01-26 14:18:36.589 | DEBUG    | __main__:trials:24 - Trial = 26837/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.591 | DEBUG    | __main__:trials:29 - Trial = 26837/30000 | Total reward = 26.42
2022-01-26 14:18:36.594 | DEBUG    | __main__:trials:24 - Trial = 26838/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.596 | DEBUG    | __main__:trials:29 - Trial = 26838/30000 | Total reward = 27.37
2022-01-26 14:18:36.600 | DEBUG    | __main__:trials:24 - Trial = 26839/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.601 | DEBUG    | __main__:trials:29 - Trial = 26839/30000 | Total reward = 31.50
2022-01-26 14:18:36.605 | DEBUG    | __main__:trials:24 - Trial = 26840/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.606 | DEBUG    | __main__:trials:29 - Trial = 26840/30000 | Total reward = 26.75
2022-01-26 14:18:36.610 | DEBUG    | __main__:trials:24 - Trial = 26841/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.612 | DEBUG    | __main__:trials:29 - Trial = 26841/30000 | Total reward = 28.52
2022-01-26 14:18:36.615 | DEBUG    | __main__:trials:24 - Trial = 26842/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.617 | DEBUG    | __main__:trials:29 - Trial = 26842/30000 | Total reward = 24.97
2022-01-26 14:18:36.620 | DEBUG    | __main__:trials:24 - Trial = 26843/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.622 | DEBUG    | __main__:trials:29 - Trial = 26843/30000 | Total reward = 21.29
2022-01-26 14:18:36.625 | DEBUG    | __main__:trials:26 - Trial = 26844/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.626 | DEBUG    | __main__:trials:29 - Trial = 26844/30000 | Total reward = 15.14
2022-01-26 14:18:36.630 | DEBUG    | __main__:trials:24 - Trial = 26845/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.632 | DEBUG    | __main__:trials:29 - Trial = 26845/30000 | Total reward = 44.43
2022-01-26 14:18:36.634 | DEBUG    | __main__:trials:26 - Trial = 26846/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.636 | DEBUG    | __main__:trials:29 - Trial = 26846/30000 | Total reward = 18.25
2022-01-26 14:18:36.639 | DEBUG    | __main__:trials:24 - Trial = 26847/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.641 | DEBUG    | __main__:trials:29 - Trial = 26847/30000 | Total reward = 23.04
2022-01-26 14:18:36.644 | DEBUG    | __main__:trials:24 - Trial = 26848/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.645 | DEBUG    | __main__:trials:29 - Trial = 26848/30000 | Total reward = 48.71
2022-01-26 14:18:36.649 | DEBUG    | __main__:trials:24 - Trial = 26849/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.650 | DEBUG    | __main__:trials:29 - Trial = 26849/30000 | Total reward = 31.94
2022-01-26 14:18:36.654 | DEBUG    | __main__:trials:24 - Trial = 26850/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.656 | DEBUG    | __main__:trials:29 - Trial = 26850/30000 | Total reward = 41.77
2022-01-26 14:18:36.659 | DEBUG    | __main__:trials:26 - Trial = 26851/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.660 | DEBUG    | __main__:trials:29 - Trial = 26851/30000 | Total reward = 20.20
2022-01-26 14:18:36.664 | DEBUG    | __main__:trials:24 - Trial = 26852/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.666 | DEBUG    | __main__:trials:29 - Trial = 26852/30000 | Total reward = 26.42
2022-01-26 14:18:36.670 | DEBUG    | __main__:trials:24 - Trial = 26853/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.672 | DEBUG    | __main__:trials:29 - Trial = 26853/30000 | Total reward = 23.26
2022-01-26 14:18:36.676 | DEBUG    | __main__:trials:24 - Trial = 26854/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.677 | DEBUG    | __main__:trials:29 - Trial = 26854/30000 | Total reward = 18.51
2022-01-26 14:18:36.680 | DEBUG    | __main__:trials:26 - Trial = 26855/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.682 | DEBUG    | __main__:trials:29 - Trial = 26855/30000 | Total reward = 15.11
2022-01-26 14:18:36.684 | DEBUG    | __main__:trials:26 - Trial = 26856/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.686 | DEBUG    | __main__:trials:29 - Trial = 26856/30000 | Total reward = 8.43
2022-01-26 14:18:36.690 | DEBUG    | __main__:trials:24 - Trial = 26857/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.691 | DEBUG    | __main__:trials:29 - Trial = 26857/30000 | Total reward = 31.45
2022-01-26 14:18:36.695 | DEBUG    | __main__:trials:24 - Trial = 26858/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.696 | DEBUG    | __main__:trials:29 - Trial = 26858/30000 | Total reward = 58.49
2022-01-26 14:18:36.699 | DEBUG    | __main__:trials:24 - Trial = 26859/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.701 | DEBUG    | __main__:trials:29 - Trial = 26859/30000 | Total reward = 30.12
2022-01-26 14:18:36.704 | DEBUG    | __main__:trials:24 - Trial = 26860/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.706 | DEBUG    | __main__:trials:29 - Trial = 26860/30000 | Total reward = 45.01
2022-01-26 14:18:36.710 | DEBUG    | __main__:trials:24 - Trial = 26861/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.711 | DEBUG    | __main__:trials:29 - Trial = 26861/30000 | Total reward = 16.89
2022-01-26 14:18:36.715 | DEBUG    | __main__:trials:24 - Trial = 26862/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.717 | DEBUG    | __main__:trials:29 - Trial = 26862/30000 | Total reward = 31.65
2022-01-26 14:18:36.721 | DEBUG    | __main__:trials:24 - Trial = 26863/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.722 | DEBUG    | __main__:trials:29 - Trial = 26863/30000 | Total reward = 31.77
2022-01-26 14:18:36.725 | DEBUG    | __main__:trials:26 - Trial = 26864/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.726 | DEBUG    | __main__:trials:29 - Trial = 26864/30000 | Total reward = 15.84
2022-01-26 14:18:36.730 | DEBUG    | __main__:trials:24 - Trial = 26865/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.732 | DEBUG    | __main__:trials:29 - Trial = 26865/30000 | Total reward = 31.39
2022-01-26 14:18:36.735 | DEBUG    | __main__:trials:24 - Trial = 26866/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.737 | DEBUG    | __main__:trials:29 - Trial = 26866/30000 | Total reward = 32.82
2022-01-26 14:18:36.740 | DEBUG    | __main__:trials:26 - Trial = 26867/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.741 | DEBUG    | __main__:trials:29 - Trial = 26867/30000 | Total reward = 13.57
2022-01-26 14:18:36.745 | DEBUG    | __main__:trials:24 - Trial = 26868/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.746 | DEBUG    | __main__:trials:29 - Trial = 26868/30000 | Total reward = 48.20
2022-01-26 14:18:36.750 | DEBUG    | __main__:trials:24 - Trial = 26869/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.752 | DEBUG    | __main__:trials:29 - Trial = 26869/30000 | Total reward = 28.13
2022-01-26 14:18:36.755 | DEBUG    | __main__:trials:24 - Trial = 26870/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.757 | DEBUG    | __main__:trials:29 - Trial = 26870/30000 | Total reward = 24.24
2022-01-26 14:18:36.760 | DEBUG    | __main__:trials:24 - Trial = 26871/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.761 | DEBUG    | __main__:trials:29 - Trial = 26871/30000 | Total reward = 39.87
2022-01-26 14:18:36.765 | DEBUG    | __main__:trials:24 - Trial = 26872/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.767 | DEBUG    | __main__:trials:29 - Trial = 26872/30000 | Total reward = 37.63
2022-01-26 14:18:36.770 | DEBUG    | __main__:trials:26 - Trial = 26873/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.772 | DEBUG    | __main__:trials:29 - Trial = 26873/30000 | Total reward = 20.72
2022-01-26 14:18:36.775 | DEBUG    | __main__:trials:24 - Trial = 26874/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.776 | DEBUG    | __main__:trials:29 - Trial = 26874/30000 | Total reward = 21.13
2022-01-26 14:18:36.780 | DEBUG    | __main__:trials:24 - Trial = 26875/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.782 | DEBUG    | __main__:trials:29 - Trial = 26875/30000 | Total reward = 35.85
2022-01-26 14:18:36.785 | DEBUG    | __main__:trials:24 - Trial = 26876/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.787 | DEBUG    | __main__:trials:29 - Trial = 26876/30000 | Total reward = 28.97
2022-01-26 14:18:36.791 | DEBUG    | __main__:trials:24 - Trial = 26877/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.792 | DEBUG    | __main__:trials:29 - Trial = 26877/30000 | Total reward = 28.30
2022-01-26 14:18:36.796 | DEBUG    | __main__:trials:24 - Trial = 26878/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.797 | DEBUG    | __main__:trials:29 - Trial = 26878/30000 | Total reward = 25.67
2022-01-26 14:18:36.800 | DEBUG    | __main__:trials:24 - Trial = 26879/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.802 | DEBUG    | __main__:trials:29 - Trial = 26879/30000 | Total reward = 31.72
2022-01-26 14:18:36.806 | DEBUG    | __main__:trials:24 - Trial = 26880/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.807 | DEBUG    | __main__:trials:29 - Trial = 26880/30000 | Total reward = 31.56
2022-01-26 14:18:36.811 | DEBUG    | __main__:trials:24 - Trial = 26881/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.813 | DEBUG    | __main__:trials:29 - Trial = 26881/30000 | Total reward = 36.15
2022-01-26 14:18:36.816 | DEBUG    | __main__:trials:24 - Trial = 26882/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.817 | DEBUG    | __main__:trials:29 - Trial = 26882/30000 | Total reward = 30.24
2022-01-26 14:18:36.821 | DEBUG    | __main__:trials:24 - Trial = 26883/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.822 | DEBUG    | __main__:trials:29 - Trial = 26883/30000 | Total reward = 22.77
2022-01-26 14:18:36.826 | DEBUG    | __main__:trials:24 - Trial = 26884/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.828 | DEBUG    | __main__:trials:29 - Trial = 26884/30000 | Total reward = 35.87
2022-01-26 14:18:36.830 | DEBUG    | __main__:trials:24 - Trial = 26885/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.832 | DEBUG    | __main__:trials:29 - Trial = 26885/30000 | Total reward = 31.59
2022-01-26 14:18:36.836 | DEBUG    | __main__:trials:24 - Trial = 26886/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.837 | DEBUG    | __main__:trials:29 - Trial = 26886/30000 | Total reward = 23.45
2022-01-26 14:18:36.841 | DEBUG    | __main__:trials:24 - Trial = 26887/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.843 | DEBUG    | __main__:trials:29 - Trial = 26887/30000 | Total reward = 14.46
2022-01-26 14:18:36.847 | DEBUG    | __main__:trials:24 - Trial = 26888/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.848 | DEBUG    | __main__:trials:29 - Trial = 26888/30000 | Total reward = 29.34
2022-01-26 14:18:36.851 | DEBUG    | __main__:trials:24 - Trial = 26889/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.853 | DEBUG    | __main__:trials:29 - Trial = 26889/30000 | Total reward = 31.20
2022-01-26 14:18:36.857 | DEBUG    | __main__:trials:24 - Trial = 26890/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.858 | DEBUG    | __main__:trials:29 - Trial = 26890/30000 | Total reward = 34.05
2022-01-26 14:18:36.863 | DEBUG    | __main__:trials:24 - Trial = 26891/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.864 | DEBUG    | __main__:trials:29 - Trial = 26891/30000 | Total reward = 31.75
2022-01-26 14:18:36.868 | DEBUG    | __main__:trials:24 - Trial = 26892/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.870 | DEBUG    | __main__:trials:29 - Trial = 26892/30000 | Total reward = 35.52
2022-01-26 14:18:36.874 | DEBUG    | __main__:trials:24 - Trial = 26893/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.874 | DEBUG    | __main__:trials:29 - Trial = 26893/30000 | Total reward = 42.34
2022-01-26 14:18:36.879 | DEBUG    | __main__:trials:24 - Trial = 26894/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.880 | DEBUG    | __main__:trials:29 - Trial = 26894/30000 | Total reward = 32.32
2022-01-26 14:18:36.884 | DEBUG    | __main__:trials:24 - Trial = 26895/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.885 | DEBUG    | __main__:trials:29 - Trial = 26895/30000 | Total reward = 51.04
2022-01-26 14:18:36.889 | DEBUG    | __main__:trials:24 - Trial = 26896/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.890 | DEBUG    | __main__:trials:29 - Trial = 26896/30000 | Total reward = 36.10
2022-01-26 14:18:36.894 | DEBUG    | __main__:trials:24 - Trial = 26897/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.895 | DEBUG    | __main__:trials:29 - Trial = 26897/30000 | Total reward = 26.19
2022-01-26 14:18:36.899 | DEBUG    | __main__:trials:26 - Trial = 26898/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.900 | DEBUG    | __main__:trials:29 - Trial = 26898/30000 | Total reward = 21.14
2022-01-26 14:18:36.904 | DEBUG    | __main__:trials:24 - Trial = 26899/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.905 | DEBUG    | __main__:trials:29 - Trial = 26899/30000 | Total reward = 30.40
2022-01-26 14:18:36.909 | DEBUG    | __main__:trials:24 - Trial = 26900/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.910 | DEBUG    | __main__:trials:29 - Trial = 26900/30000 | Total reward = 23.64
2022-01-26 14:18:36.914 | DEBUG    | __main__:trials:26 - Trial = 26901/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.915 | DEBUG    | __main__:trials:29 - Trial = 26901/30000 | Total reward = 26.33
2022-01-26 14:18:36.919 | DEBUG    | __main__:trials:24 - Trial = 26902/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.920 | DEBUG    | __main__:trials:29 - Trial = 26902/30000 | Total reward = 26.28
2022-01-26 14:18:36.924 | DEBUG    | __main__:trials:24 - Trial = 26903/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.926 | DEBUG    | __main__:trials:29 - Trial = 26903/30000 | Total reward = 26.56
2022-01-26 14:18:36.930 | DEBUG    | __main__:trials:24 - Trial = 26904/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.931 | DEBUG    | __main__:trials:29 - Trial = 26904/30000 | Total reward = 35.39
2022-01-26 14:18:36.934 | DEBUG    | __main__:trials:24 - Trial = 26905/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.936 | DEBUG    | __main__:trials:29 - Trial = 26905/30000 | Total reward = 23.55
2022-01-26 14:18:36.939 | DEBUG    | __main__:trials:24 - Trial = 26906/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.941 | DEBUG    | __main__:trials:29 - Trial = 26906/30000 | Total reward = 39.30
2022-01-26 14:18:36.944 | DEBUG    | __main__:trials:24 - Trial = 26907/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.946 | DEBUG    | __main__:trials:29 - Trial = 26907/30000 | Total reward = 46.10
2022-01-26 14:18:36.949 | DEBUG    | __main__:trials:26 - Trial = 26908/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.951 | DEBUG    | __main__:trials:29 - Trial = 26908/30000 | Total reward = 18.88
2022-01-26 14:18:36.955 | DEBUG    | __main__:trials:24 - Trial = 26909/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.956 | DEBUG    | __main__:trials:29 - Trial = 26909/30000 | Total reward = 42.48
2022-01-26 14:18:36.959 | DEBUG    | __main__:trials:24 - Trial = 26910/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.961 | DEBUG    | __main__:trials:29 - Trial = 26910/30000 | Total reward = 24.05
2022-01-26 14:18:36.965 | DEBUG    | __main__:trials:24 - Trial = 26911/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.966 | DEBUG    | __main__:trials:29 - Trial = 26911/30000 | Total reward = 45.70
2022-01-26 14:18:36.969 | DEBUG    | __main__:trials:26 - Trial = 26912/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:36.970 | DEBUG    | __main__:trials:29 - Trial = 26912/30000 | Total reward = 12.90
2022-01-26 14:18:36.973 | DEBUG    | __main__:trials:24 - Trial = 26913/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.974 | DEBUG    | __main__:trials:29 - Trial = 26913/30000 | Total reward = 35.00
2022-01-26 14:18:36.978 | DEBUG    | __main__:trials:24 - Trial = 26914/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.980 | DEBUG    | __main__:trials:29 - Trial = 26914/30000 | Total reward = 47.50
2022-01-26 14:18:36.984 | DEBUG    | __main__:trials:24 - Trial = 26915/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.985 | DEBUG    | __main__:trials:29 - Trial = 26915/30000 | Total reward = 42.63
2022-01-26 14:18:36.989 | DEBUG    | __main__:trials:24 - Trial = 26916/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.989 | DEBUG    | __main__:trials:29 - Trial = 26916/30000 | Total reward = 39.16
2022-01-26 14:18:36.994 | DEBUG    | __main__:trials:24 - Trial = 26917/30000 | Max number of steps (20) reached
2022-01-26 14:18:36.994 | DEBUG    | __main__:trials:29 - Trial = 26917/30000 | Total reward = 45.74
2022-01-26 14:18:36.999 | DEBUG    | __main__:trials:24 - Trial = 26918/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.000 | DEBUG    | __main__:trials:29 - Trial = 26918/30000 | Total reward = 41.76
2022-01-26 14:18:37.004 | DEBUG    | __main__:trials:24 - Trial = 26919/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.005 | DEBUG    | __main__:trials:29 - Trial = 26919/30000 | Total reward = 45.27
2022-01-26 14:18:37.009 | DEBUG    | __main__:trials:24 - Trial = 26920/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.011 | DEBUG    | __main__:trials:29 - Trial = 26920/30000 | Total reward = 50.35
2022-01-26 14:18:37.015 | DEBUG    | __main__:trials:24 - Trial = 26921/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.016 | DEBUG    | __main__:trials:29 - Trial = 26921/30000 | Total reward = 37.90
2022-01-26 14:18:37.019 | DEBUG    | __main__:trials:26 - Trial = 26922/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.020 | DEBUG    | __main__:trials:29 - Trial = 26922/30000 | Total reward = 11.25
2022-01-26 14:18:37.024 | DEBUG    | __main__:trials:24 - Trial = 26923/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.025 | DEBUG    | __main__:trials:29 - Trial = 26923/30000 | Total reward = 43.45
2022-01-26 14:18:37.029 | DEBUG    | __main__:trials:24 - Trial = 26924/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.030 | DEBUG    | __main__:trials:29 - Trial = 26924/30000 | Total reward = 19.85
2022-01-26 14:18:37.033 | DEBUG    | __main__:trials:26 - Trial = 26925/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.035 | DEBUG    | __main__:trials:29 - Trial = 26925/30000 | Total reward = 25.02
2022-01-26 14:18:37.039 | DEBUG    | __main__:trials:24 - Trial = 26926/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.039 | DEBUG    | __main__:trials:29 - Trial = 26926/30000 | Total reward = 23.13
2022-01-26 14:18:37.044 | DEBUG    | __main__:trials:24 - Trial = 26927/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.045 | DEBUG    | __main__:trials:29 - Trial = 26927/30000 | Total reward = 29.60
2022-01-26 14:18:37.049 | DEBUG    | __main__:trials:26 - Trial = 26928/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.050 | DEBUG    | __main__:trials:29 - Trial = 26928/30000 | Total reward = 24.68
2022-01-26 14:18:37.054 | DEBUG    | __main__:trials:24 - Trial = 26929/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.056 | DEBUG    | __main__:trials:29 - Trial = 26929/30000 | Total reward = 47.99
2022-01-26 14:18:37.059 | DEBUG    | __main__:trials:24 - Trial = 26930/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.061 | DEBUG    | __main__:trials:29 - Trial = 26930/30000 | Total reward = 45.58
2022-01-26 14:18:37.064 | DEBUG    | __main__:trials:26 - Trial = 26931/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.064 | DEBUG    | __main__:trials:29 - Trial = 26931/30000 | Total reward = 17.25
2022-01-26 14:18:37.068 | DEBUG    | __main__:trials:24 - Trial = 26932/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.069 | DEBUG    | __main__:trials:29 - Trial = 26932/30000 | Total reward = 36.10
2022-01-26 14:18:37.073 | DEBUG    | __main__:trials:24 - Trial = 26933/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.073 | DEBUG    | __main__:trials:29 - Trial = 26933/30000 | Total reward = 37.79
2022-01-26 14:18:37.077 | DEBUG    | __main__:trials:24 - Trial = 26934/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.077 | DEBUG    | __main__:trials:29 - Trial = 26934/30000 | Total reward = 37.10
2022-01-26 14:18:37.082 | DEBUG    | __main__:trials:24 - Trial = 26935/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.083 | DEBUG    | __main__:trials:29 - Trial = 26935/30000 | Total reward = 50.10
2022-01-26 14:18:37.088 | DEBUG    | __main__:trials:24 - Trial = 26936/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.088 | DEBUG    | __main__:trials:29 - Trial = 26936/30000 | Total reward = 43.34
2022-01-26 14:18:37.092 | DEBUG    | __main__:trials:26 - Trial = 26937/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.093 | DEBUG    | __main__:trials:29 - Trial = 26937/30000 | Total reward = 17.72
2022-01-26 14:18:37.098 | DEBUG    | __main__:trials:24 - Trial = 26938/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.099 | DEBUG    | __main__:trials:29 - Trial = 26938/30000 | Total reward = 34.67
2022-01-26 14:18:37.102 | DEBUG    | __main__:trials:26 - Trial = 26939/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.103 | DEBUG    | __main__:trials:29 - Trial = 26939/30000 | Total reward = 11.64
2022-01-26 14:18:37.107 | DEBUG    | __main__:trials:24 - Trial = 26940/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.109 | DEBUG    | __main__:trials:29 - Trial = 26940/30000 | Total reward = 52.81
2022-01-26 14:18:37.112 | DEBUG    | __main__:trials:24 - Trial = 26941/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.114 | DEBUG    | __main__:trials:29 - Trial = 26941/30000 | Total reward = 40.52
2022-01-26 14:18:37.117 | DEBUG    | __main__:trials:26 - Trial = 26942/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.118 | DEBUG    | __main__:trials:29 - Trial = 26942/30000 | Total reward = 37.50
2022-01-26 14:18:37.122 | DEBUG    | __main__:trials:24 - Trial = 26943/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.123 | DEBUG    | __main__:trials:29 - Trial = 26943/30000 | Total reward = 37.30
2022-01-26 14:18:37.126 | DEBUG    | __main__:trials:24 - Trial = 26944/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.128 | DEBUG    | __main__:trials:29 - Trial = 26944/30000 | Total reward = 42.15
2022-01-26 14:18:37.131 | DEBUG    | __main__:trials:26 - Trial = 26945/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.132 | DEBUG    | __main__:trials:29 - Trial = 26945/30000 | Total reward = 21.37
2022-01-26 14:18:37.136 | DEBUG    | __main__:trials:24 - Trial = 26946/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.137 | DEBUG    | __main__:trials:29 - Trial = 26946/30000 | Total reward = 41.89
2022-01-26 14:18:37.141 | DEBUG    | __main__:trials:24 - Trial = 26947/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.143 | DEBUG    | __main__:trials:29 - Trial = 26947/30000 | Total reward = 40.15
2022-01-26 14:18:37.147 | DEBUG    | __main__:trials:24 - Trial = 26948/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.147 | DEBUG    | __main__:trials:29 - Trial = 26948/30000 | Total reward = 42.57
2022-01-26 14:18:37.152 | DEBUG    | __main__:trials:24 - Trial = 26949/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.152 | DEBUG    | __main__:trials:29 - Trial = 26949/30000 | Total reward = 35.50
2022-01-26 14:18:37.156 | DEBUG    | __main__:trials:24 - Trial = 26950/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.157 | DEBUG    | __main__:trials:29 - Trial = 26950/30000 | Total reward = 36.07
2022-01-26 14:18:37.160 | DEBUG    | __main__:trials:26 - Trial = 26951/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.160 | DEBUG    | __main__:trials:29 - Trial = 26951/30000 | Total reward = 19.26
2022-01-26 14:18:37.163 | DEBUG    | __main__:trials:26 - Trial = 26952/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.165 | DEBUG    | __main__:trials:29 - Trial = 26952/30000 | Total reward = 24.47
2022-01-26 14:18:37.168 | DEBUG    | __main__:trials:24 - Trial = 26953/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.169 | DEBUG    | __main__:trials:29 - Trial = 26953/30000 | Total reward = 20.82
2022-01-26 14:18:37.174 | DEBUG    | __main__:trials:24 - Trial = 26954/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.175 | DEBUG    | __main__:trials:29 - Trial = 26954/30000 | Total reward = 37.23
2022-01-26 14:18:37.178 | DEBUG    | __main__:trials:26 - Trial = 26955/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.180 | DEBUG    | __main__:trials:29 - Trial = 26955/30000 | Total reward = 14.56
2022-01-26 14:18:37.182 | DEBUG    | __main__:trials:26 - Trial = 26956/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.183 | DEBUG    | __main__:trials:29 - Trial = 26956/30000 | Total reward = 17.17
2022-01-26 14:18:37.187 | DEBUG    | __main__:trials:26 - Trial = 26957/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.189 | DEBUG    | __main__:trials:29 - Trial = 26957/30000 | Total reward = 15.80
2022-01-26 14:18:37.191 | DEBUG    | __main__:trials:26 - Trial = 26958/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.193 | DEBUG    | __main__:trials:29 - Trial = 26958/30000 | Total reward = 24.26
2022-01-26 14:18:37.196 | DEBUG    | __main__:trials:24 - Trial = 26959/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.198 | DEBUG    | __main__:trials:29 - Trial = 26959/30000 | Total reward = 38.25
2022-01-26 14:18:37.202 | DEBUG    | __main__:trials:24 - Trial = 26960/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.203 | DEBUG    | __main__:trials:29 - Trial = 26960/30000 | Total reward = 27.62
2022-01-26 14:18:37.206 | DEBUG    | __main__:trials:24 - Trial = 26961/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.208 | DEBUG    | __main__:trials:29 - Trial = 26961/30000 | Total reward = 33.44
2022-01-26 14:18:37.211 | DEBUG    | __main__:trials:24 - Trial = 26962/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.213 | DEBUG    | __main__:trials:29 - Trial = 26962/30000 | Total reward = 28.89
2022-01-26 14:18:37.215 | DEBUG    | __main__:trials:24 - Trial = 26963/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.217 | DEBUG    | __main__:trials:29 - Trial = 26963/30000 | Total reward = 36.15
2022-01-26 14:18:37.221 | DEBUG    | __main__:trials:24 - Trial = 26964/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.222 | DEBUG    | __main__:trials:29 - Trial = 26964/30000 | Total reward = 35.18
2022-01-26 14:18:37.224 | DEBUG    | __main__:trials:26 - Trial = 26965/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.225 | DEBUG    | __main__:trials:29 - Trial = 26965/30000 | Total reward = 7.55
2022-01-26 14:18:37.229 | DEBUG    | __main__:trials:26 - Trial = 26966/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.231 | DEBUG    | __main__:trials:29 - Trial = 26966/30000 | Total reward = 27.25
2022-01-26 14:18:37.234 | DEBUG    | __main__:trials:26 - Trial = 26967/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.236 | DEBUG    | __main__:trials:29 - Trial = 26967/30000 | Total reward = 23.51
2022-01-26 14:18:37.239 | DEBUG    | __main__:trials:24 - Trial = 26968/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.240 | DEBUG    | __main__:trials:29 - Trial = 26968/30000 | Total reward = 41.57
2022-01-26 14:18:37.244 | DEBUG    | __main__:trials:24 - Trial = 26969/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.246 | DEBUG    | __main__:trials:29 - Trial = 26969/30000 | Total reward = 36.34
2022-01-26 14:18:37.250 | DEBUG    | __main__:trials:24 - Trial = 26970/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.250 | DEBUG    | __main__:trials:29 - Trial = 26970/30000 | Total reward = 50.96
2022-01-26 14:18:37.255 | DEBUG    | __main__:trials:24 - Trial = 26971/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.256 | DEBUG    | __main__:trials:29 - Trial = 26971/30000 | Total reward = 37.01
2022-01-26 14:18:37.260 | DEBUG    | __main__:trials:26 - Trial = 26972/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.261 | DEBUG    | __main__:trials:29 - Trial = 26972/30000 | Total reward = 22.26
2022-01-26 14:18:37.265 | DEBUG    | __main__:trials:26 - Trial = 26973/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.266 | DEBUG    | __main__:trials:29 - Trial = 26973/30000 | Total reward = 18.96
2022-01-26 14:18:37.270 | DEBUG    | __main__:trials:24 - Trial = 26974/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.271 | DEBUG    | __main__:trials:29 - Trial = 26974/30000 | Total reward = 41.99
2022-01-26 14:18:37.275 | DEBUG    | __main__:trials:24 - Trial = 26975/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.276 | DEBUG    | __main__:trials:29 - Trial = 26975/30000 | Total reward = 33.33
2022-01-26 14:18:37.280 | DEBUG    | __main__:trials:24 - Trial = 26976/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.282 | DEBUG    | __main__:trials:29 - Trial = 26976/30000 | Total reward = 42.15
2022-01-26 14:18:37.286 | DEBUG    | __main__:trials:24 - Trial = 26977/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.286 | DEBUG    | __main__:trials:29 - Trial = 26977/30000 | Total reward = 41.64
2022-01-26 14:18:37.291 | DEBUG    | __main__:trials:24 - Trial = 26978/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.292 | DEBUG    | __main__:trials:29 - Trial = 26978/30000 | Total reward = 34.37
2022-01-26 14:18:37.296 | DEBUG    | __main__:trials:26 - Trial = 26979/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.297 | DEBUG    | __main__:trials:29 - Trial = 26979/30000 | Total reward = 15.55
2022-01-26 14:18:37.300 | DEBUG    | __main__:trials:24 - Trial = 26980/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.301 | DEBUG    | __main__:trials:29 - Trial = 26980/30000 | Total reward = 40.52
2022-01-26 14:18:37.305 | DEBUG    | __main__:trials:24 - Trial = 26981/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.306 | DEBUG    | __main__:trials:29 - Trial = 26981/30000 | Total reward = 41.94
2022-01-26 14:18:37.310 | DEBUG    | __main__:trials:24 - Trial = 26982/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.312 | DEBUG    | __main__:trials:29 - Trial = 26982/30000 | Total reward = 46.56
2022-01-26 14:18:37.315 | DEBUG    | __main__:trials:26 - Trial = 26983/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.316 | DEBUG    | __main__:trials:29 - Trial = 26983/30000 | Total reward = 23.23
2022-01-26 14:18:37.320 | DEBUG    | __main__:trials:24 - Trial = 26984/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.322 | DEBUG    | __main__:trials:29 - Trial = 26984/30000 | Total reward = 25.48
2022-01-26 14:18:37.326 | DEBUG    | __main__:trials:24 - Trial = 26985/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.327 | DEBUG    | __main__:trials:29 - Trial = 26985/30000 | Total reward = 36.53
2022-01-26 14:18:37.331 | DEBUG    | __main__:trials:24 - Trial = 26986/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.332 | DEBUG    | __main__:trials:29 - Trial = 26986/30000 | Total reward = 28.73
2022-01-26 14:18:37.334 | DEBUG    | __main__:trials:26 - Trial = 26987/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.336 | DEBUG    | __main__:trials:29 - Trial = 26987/30000 | Total reward = 15.13
2022-01-26 14:18:37.339 | DEBUG    | __main__:trials:24 - Trial = 26988/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.341 | DEBUG    | __main__:trials:29 - Trial = 26988/30000 | Total reward = 47.45
2022-01-26 14:18:37.344 | DEBUG    | __main__:trials:24 - Trial = 26989/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.344 | DEBUG    | __main__:trials:29 - Trial = 26989/30000 | Total reward = 41.81
2022-01-26 14:18:37.348 | DEBUG    | __main__:trials:24 - Trial = 26990/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.348 | DEBUG    | __main__:trials:29 - Trial = 26990/30000 | Total reward = 41.14
2022-01-26 14:18:37.352 | DEBUG    | __main__:trials:24 - Trial = 26991/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.353 | DEBUG    | __main__:trials:29 - Trial = 26991/30000 | Total reward = 25.17
2022-01-26 14:18:37.356 | DEBUG    | __main__:trials:24 - Trial = 26992/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.358 | DEBUG    | __main__:trials:29 - Trial = 26992/30000 | Total reward = 41.83
2022-01-26 14:18:37.361 | DEBUG    | __main__:trials:24 - Trial = 26993/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.362 | DEBUG    | __main__:trials:29 - Trial = 26993/30000 | Total reward = 42.65
2022-01-26 14:18:37.365 | DEBUG    | __main__:trials:24 - Trial = 26994/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.367 | DEBUG    | __main__:trials:29 - Trial = 26994/30000 | Total reward = 34.37
2022-01-26 14:18:37.370 | DEBUG    | __main__:trials:24 - Trial = 26995/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.371 | DEBUG    | __main__:trials:29 - Trial = 26995/30000 | Total reward = 47.14
2022-01-26 14:18:37.374 | DEBUG    | __main__:trials:24 - Trial = 26996/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.376 | DEBUG    | __main__:trials:29 - Trial = 26996/30000 | Total reward = 36.49
2022-01-26 14:18:37.379 | DEBUG    | __main__:trials:24 - Trial = 26997/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.380 | DEBUG    | __main__:trials:29 - Trial = 26997/30000 | Total reward = 34.33
2022-01-26 14:18:37.384 | DEBUG    | __main__:trials:24 - Trial = 26998/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.385 | DEBUG    | __main__:trials:29 - Trial = 26998/30000 | Total reward = 36.24
2022-01-26 14:18:37.388 | DEBUG    | __main__:trials:24 - Trial = 26999/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.390 | DEBUG    | __main__:trials:29 - Trial = 26999/30000 | Total reward = 39.28
2022-01-26 14:18:37.393 | DEBUG    | __main__:trials:24 - Trial = 27000/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.393 | DEBUG    | __main__:trials:29 - Trial = 27000/30000 | Total reward = 45.53
2022-01-26 14:18:37.397 | DEBUG    | __main__:trials:24 - Trial = 27001/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.398 | DEBUG    | __main__:trials:29 - Trial = 27001/30000 | Total reward = 42.15
2022-01-26 14:18:37.401 | DEBUG    | __main__:trials:24 - Trial = 27002/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.402 | DEBUG    | __main__:trials:29 - Trial = 27002/30000 | Total reward = 55.55
2022-01-26 14:18:37.405 | DEBUG    | __main__:trials:24 - Trial = 27003/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.407 | DEBUG    | __main__:trials:29 - Trial = 27003/30000 | Total reward = 39.56
2022-01-26 14:18:37.410 | DEBUG    | __main__:trials:24 - Trial = 27004/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.412 | DEBUG    | __main__:trials:29 - Trial = 27004/30000 | Total reward = 42.04
2022-01-26 14:18:37.415 | DEBUG    | __main__:trials:26 - Trial = 27005/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.417 | DEBUG    | __main__:trials:29 - Trial = 27005/30000 | Total reward = 26.98
2022-01-26 14:18:37.420 | DEBUG    | __main__:trials:24 - Trial = 27006/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.422 | DEBUG    | __main__:trials:29 - Trial = 27006/30000 | Total reward = 42.59
2022-01-26 14:18:37.426 | DEBUG    | __main__:trials:24 - Trial = 27007/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.427 | DEBUG    | __main__:trials:29 - Trial = 27007/30000 | Total reward = 46.59
2022-01-26 14:18:37.431 | DEBUG    | __main__:trials:24 - Trial = 27008/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.432 | DEBUG    | __main__:trials:29 - Trial = 27008/30000 | Total reward = 38.54
2022-01-26 14:18:37.435 | DEBUG    | __main__:trials:24 - Trial = 27009/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.437 | DEBUG    | __main__:trials:29 - Trial = 27009/30000 | Total reward = 45.62
2022-01-26 14:18:37.441 | DEBUG    | __main__:trials:24 - Trial = 27010/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.442 | DEBUG    | __main__:trials:29 - Trial = 27010/30000 | Total reward = 43.98
2022-01-26 14:18:37.445 | DEBUG    | __main__:trials:24 - Trial = 27011/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.447 | DEBUG    | __main__:trials:29 - Trial = 27011/30000 | Total reward = 41.70
2022-01-26 14:18:37.450 | DEBUG    | __main__:trials:24 - Trial = 27012/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.450 | DEBUG    | __main__:trials:29 - Trial = 27012/30000 | Total reward = 16.24
2022-01-26 14:18:37.454 | DEBUG    | __main__:trials:24 - Trial = 27013/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.455 | DEBUG    | __main__:trials:29 - Trial = 27013/30000 | Total reward = 41.04
2022-01-26 14:18:37.459 | DEBUG    | __main__:trials:24 - Trial = 27014/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.460 | DEBUG    | __main__:trials:29 - Trial = 27014/30000 | Total reward = 38.22
2022-01-26 14:18:37.463 | DEBUG    | __main__:trials:24 - Trial = 27015/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.465 | DEBUG    | __main__:trials:29 - Trial = 27015/30000 | Total reward = 38.68
2022-01-26 14:18:37.468 | DEBUG    | __main__:trials:24 - Trial = 27016/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.470 | DEBUG    | __main__:trials:29 - Trial = 27016/30000 | Total reward = 37.04
2022-01-26 14:18:37.474 | DEBUG    | __main__:trials:24 - Trial = 27017/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.476 | DEBUG    | __main__:trials:29 - Trial = 27017/30000 | Total reward = 32.41
2022-01-26 14:18:37.478 | DEBUG    | __main__:trials:26 - Trial = 27018/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.480 | DEBUG    | __main__:trials:29 - Trial = 27018/30000 | Total reward = 22.76
2022-01-26 14:18:37.484 | DEBUG    | __main__:trials:24 - Trial = 27019/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.485 | DEBUG    | __main__:trials:29 - Trial = 27019/30000 | Total reward = 42.15
2022-01-26 14:18:37.488 | DEBUG    | __main__:trials:26 - Trial = 27020/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.489 | DEBUG    | __main__:trials:29 - Trial = 27020/30000 | Total reward = 21.55
2022-01-26 14:18:37.492 | DEBUG    | __main__:trials:24 - Trial = 27021/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.493 | DEBUG    | __main__:trials:29 - Trial = 27021/30000 | Total reward = 43.51
2022-01-26 14:18:37.497 | DEBUG    | __main__:trials:26 - Trial = 27022/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.498 | DEBUG    | __main__:trials:29 - Trial = 27022/30000 | Total reward = 20.95
2022-01-26 14:18:37.502 | DEBUG    | __main__:trials:24 - Trial = 27023/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.503 | DEBUG    | __main__:trials:29 - Trial = 27023/30000 | Total reward = 36.15
2022-01-26 14:18:37.507 | DEBUG    | __main__:trials:24 - Trial = 27024/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.508 | DEBUG    | __main__:trials:29 - Trial = 27024/30000 | Total reward = 39.08
2022-01-26 14:18:37.512 | DEBUG    | __main__:trials:26 - Trial = 27025/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.514 | DEBUG    | __main__:trials:29 - Trial = 27025/30000 | Total reward = 22.36
2022-01-26 14:18:37.517 | DEBUG    | __main__:trials:24 - Trial = 27026/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.519 | DEBUG    | __main__:trials:29 - Trial = 27026/30000 | Total reward = 45.57
2022-01-26 14:18:37.522 | DEBUG    | __main__:trials:24 - Trial = 27027/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.524 | DEBUG    | __main__:trials:29 - Trial = 27027/30000 | Total reward = 45.62
2022-01-26 14:18:37.528 | DEBUG    | __main__:trials:24 - Trial = 27028/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.529 | DEBUG    | __main__:trials:29 - Trial = 27028/30000 | Total reward = 37.63
2022-01-26 14:18:37.532 | DEBUG    | __main__:trials:26 - Trial = 27029/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.534 | DEBUG    | __main__:trials:29 - Trial = 27029/30000 | Total reward = 20.24
2022-01-26 14:18:37.537 | DEBUG    | __main__:trials:24 - Trial = 27030/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.539 | DEBUG    | __main__:trials:29 - Trial = 27030/30000 | Total reward = 42.65
2022-01-26 14:18:37.542 | DEBUG    | __main__:trials:24 - Trial = 27031/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.544 | DEBUG    | __main__:trials:29 - Trial = 27031/30000 | Total reward = 42.54
2022-01-26 14:18:37.547 | DEBUG    | __main__:trials:24 - Trial = 27032/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.549 | DEBUG    | __main__:trials:29 - Trial = 27032/30000 | Total reward = 39.66
2022-01-26 14:18:37.552 | DEBUG    | __main__:trials:24 - Trial = 27033/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.553 | DEBUG    | __main__:trials:29 - Trial = 27033/30000 | Total reward = 42.17
2022-01-26 14:18:37.557 | DEBUG    | __main__:trials:24 - Trial = 27034/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.559 | DEBUG    | __main__:trials:29 - Trial = 27034/30000 | Total reward = 41.35
2022-01-26 14:18:37.562 | DEBUG    | __main__:trials:26 - Trial = 27035/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.563 | DEBUG    | __main__:trials:29 - Trial = 27035/30000 | Total reward = 14.89
2022-01-26 14:18:37.567 | DEBUG    | __main__:trials:24 - Trial = 27036/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.568 | DEBUG    | __main__:trials:29 - Trial = 27036/30000 | Total reward = 42.15
2022-01-26 14:18:37.572 | DEBUG    | __main__:trials:24 - Trial = 27037/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.573 | DEBUG    | __main__:trials:29 - Trial = 27037/30000 | Total reward = 35.25
2022-01-26 14:18:37.577 | DEBUG    | __main__:trials:24 - Trial = 27038/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.579 | DEBUG    | __main__:trials:29 - Trial = 27038/30000 | Total reward = 35.87
2022-01-26 14:18:37.582 | DEBUG    | __main__:trials:24 - Trial = 27039/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.584 | DEBUG    | __main__:trials:29 - Trial = 27039/30000 | Total reward = 40.17
2022-01-26 14:18:37.586 | DEBUG    | __main__:trials:24 - Trial = 27040/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.588 | DEBUG    | __main__:trials:29 - Trial = 27040/30000 | Total reward = 39.00
2022-01-26 14:18:37.591 | DEBUG    | __main__:trials:24 - Trial = 27041/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.593 | DEBUG    | __main__:trials:29 - Trial = 27041/30000 | Total reward = 40.21
2022-01-26 14:18:37.597 | DEBUG    | __main__:trials:26 - Trial = 27042/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.598 | DEBUG    | __main__:trials:29 - Trial = 27042/30000 | Total reward = 30.57
2022-01-26 14:18:37.602 | DEBUG    | __main__:trials:24 - Trial = 27043/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.603 | DEBUG    | __main__:trials:29 - Trial = 27043/30000 | Total reward = 42.15
2022-01-26 14:18:37.607 | DEBUG    | __main__:trials:26 - Trial = 27044/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.608 | DEBUG    | __main__:trials:29 - Trial = 27044/30000 | Total reward = 24.73
2022-01-26 14:18:37.611 | DEBUG    | __main__:trials:24 - Trial = 27045/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.613 | DEBUG    | __main__:trials:29 - Trial = 27045/30000 | Total reward = 40.30
2022-01-26 14:18:37.616 | DEBUG    | __main__:trials:24 - Trial = 27046/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.618 | DEBUG    | __main__:trials:29 - Trial = 27046/30000 | Total reward = 42.15
2022-01-26 14:18:37.621 | DEBUG    | __main__:trials:26 - Trial = 27047/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.623 | DEBUG    | __main__:trials:29 - Trial = 27047/30000 | Total reward = 15.53
2022-01-26 14:18:37.626 | DEBUG    | __main__:trials:24 - Trial = 27048/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.628 | DEBUG    | __main__:trials:29 - Trial = 27048/30000 | Total reward = 43.84
2022-01-26 14:18:37.631 | DEBUG    | __main__:trials:24 - Trial = 27049/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.632 | DEBUG    | __main__:trials:29 - Trial = 27049/30000 | Total reward = 49.12
2022-01-26 14:18:37.636 | DEBUG    | __main__:trials:24 - Trial = 27050/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.638 | DEBUG    | __main__:trials:29 - Trial = 27050/30000 | Total reward = 42.25
2022-01-26 14:18:37.641 | DEBUG    | __main__:trials:24 - Trial = 27051/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.643 | DEBUG    | __main__:trials:29 - Trial = 27051/30000 | Total reward = 49.35
2022-01-26 14:18:37.646 | DEBUG    | __main__:trials:24 - Trial = 27052/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.647 | DEBUG    | __main__:trials:29 - Trial = 27052/30000 | Total reward = 35.78
2022-01-26 14:18:37.651 | DEBUG    | __main__:trials:24 - Trial = 27053/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.653 | DEBUG    | __main__:trials:29 - Trial = 27053/30000 | Total reward = 53.23
2022-01-26 14:18:37.657 | DEBUG    | __main__:trials:24 - Trial = 27054/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.659 | DEBUG    | __main__:trials:29 - Trial = 27054/30000 | Total reward = 44.54
2022-01-26 14:18:37.663 | DEBUG    | __main__:trials:24 - Trial = 27055/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.664 | DEBUG    | __main__:trials:29 - Trial = 27055/30000 | Total reward = 38.54
2022-01-26 14:18:37.668 | DEBUG    | __main__:trials:24 - Trial = 27056/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.669 | DEBUG    | __main__:trials:29 - Trial = 27056/30000 | Total reward = 44.54
2022-01-26 14:18:37.673 | DEBUG    | __main__:trials:24 - Trial = 27057/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.675 | DEBUG    | __main__:trials:29 - Trial = 27057/30000 | Total reward = 21.73
2022-01-26 14:18:37.678 | DEBUG    | __main__:trials:24 - Trial = 27058/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.679 | DEBUG    | __main__:trials:29 - Trial = 27058/30000 | Total reward = 40.58
2022-01-26 14:18:37.683 | DEBUG    | __main__:trials:24 - Trial = 27059/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.685 | DEBUG    | __main__:trials:29 - Trial = 27059/30000 | Total reward = 30.66
2022-01-26 14:18:37.688 | DEBUG    | __main__:trials:24 - Trial = 27060/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.689 | DEBUG    | __main__:trials:29 - Trial = 27060/30000 | Total reward = 54.47
2022-01-26 14:18:37.692 | DEBUG    | __main__:trials:24 - Trial = 27061/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.693 | DEBUG    | __main__:trials:29 - Trial = 27061/30000 | Total reward = 42.15
2022-01-26 14:18:37.696 | DEBUG    | __main__:trials:24 - Trial = 27062/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.697 | DEBUG    | __main__:trials:29 - Trial = 27062/30000 | Total reward = 41.65
2022-01-26 14:18:37.701 | DEBUG    | __main__:trials:26 - Trial = 27063/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.702 | DEBUG    | __main__:trials:29 - Trial = 27063/30000 | Total reward = 25.59
2022-01-26 14:18:37.705 | DEBUG    | __main__:trials:24 - Trial = 27064/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.706 | DEBUG    | __main__:trials:29 - Trial = 27064/30000 | Total reward = 30.13
2022-01-26 14:18:37.710 | DEBUG    | __main__:trials:24 - Trial = 27065/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.712 | DEBUG    | __main__:trials:29 - Trial = 27065/30000 | Total reward = 42.66
2022-01-26 14:18:37.715 | DEBUG    | __main__:trials:24 - Trial = 27066/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.716 | DEBUG    | __main__:trials:29 - Trial = 27066/30000 | Total reward = 50.84
2022-01-26 14:18:37.720 | DEBUG    | __main__:trials:24 - Trial = 27067/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.722 | DEBUG    | __main__:trials:29 - Trial = 27067/30000 | Total reward = 33.81
2022-01-26 14:18:37.725 | DEBUG    | __main__:trials:24 - Trial = 27068/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.727 | DEBUG    | __main__:trials:29 - Trial = 27068/30000 | Total reward = 38.38
2022-01-26 14:18:37.730 | DEBUG    | __main__:trials:26 - Trial = 27069/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.732 | DEBUG    | __main__:trials:29 - Trial = 27069/30000 | Total reward = 19.59
2022-01-26 14:18:37.735 | DEBUG    | __main__:trials:24 - Trial = 27070/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.736 | DEBUG    | __main__:trials:29 - Trial = 27070/30000 | Total reward = 36.75
2022-01-26 14:18:37.740 | DEBUG    | __main__:trials:24 - Trial = 27071/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.742 | DEBUG    | __main__:trials:29 - Trial = 27071/30000 | Total reward = 44.69
2022-01-26 14:18:37.745 | DEBUG    | __main__:trials:24 - Trial = 27072/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.747 | DEBUG    | __main__:trials:29 - Trial = 27072/30000 | Total reward = 32.52
2022-01-26 14:18:37.751 | DEBUG    | __main__:trials:24 - Trial = 27073/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.752 | DEBUG    | __main__:trials:29 - Trial = 27073/30000 | Total reward = 40.05
2022-01-26 14:18:37.756 | DEBUG    | __main__:trials:24 - Trial = 27074/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.758 | DEBUG    | __main__:trials:29 - Trial = 27074/30000 | Total reward = 28.74
2022-01-26 14:18:37.762 | DEBUG    | __main__:trials:24 - Trial = 27075/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.762 | DEBUG    | __main__:trials:29 - Trial = 27075/30000 | Total reward = 40.12
2022-01-26 14:18:37.766 | DEBUG    | __main__:trials:24 - Trial = 27076/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.768 | DEBUG    | __main__:trials:29 - Trial = 27076/30000 | Total reward = 39.76
2022-01-26 14:18:37.772 | DEBUG    | __main__:trials:24 - Trial = 27077/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.773 | DEBUG    | __main__:trials:29 - Trial = 27077/30000 | Total reward = 25.52
2022-01-26 14:18:37.776 | DEBUG    | __main__:trials:24 - Trial = 27078/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.778 | DEBUG    | __main__:trials:29 - Trial = 27078/30000 | Total reward = 38.35
2022-01-26 14:18:37.782 | DEBUG    | __main__:trials:24 - Trial = 27079/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.782 | DEBUG    | __main__:trials:29 - Trial = 27079/30000 | Total reward = 44.87
2022-01-26 14:18:37.787 | DEBUG    | __main__:trials:24 - Trial = 27080/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.789 | DEBUG    | __main__:trials:29 - Trial = 27080/30000 | Total reward = 42.69
2022-01-26 14:18:37.792 | DEBUG    | __main__:trials:24 - Trial = 27081/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.794 | DEBUG    | __main__:trials:29 - Trial = 27081/30000 | Total reward = 41.00
2022-01-26 14:18:37.797 | DEBUG    | __main__:trials:24 - Trial = 27082/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.799 | DEBUG    | __main__:trials:29 - Trial = 27082/30000 | Total reward = 39.73
2022-01-26 14:18:37.802 | DEBUG    | __main__:trials:24 - Trial = 27083/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.803 | DEBUG    | __main__:trials:29 - Trial = 27083/30000 | Total reward = 46.28
2022-01-26 14:18:37.806 | DEBUG    | __main__:trials:24 - Trial = 27084/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.808 | DEBUG    | __main__:trials:29 - Trial = 27084/30000 | Total reward = 36.64
2022-01-26 14:18:37.812 | DEBUG    | __main__:trials:24 - Trial = 27085/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.813 | DEBUG    | __main__:trials:29 - Trial = 27085/30000 | Total reward = 36.36
2022-01-26 14:18:37.817 | DEBUG    | __main__:trials:24 - Trial = 27086/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.818 | DEBUG    | __main__:trials:29 - Trial = 27086/30000 | Total reward = 44.87
2022-01-26 14:18:37.822 | DEBUG    | __main__:trials:24 - Trial = 27087/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.823 | DEBUG    | __main__:trials:29 - Trial = 27087/30000 | Total reward = 39.76
2022-01-26 14:18:37.826 | DEBUG    | __main__:trials:26 - Trial = 27088/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.828 | DEBUG    | __main__:trials:29 - Trial = 27088/30000 | Total reward = 21.59
2022-01-26 14:18:37.832 | DEBUG    | __main__:trials:24 - Trial = 27089/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.833 | DEBUG    | __main__:trials:29 - Trial = 27089/30000 | Total reward = 35.85
2022-01-26 14:18:37.836 | DEBUG    | __main__:trials:24 - Trial = 27090/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.838 | DEBUG    | __main__:trials:29 - Trial = 27090/30000 | Total reward = 26.85
2022-01-26 14:18:37.841 | DEBUG    | __main__:trials:24 - Trial = 27091/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.843 | DEBUG    | __main__:trials:29 - Trial = 27091/30000 | Total reward = 32.18
2022-01-26 14:18:37.846 | DEBUG    | __main__:trials:24 - Trial = 27092/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.848 | DEBUG    | __main__:trials:29 - Trial = 27092/30000 | Total reward = 38.91
2022-01-26 14:18:37.850 | DEBUG    | __main__:trials:24 - Trial = 27093/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.852 | DEBUG    | __main__:trials:29 - Trial = 27093/30000 | Total reward = 49.68
2022-01-26 14:18:37.856 | DEBUG    | __main__:trials:24 - Trial = 27094/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.858 | DEBUG    | __main__:trials:29 - Trial = 27094/30000 | Total reward = 43.23
2022-01-26 14:18:37.861 | DEBUG    | __main__:trials:24 - Trial = 27095/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.863 | DEBUG    | __main__:trials:29 - Trial = 27095/30000 | Total reward = 42.15
2022-01-26 14:18:37.867 | DEBUG    | __main__:trials:24 - Trial = 27096/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.868 | DEBUG    | __main__:trials:29 - Trial = 27096/30000 | Total reward = 37.44
2022-01-26 14:18:37.872 | DEBUG    | __main__:trials:24 - Trial = 27097/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.873 | DEBUG    | __main__:trials:29 - Trial = 27097/30000 | Total reward = 45.03
2022-01-26 14:18:37.876 | DEBUG    | __main__:trials:24 - Trial = 27098/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.878 | DEBUG    | __main__:trials:29 - Trial = 27098/30000 | Total reward = 38.57
2022-01-26 14:18:37.881 | DEBUG    | __main__:trials:26 - Trial = 27099/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.882 | DEBUG    | __main__:trials:29 - Trial = 27099/30000 | Total reward = 19.52
2022-01-26 14:18:37.886 | DEBUG    | __main__:trials:24 - Trial = 27100/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.888 | DEBUG    | __main__:trials:29 - Trial = 27100/30000 | Total reward = 49.31
2022-01-26 14:18:37.892 | DEBUG    | __main__:trials:24 - Trial = 27101/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.893 | DEBUG    | __main__:trials:29 - Trial = 27101/30000 | Total reward = 41.97
2022-01-26 14:18:37.896 | DEBUG    | __main__:trials:24 - Trial = 27102/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.898 | DEBUG    | __main__:trials:29 - Trial = 27102/30000 | Total reward = 45.55
2022-01-26 14:18:37.901 | DEBUG    | __main__:trials:24 - Trial = 27103/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.903 | DEBUG    | __main__:trials:29 - Trial = 27103/30000 | Total reward = 45.38
2022-01-26 14:18:37.906 | DEBUG    | __main__:trials:24 - Trial = 27104/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.908 | DEBUG    | __main__:trials:29 - Trial = 27104/30000 | Total reward = 23.31
2022-01-26 14:18:37.911 | DEBUG    | __main__:trials:24 - Trial = 27105/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.913 | DEBUG    | __main__:trials:29 - Trial = 27105/30000 | Total reward = 46.09
2022-01-26 14:18:37.916 | DEBUG    | __main__:trials:24 - Trial = 27106/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.918 | DEBUG    | __main__:trials:29 - Trial = 27106/30000 | Total reward = 42.33
2022-01-26 14:18:37.921 | DEBUG    | __main__:trials:26 - Trial = 27107/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.922 | DEBUG    | __main__:trials:29 - Trial = 27107/30000 | Total reward = 12.98
2022-01-26 14:18:37.925 | DEBUG    | __main__:trials:24 - Trial = 27108/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.927 | DEBUG    | __main__:trials:29 - Trial = 27108/30000 | Total reward = 45.63
2022-01-26 14:18:37.930 | DEBUG    | __main__:trials:24 - Trial = 27109/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.932 | DEBUG    | __main__:trials:29 - Trial = 27109/30000 | Total reward = 36.18
2022-01-26 14:18:37.935 | DEBUG    | __main__:trials:24 - Trial = 27110/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.937 | DEBUG    | __main__:trials:29 - Trial = 27110/30000 | Total reward = 34.02
2022-01-26 14:18:37.940 | DEBUG    | __main__:trials:24 - Trial = 27111/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.942 | DEBUG    | __main__:trials:29 - Trial = 27111/30000 | Total reward = 39.76
2022-01-26 14:18:37.945 | DEBUG    | __main__:trials:24 - Trial = 27112/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.947 | DEBUG    | __main__:trials:29 - Trial = 27112/30000 | Total reward = 66.84
2022-01-26 14:18:37.951 | DEBUG    | __main__:trials:24 - Trial = 27113/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.952 | DEBUG    | __main__:trials:29 - Trial = 27113/30000 | Total reward = 48.42
2022-01-26 14:18:37.956 | DEBUG    | __main__:trials:24 - Trial = 27114/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.957 | DEBUG    | __main__:trials:29 - Trial = 27114/30000 | Total reward = 36.72
2022-01-26 14:18:37.961 | DEBUG    | __main__:trials:26 - Trial = 27115/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.962 | DEBUG    | __main__:trials:29 - Trial = 27115/30000 | Total reward = 12.18
2022-01-26 14:18:37.966 | DEBUG    | __main__:trials:24 - Trial = 27116/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.967 | DEBUG    | __main__:trials:29 - Trial = 27116/30000 | Total reward = 24.93
2022-01-26 14:18:37.971 | DEBUG    | __main__:trials:24 - Trial = 27117/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.972 | DEBUG    | __main__:trials:29 - Trial = 27117/30000 | Total reward = 32.12
2022-01-26 14:18:37.976 | DEBUG    | __main__:trials:24 - Trial = 27118/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.978 | DEBUG    | __main__:trials:29 - Trial = 27118/30000 | Total reward = 47.45
2022-01-26 14:18:37.981 | DEBUG    | __main__:trials:24 - Trial = 27119/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.983 | DEBUG    | __main__:trials:29 - Trial = 27119/30000 | Total reward = 48.77
2022-01-26 14:18:37.986 | DEBUG    | __main__:trials:24 - Trial = 27120/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.988 | DEBUG    | __main__:trials:29 - Trial = 27120/30000 | Total reward = 40.02
2022-01-26 14:18:37.991 | DEBUG    | __main__:trials:26 - Trial = 27121/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:37.991 | DEBUG    | __main__:trials:29 - Trial = 27121/30000 | Total reward = 15.13
2022-01-26 14:18:37.995 | DEBUG    | __main__:trials:24 - Trial = 27122/30000 | Max number of steps (20) reached
2022-01-26 14:18:37.996 | DEBUG    | __main__:trials:29 - Trial = 27122/30000 | Total reward = 38.97
2022-01-26 14:18:38.000 | DEBUG    | __main__:trials:24 - Trial = 27123/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.002 | DEBUG    | __main__:trials:29 - Trial = 27123/30000 | Total reward = 25.76
2022-01-26 14:18:38.006 | DEBUG    | __main__:trials:24 - Trial = 27124/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.006 | DEBUG    | __main__:trials:29 - Trial = 27124/30000 | Total reward = 29.46
2022-01-26 14:18:38.010 | DEBUG    | __main__:trials:24 - Trial = 27125/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.012 | DEBUG    | __main__:trials:29 - Trial = 27125/30000 | Total reward = 54.17
2022-01-26 14:18:38.016 | DEBUG    | __main__:trials:24 - Trial = 27126/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.017 | DEBUG    | __main__:trials:29 - Trial = 27126/30000 | Total reward = 45.14
2022-01-26 14:18:38.020 | DEBUG    | __main__:trials:24 - Trial = 27127/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.021 | DEBUG    | __main__:trials:29 - Trial = 27127/30000 | Total reward = 52.58
2022-01-26 14:18:38.025 | DEBUG    | __main__:trials:24 - Trial = 27128/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.026 | DEBUG    | __main__:trials:29 - Trial = 27128/30000 | Total reward = 31.40
2022-01-26 14:18:38.029 | DEBUG    | __main__:trials:24 - Trial = 27129/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.031 | DEBUG    | __main__:trials:29 - Trial = 27129/30000 | Total reward = 29.57
2022-01-26 14:18:38.034 | DEBUG    | __main__:trials:24 - Trial = 27130/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.036 | DEBUG    | __main__:trials:29 - Trial = 27130/30000 | Total reward = 39.21
2022-01-26 14:18:38.039 | DEBUG    | __main__:trials:24 - Trial = 27131/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.040 | DEBUG    | __main__:trials:29 - Trial = 27131/30000 | Total reward = 42.91
2022-01-26 14:18:38.043 | DEBUG    | __main__:trials:24 - Trial = 27132/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.045 | DEBUG    | __main__:trials:29 - Trial = 27132/30000 | Total reward = 44.13
2022-01-26 14:18:38.048 | DEBUG    | __main__:trials:24 - Trial = 27133/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.049 | DEBUG    | __main__:trials:29 - Trial = 27133/30000 | Total reward = 41.02
2022-01-26 14:18:38.052 | DEBUG    | __main__:trials:24 - Trial = 27134/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.054 | DEBUG    | __main__:trials:29 - Trial = 27134/30000 | Total reward = 36.58
2022-01-26 14:18:38.058 | DEBUG    | __main__:trials:24 - Trial = 27135/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.058 | DEBUG    | __main__:trials:29 - Trial = 27135/30000 | Total reward = 34.95
2022-01-26 14:18:38.063 | DEBUG    | __main__:trials:24 - Trial = 27136/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.064 | DEBUG    | __main__:trials:29 - Trial = 27136/30000 | Total reward = 47.72
2022-01-26 14:18:38.068 | DEBUG    | __main__:trials:24 - Trial = 27137/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.069 | DEBUG    | __main__:trials:29 - Trial = 27137/30000 | Total reward = 52.71
2022-01-26 14:18:38.073 | DEBUG    | __main__:trials:24 - Trial = 27138/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.074 | DEBUG    | __main__:trials:29 - Trial = 27138/30000 | Total reward = 37.89
2022-01-26 14:18:38.077 | DEBUG    | __main__:trials:24 - Trial = 27139/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.078 | DEBUG    | __main__:trials:29 - Trial = 27139/30000 | Total reward = 41.74
2022-01-26 14:18:38.082 | DEBUG    | __main__:trials:24 - Trial = 27140/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.083 | DEBUG    | __main__:trials:29 - Trial = 27140/30000 | Total reward = 42.15
2022-01-26 14:18:38.086 | DEBUG    | __main__:trials:24 - Trial = 27141/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.087 | DEBUG    | __main__:trials:29 - Trial = 27141/30000 | Total reward = 38.28
2022-01-26 14:18:38.092 | DEBUG    | __main__:trials:24 - Trial = 27142/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.093 | DEBUG    | __main__:trials:29 - Trial = 27142/30000 | Total reward = 51.03
2022-01-26 14:18:38.096 | DEBUG    | __main__:trials:24 - Trial = 27143/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.097 | DEBUG    | __main__:trials:29 - Trial = 27143/30000 | Total reward = 46.80
2022-01-26 14:18:38.100 | DEBUG    | __main__:trials:24 - Trial = 27144/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.102 | DEBUG    | __main__:trials:29 - Trial = 27144/30000 | Total reward = 29.54
2022-01-26 14:18:38.106 | DEBUG    | __main__:trials:24 - Trial = 27145/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.106 | DEBUG    | __main__:trials:29 - Trial = 27145/30000 | Total reward = 43.26
2022-01-26 14:18:38.110 | DEBUG    | __main__:trials:26 - Trial = 27146/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.111 | DEBUG    | __main__:trials:29 - Trial = 27146/30000 | Total reward = 13.08
2022-01-26 14:18:38.115 | DEBUG    | __main__:trials:24 - Trial = 27147/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.117 | DEBUG    | __main__:trials:29 - Trial = 27147/30000 | Total reward = 42.15
2022-01-26 14:18:38.120 | DEBUG    | __main__:trials:24 - Trial = 27148/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.122 | DEBUG    | __main__:trials:29 - Trial = 27148/30000 | Total reward = 37.98
2022-01-26 14:18:38.125 | DEBUG    | __main__:trials:26 - Trial = 27149/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.126 | DEBUG    | __main__:trials:29 - Trial = 27149/30000 | Total reward = 14.58
2022-01-26 14:18:38.130 | DEBUG    | __main__:trials:24 - Trial = 27150/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.130 | DEBUG    | __main__:trials:29 - Trial = 27150/30000 | Total reward = 38.01
2022-01-26 14:18:38.135 | DEBUG    | __main__:trials:24 - Trial = 27151/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.137 | DEBUG    | __main__:trials:29 - Trial = 27151/30000 | Total reward = 42.15
2022-01-26 14:18:38.139 | DEBUG    | __main__:trials:24 - Trial = 27152/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.141 | DEBUG    | __main__:trials:29 - Trial = 27152/30000 | Total reward = 52.59
2022-01-26 14:18:38.145 | DEBUG    | __main__:trials:24 - Trial = 27153/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.146 | DEBUG    | __main__:trials:29 - Trial = 27153/30000 | Total reward = 31.47
2022-01-26 14:18:38.150 | DEBUG    | __main__:trials:24 - Trial = 27154/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.150 | DEBUG    | __main__:trials:29 - Trial = 27154/30000 | Total reward = 45.93
2022-01-26 14:18:38.154 | DEBUG    | __main__:trials:24 - Trial = 27155/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.155 | DEBUG    | __main__:trials:29 - Trial = 27155/30000 | Total reward = 41.81
2022-01-26 14:18:38.159 | DEBUG    | __main__:trials:24 - Trial = 27156/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.160 | DEBUG    | __main__:trials:29 - Trial = 27156/30000 | Total reward = 40.65
2022-01-26 14:18:38.163 | DEBUG    | __main__:trials:26 - Trial = 27157/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.163 | DEBUG    | __main__:trials:29 - Trial = 27157/30000 | Total reward = 18.93
2022-01-26 14:18:38.167 | DEBUG    | __main__:trials:24 - Trial = 27158/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.168 | DEBUG    | __main__:trials:29 - Trial = 27158/30000 | Total reward = 37.43
2022-01-26 14:18:38.171 | DEBUG    | __main__:trials:24 - Trial = 27159/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.173 | DEBUG    | __main__:trials:29 - Trial = 27159/30000 | Total reward = 40.26
2022-01-26 14:18:38.176 | DEBUG    | __main__:trials:24 - Trial = 27160/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.177 | DEBUG    | __main__:trials:29 - Trial = 27160/30000 | Total reward = 27.45
2022-01-26 14:18:38.180 | DEBUG    | __main__:trials:24 - Trial = 27161/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.181 | DEBUG    | __main__:trials:29 - Trial = 27161/30000 | Total reward = 41.36
2022-01-26 14:18:38.183 | DEBUG    | __main__:trials:26 - Trial = 27162/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.184 | DEBUG    | __main__:trials:29 - Trial = 27162/30000 | Total reward = 9.48
2022-01-26 14:18:38.188 | DEBUG    | __main__:trials:24 - Trial = 27163/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.189 | DEBUG    | __main__:trials:29 - Trial = 27163/30000 | Total reward = 43.83
2022-01-26 14:18:38.192 | DEBUG    | __main__:trials:24 - Trial = 27164/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.194 | DEBUG    | __main__:trials:29 - Trial = 27164/30000 | Total reward = 41.18
2022-01-26 14:18:38.197 | DEBUG    | __main__:trials:26 - Trial = 27165/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.197 | DEBUG    | __main__:trials:29 - Trial = 27165/30000 | Total reward = 17.59
2022-01-26 14:18:38.201 | DEBUG    | __main__:trials:24 - Trial = 27166/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.202 | DEBUG    | __main__:trials:29 - Trial = 27166/30000 | Total reward = 39.94
2022-01-26 14:18:38.205 | DEBUG    | __main__:trials:24 - Trial = 27167/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.206 | DEBUG    | __main__:trials:29 - Trial = 27167/30000 | Total reward = 46.60
2022-01-26 14:18:38.208 | DEBUG    | __main__:trials:26 - Trial = 27168/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.210 | DEBUG    | __main__:trials:29 - Trial = 27168/30000 | Total reward = 14.95
2022-01-26 14:18:38.213 | DEBUG    | __main__:trials:24 - Trial = 27169/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.215 | DEBUG    | __main__:trials:29 - Trial = 27169/30000 | Total reward = 46.08
2022-01-26 14:18:38.219 | DEBUG    | __main__:trials:24 - Trial = 27170/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.220 | DEBUG    | __main__:trials:29 - Trial = 27170/30000 | Total reward = 47.90
2022-01-26 14:18:38.223 | DEBUG    | __main__:trials:26 - Trial = 27171/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.225 | DEBUG    | __main__:trials:29 - Trial = 27171/30000 | Total reward = 15.02
2022-01-26 14:18:38.228 | DEBUG    | __main__:trials:26 - Trial = 27172/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.229 | DEBUG    | __main__:trials:29 - Trial = 27172/30000 | Total reward = 17.71
2022-01-26 14:18:38.233 | DEBUG    | __main__:trials:24 - Trial = 27173/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.234 | DEBUG    | __main__:trials:29 - Trial = 27173/30000 | Total reward = 41.74
2022-01-26 14:18:38.238 | DEBUG    | __main__:trials:24 - Trial = 27174/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.239 | DEBUG    | __main__:trials:29 - Trial = 27174/30000 | Total reward = 45.62
2022-01-26 14:18:38.243 | DEBUG    | __main__:trials:26 - Trial = 27175/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.245 | DEBUG    | __main__:trials:29 - Trial = 27175/30000 | Total reward = 14.24
2022-01-26 14:18:38.248 | DEBUG    | __main__:trials:24 - Trial = 27176/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.249 | DEBUG    | __main__:trials:29 - Trial = 27176/30000 | Total reward = 39.11
2022-01-26 14:18:38.254 | DEBUG    | __main__:trials:26 - Trial = 27177/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.254 | DEBUG    | __main__:trials:29 - Trial = 27177/30000 | Total reward = 33.61
2022-01-26 14:18:38.259 | DEBUG    | __main__:trials:24 - Trial = 27178/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.260 | DEBUG    | __main__:trials:29 - Trial = 27178/30000 | Total reward = 60.15
2022-01-26 14:18:38.264 | DEBUG    | __main__:trials:24 - Trial = 27179/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.265 | DEBUG    | __main__:trials:29 - Trial = 27179/30000 | Total reward = 41.24
2022-01-26 14:18:38.269 | DEBUG    | __main__:trials:24 - Trial = 27180/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.270 | DEBUG    | __main__:trials:29 - Trial = 27180/30000 | Total reward = 39.77
2022-01-26 14:18:38.274 | DEBUG    | __main__:trials:24 - Trial = 27181/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.276 | DEBUG    | __main__:trials:29 - Trial = 27181/30000 | Total reward = 37.48
2022-01-26 14:18:38.280 | DEBUG    | __main__:trials:24 - Trial = 27182/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.282 | DEBUG    | __main__:trials:29 - Trial = 27182/30000 | Total reward = 30.71
2022-01-26 14:18:38.285 | DEBUG    | __main__:trials:26 - Trial = 27183/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.287 | DEBUG    | __main__:trials:29 - Trial = 27183/30000 | Total reward = 22.94
2022-01-26 14:18:38.290 | DEBUG    | __main__:trials:24 - Trial = 27184/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.292 | DEBUG    | __main__:trials:29 - Trial = 27184/30000 | Total reward = 42.15
2022-01-26 14:18:38.294 | DEBUG    | __main__:trials:26 - Trial = 27185/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.296 | DEBUG    | __main__:trials:29 - Trial = 27185/30000 | Total reward = 30.00
2022-01-26 14:18:38.300 | DEBUG    | __main__:trials:24 - Trial = 27186/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.300 | DEBUG    | __main__:trials:29 - Trial = 27186/30000 | Total reward = 35.83
2022-01-26 14:18:38.304 | DEBUG    | __main__:trials:24 - Trial = 27187/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.306 | DEBUG    | __main__:trials:29 - Trial = 27187/30000 | Total reward = 49.15
2022-01-26 14:18:38.309 | DEBUG    | __main__:trials:24 - Trial = 27188/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.311 | DEBUG    | __main__:trials:29 - Trial = 27188/30000 | Total reward = 31.02
2022-01-26 14:18:38.314 | DEBUG    | __main__:trials:24 - Trial = 27189/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.316 | DEBUG    | __main__:trials:29 - Trial = 27189/30000 | Total reward = 41.28
2022-01-26 14:18:38.320 | DEBUG    | __main__:trials:24 - Trial = 27190/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.321 | DEBUG    | __main__:trials:29 - Trial = 27190/30000 | Total reward = 53.06
2022-01-26 14:18:38.324 | DEBUG    | __main__:trials:26 - Trial = 27191/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.325 | DEBUG    | __main__:trials:29 - Trial = 27191/30000 | Total reward = 20.76
2022-01-26 14:18:38.328 | DEBUG    | __main__:trials:24 - Trial = 27192/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.330 | DEBUG    | __main__:trials:29 - Trial = 27192/30000 | Total reward = 28.42
2022-01-26 14:18:38.333 | DEBUG    | __main__:trials:24 - Trial = 27193/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.335 | DEBUG    | __main__:trials:29 - Trial = 27193/30000 | Total reward = 39.38
2022-01-26 14:18:38.339 | DEBUG    | __main__:trials:26 - Trial = 27194/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.340 | DEBUG    | __main__:trials:29 - Trial = 27194/30000 | Total reward = 25.82
2022-01-26 14:18:38.344 | DEBUG    | __main__:trials:24 - Trial = 27195/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.346 | DEBUG    | __main__:trials:29 - Trial = 27195/30000 | Total reward = 38.80
2022-01-26 14:18:38.349 | DEBUG    | __main__:trials:26 - Trial = 27196/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.351 | DEBUG    | __main__:trials:29 - Trial = 27196/30000 | Total reward = 16.65
2022-01-26 14:18:38.354 | DEBUG    | __main__:trials:24 - Trial = 27197/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.356 | DEBUG    | __main__:trials:29 - Trial = 27197/30000 | Total reward = 35.86
2022-01-26 14:18:38.360 | DEBUG    | __main__:trials:24 - Trial = 27198/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.361 | DEBUG    | __main__:trials:29 - Trial = 27198/30000 | Total reward = 19.51
2022-01-26 14:18:38.363 | DEBUG    | __main__:trials:26 - Trial = 27199/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.364 | DEBUG    | __main__:trials:29 - Trial = 27199/30000 | Total reward = 9.48
2022-01-26 14:18:38.368 | DEBUG    | __main__:trials:24 - Trial = 27200/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.369 | DEBUG    | __main__:trials:29 - Trial = 27200/30000 | Total reward = 32.28
2022-01-26 14:18:38.372 | DEBUG    | __main__:trials:24 - Trial = 27201/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.373 | DEBUG    | __main__:trials:29 - Trial = 27201/30000 | Total reward = 42.15
2022-01-26 14:18:38.377 | DEBUG    | __main__:trials:24 - Trial = 27202/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.378 | DEBUG    | __main__:trials:29 - Trial = 27202/30000 | Total reward = 56.01
2022-01-26 14:18:38.381 | DEBUG    | __main__:trials:24 - Trial = 27203/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.382 | DEBUG    | __main__:trials:29 - Trial = 27203/30000 | Total reward = 42.22
2022-01-26 14:18:38.385 | DEBUG    | __main__:trials:24 - Trial = 27204/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.386 | DEBUG    | __main__:trials:29 - Trial = 27204/30000 | Total reward = 40.07
2022-01-26 14:18:38.389 | DEBUG    | __main__:trials:24 - Trial = 27205/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.390 | DEBUG    | __main__:trials:29 - Trial = 27205/30000 | Total reward = 34.46
2022-01-26 14:18:38.393 | DEBUG    | __main__:trials:24 - Trial = 27206/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.793 | DEBUG    | __main__:trials:29 - Trial = 27206/30000 | Total reward = 33.90
2022-01-26 14:18:38.798 | DEBUG    | __main__:trials:24 - Trial = 27207/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.800 | DEBUG    | __main__:trials:29 - Trial = 27207/30000 | Total reward = 34.10
2022-01-26 14:18:38.804 | DEBUG    | __main__:trials:24 - Trial = 27208/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.805 | DEBUG    | __main__:trials:29 - Trial = 27208/30000 | Total reward = 48.96
2022-01-26 14:18:38.809 | DEBUG    | __main__:trials:24 - Trial = 27209/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.811 | DEBUG    | __main__:trials:29 - Trial = 27209/30000 | Total reward = 37.86
2022-01-26 14:18:38.814 | DEBUG    | __main__:trials:24 - Trial = 27210/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.816 | DEBUG    | __main__:trials:29 - Trial = 27210/30000 | Total reward = 42.15
2022-01-26 14:18:38.819 | DEBUG    | __main__:trials:24 - Trial = 27211/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.820 | DEBUG    | __main__:trials:29 - Trial = 27211/30000 | Total reward = 45.15
2022-01-26 14:18:38.824 | DEBUG    | __main__:trials:24 - Trial = 27212/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.826 | DEBUG    | __main__:trials:29 - Trial = 27212/30000 | Total reward = 35.09
2022-01-26 14:18:38.829 | DEBUG    | __main__:trials:24 - Trial = 27213/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.831 | DEBUG    | __main__:trials:29 - Trial = 27213/30000 | Total reward = 45.28
2022-01-26 14:18:38.834 | DEBUG    | __main__:trials:24 - Trial = 27214/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.835 | DEBUG    | __main__:trials:29 - Trial = 27214/30000 | Total reward = 21.00
2022-01-26 14:18:38.838 | DEBUG    | __main__:trials:24 - Trial = 27215/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.840 | DEBUG    | __main__:trials:29 - Trial = 27215/30000 | Total reward = 25.92
2022-01-26 14:18:38.844 | DEBUG    | __main__:trials:24 - Trial = 27216/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.844 | DEBUG    | __main__:trials:29 - Trial = 27216/30000 | Total reward = 42.15
2022-01-26 14:18:38.848 | DEBUG    | __main__:trials:24 - Trial = 27217/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.850 | DEBUG    | __main__:trials:29 - Trial = 27217/30000 | Total reward = 47.45
2022-01-26 14:18:38.854 | DEBUG    | __main__:trials:24 - Trial = 27218/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.854 | DEBUG    | __main__:trials:29 - Trial = 27218/30000 | Total reward = 40.41
2022-01-26 14:18:38.859 | DEBUG    | __main__:trials:24 - Trial = 27219/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.860 | DEBUG    | __main__:trials:29 - Trial = 27219/30000 | Total reward = 35.42
2022-01-26 14:18:38.864 | DEBUG    | __main__:trials:24 - Trial = 27220/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.865 | DEBUG    | __main__:trials:29 - Trial = 27220/30000 | Total reward = 41.28
2022-01-26 14:18:38.869 | DEBUG    | __main__:trials:24 - Trial = 27221/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.870 | DEBUG    | __main__:trials:29 - Trial = 27221/30000 | Total reward = 52.33
2022-01-26 14:18:38.874 | DEBUG    | __main__:trials:24 - Trial = 27222/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.875 | DEBUG    | __main__:trials:29 - Trial = 27222/30000 | Total reward = 37.88
2022-01-26 14:18:38.879 | DEBUG    | __main__:trials:24 - Trial = 27223/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.881 | DEBUG    | __main__:trials:29 - Trial = 27223/30000 | Total reward = 42.56
2022-01-26 14:18:38.884 | DEBUG    | __main__:trials:24 - Trial = 27224/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.885 | DEBUG    | __main__:trials:29 - Trial = 27224/30000 | Total reward = 29.86
2022-01-26 14:18:38.888 | DEBUG    | __main__:trials:24 - Trial = 27225/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.890 | DEBUG    | __main__:trials:29 - Trial = 27225/30000 | Total reward = 38.29
2022-01-26 14:18:38.893 | DEBUG    | __main__:trials:24 - Trial = 27226/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.894 | DEBUG    | __main__:trials:29 - Trial = 27226/30000 | Total reward = 32.05
2022-01-26 14:18:38.897 | DEBUG    | __main__:trials:24 - Trial = 27227/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.899 | DEBUG    | __main__:trials:29 - Trial = 27227/30000 | Total reward = 45.87
2022-01-26 14:18:38.903 | DEBUG    | __main__:trials:24 - Trial = 27228/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.904 | DEBUG    | __main__:trials:29 - Trial = 27228/30000 | Total reward = 35.77
2022-01-26 14:18:38.907 | DEBUG    | __main__:trials:24 - Trial = 27229/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.909 | DEBUG    | __main__:trials:29 - Trial = 27229/30000 | Total reward = 40.23
2022-01-26 14:18:38.912 | DEBUG    | __main__:trials:24 - Trial = 27230/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.913 | DEBUG    | __main__:trials:29 - Trial = 27230/30000 | Total reward = 32.86
2022-01-26 14:18:38.916 | DEBUG    | __main__:trials:24 - Trial = 27231/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.918 | DEBUG    | __main__:trials:29 - Trial = 27231/30000 | Total reward = 40.43
2022-01-26 14:18:38.922 | DEBUG    | __main__:trials:24 - Trial = 27232/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.923 | DEBUG    | __main__:trials:29 - Trial = 27232/30000 | Total reward = 24.42
2022-01-26 14:18:38.927 | DEBUG    | __main__:trials:24 - Trial = 27233/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.928 | DEBUG    | __main__:trials:29 - Trial = 27233/30000 | Total reward = 22.89
2022-01-26 14:18:38.931 | DEBUG    | __main__:trials:24 - Trial = 27234/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.933 | DEBUG    | __main__:trials:29 - Trial = 27234/30000 | Total reward = 35.79
2022-01-26 14:18:38.936 | DEBUG    | __main__:trials:24 - Trial = 27235/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.938 | DEBUG    | __main__:trials:29 - Trial = 27235/30000 | Total reward = 44.21
2022-01-26 14:18:38.942 | DEBUG    | __main__:trials:24 - Trial = 27236/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.943 | DEBUG    | __main__:trials:29 - Trial = 27236/30000 | Total reward = 41.74
2022-01-26 14:18:38.946 | DEBUG    | __main__:trials:24 - Trial = 27237/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.948 | DEBUG    | __main__:trials:29 - Trial = 27237/30000 | Total reward = 43.98
2022-01-26 14:18:38.951 | DEBUG    | __main__:trials:24 - Trial = 27238/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.952 | DEBUG    | __main__:trials:29 - Trial = 27238/30000 | Total reward = 47.89
2022-01-26 14:18:38.955 | DEBUG    | __main__:trials:24 - Trial = 27239/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.957 | DEBUG    | __main__:trials:29 - Trial = 27239/30000 | Total reward = 34.06
2022-01-26 14:18:38.960 | DEBUG    | __main__:trials:24 - Trial = 27240/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.961 | DEBUG    | __main__:trials:29 - Trial = 27240/30000 | Total reward = 43.57
2022-01-26 14:18:38.964 | DEBUG    | __main__:trials:24 - Trial = 27241/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.966 | DEBUG    | __main__:trials:29 - Trial = 27241/30000 | Total reward = 35.32
2022-01-26 14:18:38.968 | DEBUG    | __main__:trials:26 - Trial = 27242/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.968 | DEBUG    | __main__:trials:29 - Trial = 27242/30000 | Total reward = 15.21
2022-01-26 14:18:38.972 | DEBUG    | __main__:trials:24 - Trial = 27243/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.974 | DEBUG    | __main__:trials:29 - Trial = 27243/30000 | Total reward = 46.53
2022-01-26 14:18:38.976 | DEBUG    | __main__:trials:24 - Trial = 27244/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.978 | DEBUG    | __main__:trials:29 - Trial = 27244/30000 | Total reward = 37.35
2022-01-26 14:18:38.981 | DEBUG    | __main__:trials:26 - Trial = 27245/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:38.982 | DEBUG    | __main__:trials:29 - Trial = 27245/30000 | Total reward = 25.97
2022-01-26 14:18:38.986 | DEBUG    | __main__:trials:24 - Trial = 27246/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.987 | DEBUG    | __main__:trials:29 - Trial = 27246/30000 | Total reward = 41.81
2022-01-26 14:18:38.991 | DEBUG    | __main__:trials:24 - Trial = 27247/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.992 | DEBUG    | __main__:trials:29 - Trial = 27247/30000 | Total reward = 36.35
2022-01-26 14:18:38.996 | DEBUG    | __main__:trials:24 - Trial = 27248/30000 | Max number of steps (20) reached
2022-01-26 14:18:38.998 | DEBUG    | __main__:trials:29 - Trial = 27248/30000 | Total reward = 51.06
2022-01-26 14:18:39.002 | DEBUG    | __main__:trials:24 - Trial = 27249/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.003 | DEBUG    | __main__:trials:29 - Trial = 27249/30000 | Total reward = 33.31
2022-01-26 14:18:39.007 | DEBUG    | __main__:trials:24 - Trial = 27250/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.008 | DEBUG    | __main__:trials:29 - Trial = 27250/30000 | Total reward = 27.76
2022-01-26 14:18:39.011 | DEBUG    | __main__:trials:24 - Trial = 27251/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.013 | DEBUG    | __main__:trials:29 - Trial = 27251/30000 | Total reward = 38.15
2022-01-26 14:18:39.017 | DEBUG    | __main__:trials:24 - Trial = 27252/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.018 | DEBUG    | __main__:trials:29 - Trial = 27252/30000 | Total reward = 35.13
2022-01-26 14:18:39.021 | DEBUG    | __main__:trials:24 - Trial = 27253/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.022 | DEBUG    | __main__:trials:29 - Trial = 27253/30000 | Total reward = 33.75
2022-01-26 14:18:39.027 | DEBUG    | __main__:trials:24 - Trial = 27254/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.028 | DEBUG    | __main__:trials:29 - Trial = 27254/30000 | Total reward = 33.46
2022-01-26 14:18:39.032 | DEBUG    | __main__:trials:24 - Trial = 27255/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.033 | DEBUG    | __main__:trials:29 - Trial = 27255/30000 | Total reward = 53.27
2022-01-26 14:18:39.036 | DEBUG    | __main__:trials:24 - Trial = 27256/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.038 | DEBUG    | __main__:trials:29 - Trial = 27256/30000 | Total reward = 34.89
2022-01-26 14:18:39.042 | DEBUG    | __main__:trials:24 - Trial = 27257/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.042 | DEBUG    | __main__:trials:29 - Trial = 27257/30000 | Total reward = 32.81
2022-01-26 14:18:39.046 | DEBUG    | __main__:trials:24 - Trial = 27258/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.048 | DEBUG    | __main__:trials:29 - Trial = 27258/30000 | Total reward = 36.15
2022-01-26 14:18:39.051 | DEBUG    | __main__:trials:24 - Trial = 27259/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.052 | DEBUG    | __main__:trials:29 - Trial = 27259/30000 | Total reward = 14.93
2022-01-26 14:18:39.055 | DEBUG    | __main__:trials:24 - Trial = 27260/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.057 | DEBUG    | __main__:trials:29 - Trial = 27260/30000 | Total reward = 42.22
2022-01-26 14:18:39.060 | DEBUG    | __main__:trials:24 - Trial = 27261/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.062 | DEBUG    | __main__:trials:29 - Trial = 27261/30000 | Total reward = 36.73
2022-01-26 14:18:39.065 | DEBUG    | __main__:trials:24 - Trial = 27262/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.067 | DEBUG    | __main__:trials:29 - Trial = 27262/30000 | Total reward = 42.15
2022-01-26 14:18:39.070 | DEBUG    | __main__:trials:24 - Trial = 27263/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.072 | DEBUG    | __main__:trials:29 - Trial = 27263/30000 | Total reward = 47.17
2022-01-26 14:18:39.074 | DEBUG    | __main__:trials:26 - Trial = 27264/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.076 | DEBUG    | __main__:trials:29 - Trial = 27264/30000 | Total reward = 16.48
2022-01-26 14:18:39.079 | DEBUG    | __main__:trials:26 - Trial = 27265/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.080 | DEBUG    | __main__:trials:29 - Trial = 27265/30000 | Total reward = 16.81
2022-01-26 14:18:39.083 | DEBUG    | __main__:trials:26 - Trial = 27266/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.085 | DEBUG    | __main__:trials:29 - Trial = 27266/30000 | Total reward = 28.64
2022-01-26 14:18:39.086 | DEBUG    | __main__:trials:26 - Trial = 27267/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.088 | DEBUG    | __main__:trials:29 - Trial = 27267/30000 | Total reward = 10.87
2022-01-26 14:18:39.091 | DEBUG    | __main__:trials:26 - Trial = 27268/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.092 | DEBUG    | __main__:trials:29 - Trial = 27268/30000 | Total reward = 14.23
2022-01-26 14:18:39.096 | DEBUG    | __main__:trials:24 - Trial = 27269/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.097 | DEBUG    | __main__:trials:29 - Trial = 27269/30000 | Total reward = 36.65
2022-01-26 14:18:39.101 | DEBUG    | __main__:trials:24 - Trial = 27270/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.102 | DEBUG    | __main__:trials:29 - Trial = 27270/30000 | Total reward = 37.09
2022-01-26 14:18:39.106 | DEBUG    | __main__:trials:24 - Trial = 27271/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.107 | DEBUG    | __main__:trials:29 - Trial = 27271/30000 | Total reward = 35.05
2022-01-26 14:18:39.110 | DEBUG    | __main__:trials:26 - Trial = 27272/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.112 | DEBUG    | __main__:trials:29 - Trial = 27272/30000 | Total reward = 20.96
2022-01-26 14:18:39.116 | DEBUG    | __main__:trials:24 - Trial = 27273/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.117 | DEBUG    | __main__:trials:29 - Trial = 27273/30000 | Total reward = 55.13
2022-01-26 14:18:39.119 | DEBUG    | __main__:trials:26 - Trial = 27274/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.121 | DEBUG    | __main__:trials:29 - Trial = 27274/30000 | Total reward = 12.68
2022-01-26 14:18:39.123 | DEBUG    | __main__:trials:26 - Trial = 27275/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.124 | DEBUG    | __main__:trials:29 - Trial = 27275/30000 | Total reward = 9.84
2022-01-26 14:18:39.128 | DEBUG    | __main__:trials:24 - Trial = 27276/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.130 | DEBUG    | __main__:trials:29 - Trial = 27276/30000 | Total reward = 43.10
2022-01-26 14:18:39.134 | DEBUG    | __main__:trials:24 - Trial = 27277/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.135 | DEBUG    | __main__:trials:29 - Trial = 27277/30000 | Total reward = 24.82
2022-01-26 14:18:39.138 | DEBUG    | __main__:trials:24 - Trial = 27278/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.140 | DEBUG    | __main__:trials:29 - Trial = 27278/30000 | Total reward = 39.74
2022-01-26 14:18:39.143 | DEBUG    | __main__:trials:24 - Trial = 27279/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.145 | DEBUG    | __main__:trials:29 - Trial = 27279/30000 | Total reward = 29.30
2022-01-26 14:18:39.148 | DEBUG    | __main__:trials:24 - Trial = 27280/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.150 | DEBUG    | __main__:trials:29 - Trial = 27280/30000 | Total reward = 33.51
2022-01-26 14:18:39.153 | DEBUG    | __main__:trials:26 - Trial = 27281/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.155 | DEBUG    | __main__:trials:29 - Trial = 27281/30000 | Total reward = 16.88
2022-01-26 14:18:39.157 | DEBUG    | __main__:trials:26 - Trial = 27282/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.158 | DEBUG    | __main__:trials:29 - Trial = 27282/30000 | Total reward = 16.88
2022-01-26 14:18:39.160 | DEBUG    | __main__:trials:26 - Trial = 27283/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.161 | DEBUG    | __main__:trials:29 - Trial = 27283/30000 | Total reward = 14.56
2022-01-26 14:18:39.163 | DEBUG    | __main__:trials:26 - Trial = 27284/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.164 | DEBUG    | __main__:trials:29 - Trial = 27284/30000 | Total reward = 9.93
2022-01-26 14:18:39.167 | DEBUG    | __main__:trials:26 - Trial = 27285/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.167 | DEBUG    | __main__:trials:29 - Trial = 27285/30000 | Total reward = 14.62
2022-01-26 14:18:39.169 | DEBUG    | __main__:trials:26 - Trial = 27286/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.171 | DEBUG    | __main__:trials:29 - Trial = 27286/30000 | Total reward = 9.93
2022-01-26 14:18:39.174 | DEBUG    | __main__:trials:24 - Trial = 27287/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.176 | DEBUG    | __main__:trials:29 - Trial = 27287/30000 | Total reward = 29.47
2022-01-26 14:18:39.178 | DEBUG    | __main__:trials:26 - Trial = 27288/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.178 | DEBUG    | __main__:trials:29 - Trial = 27288/30000 | Total reward = 9.93
2022-01-26 14:18:39.182 | DEBUG    | __main__:trials:24 - Trial = 27289/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.184 | DEBUG    | __main__:trials:29 - Trial = 27289/30000 | Total reward = 25.31
2022-01-26 14:18:39.186 | DEBUG    | __main__:trials:24 - Trial = 27290/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.188 | DEBUG    | __main__:trials:29 - Trial = 27290/30000 | Total reward = 50.84
2022-01-26 14:18:39.191 | DEBUG    | __main__:trials:24 - Trial = 27291/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.193 | DEBUG    | __main__:trials:29 - Trial = 27291/30000 | Total reward = 32.84
2022-01-26 14:18:39.196 | DEBUG    | __main__:trials:24 - Trial = 27292/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.197 | DEBUG    | __main__:trials:29 - Trial = 27292/30000 | Total reward = 23.10
2022-01-26 14:18:39.200 | DEBUG    | __main__:trials:24 - Trial = 27293/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.201 | DEBUG    | __main__:trials:29 - Trial = 27293/30000 | Total reward = 26.29
2022-01-26 14:18:39.204 | DEBUG    | __main__:trials:24 - Trial = 27294/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.205 | DEBUG    | __main__:trials:29 - Trial = 27294/30000 | Total reward = 32.91
2022-01-26 14:18:39.208 | DEBUG    | __main__:trials:24 - Trial = 27295/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.211 | DEBUG    | __main__:trials:29 - Trial = 27295/30000 | Total reward = 27.48
2022-01-26 14:18:39.213 | DEBUG    | __main__:trials:24 - Trial = 27296/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.214 | DEBUG    | __main__:trials:29 - Trial = 27296/30000 | Total reward = 26.23
2022-01-26 14:18:39.218 | DEBUG    | __main__:trials:24 - Trial = 27297/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.219 | DEBUG    | __main__:trials:29 - Trial = 27297/30000 | Total reward = 32.86
2022-01-26 14:18:39.221 | DEBUG    | __main__:trials:26 - Trial = 27298/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.223 | DEBUG    | __main__:trials:29 - Trial = 27298/30000 | Total reward = 15.08
2022-01-26 14:18:39.225 | DEBUG    | __main__:trials:26 - Trial = 27299/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.226 | DEBUG    | __main__:trials:29 - Trial = 27299/30000 | Total reward = 11.82
2022-01-26 14:18:39.229 | DEBUG    | __main__:trials:24 - Trial = 27300/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.231 | DEBUG    | __main__:trials:29 - Trial = 27300/30000 | Total reward = 31.72
2022-01-26 14:18:39.233 | DEBUG    | __main__:trials:26 - Trial = 27301/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.235 | DEBUG    | __main__:trials:29 - Trial = 27301/30000 | Total reward = 19.44
2022-01-26 14:18:39.238 | DEBUG    | __main__:trials:26 - Trial = 27302/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.239 | DEBUG    | __main__:trials:29 - Trial = 27302/30000 | Total reward = 9.01
2022-01-26 14:18:39.243 | DEBUG    | __main__:trials:24 - Trial = 27303/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.245 | DEBUG    | __main__:trials:29 - Trial = 27303/30000 | Total reward = 20.30
2022-01-26 14:18:39.248 | DEBUG    | __main__:trials:24 - Trial = 27304/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.250 | DEBUG    | __main__:trials:29 - Trial = 27304/30000 | Total reward = 18.90
2022-01-26 14:18:39.253 | DEBUG    | __main__:trials:24 - Trial = 27305/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.255 | DEBUG    | __main__:trials:29 - Trial = 27305/30000 | Total reward = 30.08
2022-01-26 14:18:39.259 | DEBUG    | __main__:trials:24 - Trial = 27306/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.259 | DEBUG    | __main__:trials:29 - Trial = 27306/30000 | Total reward = 26.39
2022-01-26 14:18:39.264 | DEBUG    | __main__:trials:24 - Trial = 27307/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.265 | DEBUG    | __main__:trials:29 - Trial = 27307/30000 | Total reward = 24.85
2022-01-26 14:18:39.268 | DEBUG    | __main__:trials:24 - Trial = 27308/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.270 | DEBUG    | __main__:trials:29 - Trial = 27308/30000 | Total reward = 37.89
2022-01-26 14:18:39.274 | DEBUG    | __main__:trials:24 - Trial = 27309/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.274 | DEBUG    | __main__:trials:29 - Trial = 27309/30000 | Total reward = 39.93
2022-01-26 14:18:39.278 | DEBUG    | __main__:trials:26 - Trial = 27310/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.279 | DEBUG    | __main__:trials:29 - Trial = 27310/30000 | Total reward = 15.43
2022-01-26 14:18:39.283 | DEBUG    | __main__:trials:24 - Trial = 27311/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.284 | DEBUG    | __main__:trials:29 - Trial = 27311/30000 | Total reward = 39.66
2022-01-26 14:18:39.288 | DEBUG    | __main__:trials:24 - Trial = 27312/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.290 | DEBUG    | __main__:trials:29 - Trial = 27312/30000 | Total reward = 36.15
2022-01-26 14:18:39.293 | DEBUG    | __main__:trials:24 - Trial = 27313/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.295 | DEBUG    | __main__:trials:29 - Trial = 27313/30000 | Total reward = 42.67
2022-01-26 14:18:39.299 | DEBUG    | __main__:trials:24 - Trial = 27314/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.300 | DEBUG    | __main__:trials:29 - Trial = 27314/30000 | Total reward = 34.33
2022-01-26 14:18:39.304 | DEBUG    | __main__:trials:24 - Trial = 27315/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.306 | DEBUG    | __main__:trials:29 - Trial = 27315/30000 | Total reward = 49.64
2022-01-26 14:18:39.311 | DEBUG    | __main__:trials:24 - Trial = 27316/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.311 | DEBUG    | __main__:trials:29 - Trial = 27316/30000 | Total reward = 37.81
2022-01-26 14:18:39.317 | DEBUG    | __main__:trials:24 - Trial = 27317/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.318 | DEBUG    | __main__:trials:29 - Trial = 27317/30000 | Total reward = 37.34
2022-01-26 14:18:39.321 | DEBUG    | __main__:trials:24 - Trial = 27318/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.324 | DEBUG    | __main__:trials:29 - Trial = 27318/30000 | Total reward = 30.43
2022-01-26 14:18:39.328 | DEBUG    | __main__:trials:24 - Trial = 27319/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.329 | DEBUG    | __main__:trials:29 - Trial = 27319/30000 | Total reward = 34.87
2022-01-26 14:18:39.333 | DEBUG    | __main__:trials:24 - Trial = 27320/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.335 | DEBUG    | __main__:trials:29 - Trial = 27320/30000 | Total reward = 35.86
2022-01-26 14:18:39.339 | DEBUG    | __main__:trials:24 - Trial = 27321/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.340 | DEBUG    | __main__:trials:29 - Trial = 27321/30000 | Total reward = 47.00
2022-01-26 14:18:39.344 | DEBUG    | __main__:trials:24 - Trial = 27322/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.345 | DEBUG    | __main__:trials:29 - Trial = 27322/30000 | Total reward = 48.07
2022-01-26 14:18:39.349 | DEBUG    | __main__:trials:26 - Trial = 27323/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.350 | DEBUG    | __main__:trials:29 - Trial = 27323/30000 | Total reward = 26.62
2022-01-26 14:18:39.354 | DEBUG    | __main__:trials:24 - Trial = 27324/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.356 | DEBUG    | __main__:trials:29 - Trial = 27324/30000 | Total reward = 45.87
2022-01-26 14:18:39.359 | DEBUG    | __main__:trials:24 - Trial = 27325/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.361 | DEBUG    | __main__:trials:29 - Trial = 27325/30000 | Total reward = 35.56
2022-01-26 14:18:39.364 | DEBUG    | __main__:trials:24 - Trial = 27326/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.366 | DEBUG    | __main__:trials:29 - Trial = 27326/30000 | Total reward = 34.90
2022-01-26 14:18:39.369 | DEBUG    | __main__:trials:24 - Trial = 27327/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.370 | DEBUG    | __main__:trials:29 - Trial = 27327/30000 | Total reward = 30.12
2022-01-26 14:18:39.374 | DEBUG    | __main__:trials:24 - Trial = 27328/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.376 | DEBUG    | __main__:trials:29 - Trial = 27328/30000 | Total reward = 35.93
2022-01-26 14:18:39.379 | DEBUG    | __main__:trials:24 - Trial = 27329/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.381 | DEBUG    | __main__:trials:29 - Trial = 27329/30000 | Total reward = 36.31
2022-01-26 14:18:39.383 | DEBUG    | __main__:trials:24 - Trial = 27330/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.385 | DEBUG    | __main__:trials:29 - Trial = 27330/30000 | Total reward = 36.49
2022-01-26 14:18:39.388 | DEBUG    | __main__:trials:24 - Trial = 27331/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.390 | DEBUG    | __main__:trials:29 - Trial = 27331/30000 | Total reward = 37.54
2022-01-26 14:18:39.394 | DEBUG    | __main__:trials:24 - Trial = 27332/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.395 | DEBUG    | __main__:trials:29 - Trial = 27332/30000 | Total reward = 36.76
2022-01-26 14:18:39.399 | DEBUG    | __main__:trials:24 - Trial = 27333/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.400 | DEBUG    | __main__:trials:29 - Trial = 27333/30000 | Total reward = 47.42
2022-01-26 14:18:39.404 | DEBUG    | __main__:trials:24 - Trial = 27334/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.406 | DEBUG    | __main__:trials:29 - Trial = 27334/30000 | Total reward = 40.98
2022-01-26 14:18:39.409 | DEBUG    | __main__:trials:26 - Trial = 27335/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.409 | DEBUG    | __main__:trials:29 - Trial = 27335/30000 | Total reward = 15.96
2022-01-26 14:18:39.413 | DEBUG    | __main__:trials:26 - Trial = 27336/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.414 | DEBUG    | __main__:trials:29 - Trial = 27336/30000 | Total reward = 16.03
2022-01-26 14:18:39.418 | DEBUG    | __main__:trials:26 - Trial = 27337/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.419 | DEBUG    | __main__:trials:29 - Trial = 27337/30000 | Total reward = 30.11
2022-01-26 14:18:39.423 | DEBUG    | __main__:trials:24 - Trial = 27338/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.424 | DEBUG    | __main__:trials:29 - Trial = 27338/30000 | Total reward = 25.67
2022-01-26 14:18:39.428 | DEBUG    | __main__:trials:24 - Trial = 27339/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.430 | DEBUG    | __main__:trials:29 - Trial = 27339/30000 | Total reward = 36.22
2022-01-26 14:18:39.433 | DEBUG    | __main__:trials:24 - Trial = 27340/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.435 | DEBUG    | __main__:trials:29 - Trial = 27340/30000 | Total reward = 29.11
2022-01-26 14:18:39.438 | DEBUG    | __main__:trials:24 - Trial = 27341/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.440 | DEBUG    | __main__:trials:29 - Trial = 27341/30000 | Total reward = 27.21
2022-01-26 14:18:39.442 | DEBUG    | __main__:trials:26 - Trial = 27342/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.443 | DEBUG    | __main__:trials:29 - Trial = 27342/30000 | Total reward = 11.11
2022-01-26 14:18:39.447 | DEBUG    | __main__:trials:26 - Trial = 27343/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.449 | DEBUG    | __main__:trials:29 - Trial = 27343/30000 | Total reward = 25.74
2022-01-26 14:18:39.452 | DEBUG    | __main__:trials:24 - Trial = 27344/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.454 | DEBUG    | __main__:trials:29 - Trial = 27344/30000 | Total reward = 20.96
2022-01-26 14:18:39.457 | DEBUG    | __main__:trials:24 - Trial = 27345/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.459 | DEBUG    | __main__:trials:29 - Trial = 27345/30000 | Total reward = 47.65
2022-01-26 14:18:39.464 | DEBUG    | __main__:trials:24 - Trial = 27346/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.465 | DEBUG    | __main__:trials:29 - Trial = 27346/30000 | Total reward = 47.74
2022-01-26 14:18:39.469 | DEBUG    | __main__:trials:24 - Trial = 27347/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.470 | DEBUG    | __main__:trials:29 - Trial = 27347/30000 | Total reward = 28.21
2022-01-26 14:18:39.473 | DEBUG    | __main__:trials:24 - Trial = 27348/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.475 | DEBUG    | __main__:trials:29 - Trial = 27348/30000 | Total reward = 36.10
2022-01-26 14:18:39.478 | DEBUG    | __main__:trials:26 - Trial = 27349/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.479 | DEBUG    | __main__:trials:29 - Trial = 27349/30000 | Total reward = 20.17
2022-01-26 14:18:39.483 | DEBUG    | __main__:trials:24 - Trial = 27350/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.485 | DEBUG    | __main__:trials:29 - Trial = 27350/30000 | Total reward = 28.35
2022-01-26 14:18:39.487 | DEBUG    | __main__:trials:26 - Trial = 27351/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.488 | DEBUG    | __main__:trials:29 - Trial = 27351/30000 | Total reward = 14.08
2022-01-26 14:18:39.492 | DEBUG    | __main__:trials:24 - Trial = 27352/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.493 | DEBUG    | __main__:trials:29 - Trial = 27352/30000 | Total reward = 40.39
2022-01-26 14:18:39.497 | DEBUG    | __main__:trials:24 - Trial = 27353/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.498 | DEBUG    | __main__:trials:29 - Trial = 27353/30000 | Total reward = 37.47
2022-01-26 14:18:39.502 | DEBUG    | __main__:trials:24 - Trial = 27354/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.504 | DEBUG    | __main__:trials:29 - Trial = 27354/30000 | Total reward = 32.68
2022-01-26 14:18:39.506 | DEBUG    | __main__:trials:24 - Trial = 27355/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.508 | DEBUG    | __main__:trials:29 - Trial = 27355/30000 | Total reward = 46.50
2022-01-26 14:18:39.512 | DEBUG    | __main__:trials:24 - Trial = 27356/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.514 | DEBUG    | __main__:trials:29 - Trial = 27356/30000 | Total reward = 36.75
2022-01-26 14:18:39.517 | DEBUG    | __main__:trials:24 - Trial = 27357/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.518 | DEBUG    | __main__:trials:29 - Trial = 27357/30000 | Total reward = 40.14
2022-01-26 14:18:39.521 | DEBUG    | __main__:trials:24 - Trial = 27358/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.522 | DEBUG    | __main__:trials:29 - Trial = 27358/30000 | Total reward = 27.64
2022-01-26 14:18:39.526 | DEBUG    | __main__:trials:24 - Trial = 27359/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.528 | DEBUG    | __main__:trials:29 - Trial = 27359/30000 | Total reward = 42.50
2022-01-26 14:18:39.532 | DEBUG    | __main__:trials:24 - Trial = 27360/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.533 | DEBUG    | __main__:trials:29 - Trial = 27360/30000 | Total reward = 38.03
2022-01-26 14:18:39.537 | DEBUG    | __main__:trials:24 - Trial = 27361/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.538 | DEBUG    | __main__:trials:29 - Trial = 27361/30000 | Total reward = 25.31
2022-01-26 14:18:39.542 | DEBUG    | __main__:trials:24 - Trial = 27362/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.543 | DEBUG    | __main__:trials:29 - Trial = 27362/30000 | Total reward = 26.37
2022-01-26 14:18:39.547 | DEBUG    | __main__:trials:24 - Trial = 27363/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.549 | DEBUG    | __main__:trials:29 - Trial = 27363/30000 | Total reward = 23.60
2022-01-26 14:18:39.552 | DEBUG    | __main__:trials:26 - Trial = 27364/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.552 | DEBUG    | __main__:trials:29 - Trial = 27364/30000 | Total reward = 16.92
2022-01-26 14:18:39.555 | DEBUG    | __main__:trials:26 - Trial = 27365/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.557 | DEBUG    | __main__:trials:29 - Trial = 27365/30000 | Total reward = 7.07
2022-01-26 14:18:39.559 | DEBUG    | __main__:trials:26 - Trial = 27366/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.561 | DEBUG    | __main__:trials:29 - Trial = 27366/30000 | Total reward = 11.01
2022-01-26 14:18:39.564 | DEBUG    | __main__:trials:24 - Trial = 27367/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.565 | DEBUG    | __main__:trials:29 - Trial = 27367/30000 | Total reward = 35.36
2022-01-26 14:18:39.569 | DEBUG    | __main__:trials:26 - Trial = 27368/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.570 | DEBUG    | __main__:trials:29 - Trial = 27368/30000 | Total reward = 14.47
2022-01-26 14:18:39.574 | DEBUG    | __main__:trials:24 - Trial = 27369/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.575 | DEBUG    | __main__:trials:29 - Trial = 27369/30000 | Total reward = 37.71
2022-01-26 14:18:39.578 | DEBUG    | __main__:trials:26 - Trial = 27370/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.580 | DEBUG    | __main__:trials:29 - Trial = 27370/30000 | Total reward = 14.30
2022-01-26 14:18:39.584 | DEBUG    | __main__:trials:24 - Trial = 27371/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.585 | DEBUG    | __main__:trials:29 - Trial = 27371/30000 | Total reward = 30.39
2022-01-26 14:18:39.588 | DEBUG    | __main__:trials:26 - Trial = 27372/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.590 | DEBUG    | __main__:trials:29 - Trial = 27372/30000 | Total reward = 12.68
2022-01-26 14:18:39.593 | DEBUG    | __main__:trials:26 - Trial = 27373/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.595 | DEBUG    | __main__:trials:29 - Trial = 27373/30000 | Total reward = 16.80
2022-01-26 14:18:39.597 | DEBUG    | __main__:trials:26 - Trial = 27374/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.598 | DEBUG    | __main__:trials:29 - Trial = 27374/30000 | Total reward = 11.45
2022-01-26 14:18:39.602 | DEBUG    | __main__:trials:24 - Trial = 27375/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.603 | DEBUG    | __main__:trials:29 - Trial = 27375/30000 | Total reward = 36.00
2022-01-26 14:18:39.607 | DEBUG    | __main__:trials:24 - Trial = 27376/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.608 | DEBUG    | __main__:trials:29 - Trial = 27376/30000 | Total reward = 32.92
2022-01-26 14:18:39.611 | DEBUG    | __main__:trials:24 - Trial = 27377/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.613 | DEBUG    | __main__:trials:29 - Trial = 27377/30000 | Total reward = 40.49
2022-01-26 14:18:39.616 | DEBUG    | __main__:trials:24 - Trial = 27378/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.618 | DEBUG    | __main__:trials:29 - Trial = 27378/30000 | Total reward = 33.44
2022-01-26 14:18:39.622 | DEBUG    | __main__:trials:24 - Trial = 27379/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.623 | DEBUG    | __main__:trials:29 - Trial = 27379/30000 | Total reward = 28.42
2022-01-26 14:18:39.627 | DEBUG    | __main__:trials:24 - Trial = 27380/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.629 | DEBUG    | __main__:trials:29 - Trial = 27380/30000 | Total reward = 9.09
2022-01-26 14:18:39.631 | DEBUG    | __main__:trials:26 - Trial = 27381/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.633 | DEBUG    | __main__:trials:29 - Trial = 27381/30000 | Total reward = 19.21
2022-01-26 14:18:39.636 | DEBUG    | __main__:trials:24 - Trial = 27382/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.638 | DEBUG    | __main__:trials:29 - Trial = 27382/30000 | Total reward = 28.78
2022-01-26 14:18:39.642 | DEBUG    | __main__:trials:24 - Trial = 27383/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.643 | DEBUG    | __main__:trials:29 - Trial = 27383/30000 | Total reward = 40.34
2022-01-26 14:18:39.647 | DEBUG    | __main__:trials:26 - Trial = 27384/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.648 | DEBUG    | __main__:trials:29 - Trial = 27384/30000 | Total reward = 17.70
2022-01-26 14:18:39.651 | DEBUG    | __main__:trials:24 - Trial = 27385/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.653 | DEBUG    | __main__:trials:29 - Trial = 27385/30000 | Total reward = 40.70
2022-01-26 14:18:39.656 | DEBUG    | __main__:trials:24 - Trial = 27386/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.657 | DEBUG    | __main__:trials:29 - Trial = 27386/30000 | Total reward = 44.14
2022-01-26 14:18:39.662 | DEBUG    | __main__:trials:24 - Trial = 27387/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.663 | DEBUG    | __main__:trials:29 - Trial = 27387/30000 | Total reward = 41.61
2022-01-26 14:18:39.666 | DEBUG    | __main__:trials:26 - Trial = 27388/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.668 | DEBUG    | __main__:trials:29 - Trial = 27388/30000 | Total reward = 14.99
2022-01-26 14:18:39.671 | DEBUG    | __main__:trials:24 - Trial = 27389/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.672 | DEBUG    | __main__:trials:29 - Trial = 27389/30000 | Total reward = 24.10
2022-01-26 14:18:39.676 | DEBUG    | __main__:trials:24 - Trial = 27390/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.678 | DEBUG    | __main__:trials:29 - Trial = 27390/30000 | Total reward = 42.15
2022-01-26 14:18:39.681 | DEBUG    | __main__:trials:24 - Trial = 27391/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.683 | DEBUG    | __main__:trials:29 - Trial = 27391/30000 | Total reward = 33.21
2022-01-26 14:18:39.686 | DEBUG    | __main__:trials:26 - Trial = 27392/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.687 | DEBUG    | __main__:trials:29 - Trial = 27392/30000 | Total reward = 15.40
2022-01-26 14:18:39.691 | DEBUG    | __main__:trials:24 - Trial = 27393/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.692 | DEBUG    | __main__:trials:29 - Trial = 27393/30000 | Total reward = 25.94
2022-01-26 14:18:39.695 | DEBUG    | __main__:trials:26 - Trial = 27394/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.697 | DEBUG    | __main__:trials:29 - Trial = 27394/30000 | Total reward = 14.46
2022-01-26 14:18:39.700 | DEBUG    | __main__:trials:24 - Trial = 27395/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.702 | DEBUG    | __main__:trials:29 - Trial = 27395/30000 | Total reward = 31.37
2022-01-26 14:18:39.705 | DEBUG    | __main__:trials:24 - Trial = 27396/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.707 | DEBUG    | __main__:trials:29 - Trial = 27396/30000 | Total reward = 56.49
2022-01-26 14:18:39.711 | DEBUG    | __main__:trials:24 - Trial = 27397/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.712 | DEBUG    | __main__:trials:29 - Trial = 27397/30000 | Total reward = 26.34
2022-01-26 14:18:39.715 | DEBUG    | __main__:trials:26 - Trial = 27398/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.717 | DEBUG    | __main__:trials:29 - Trial = 27398/30000 | Total reward = 14.62
2022-01-26 14:18:39.720 | DEBUG    | __main__:trials:24 - Trial = 27399/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.722 | DEBUG    | __main__:trials:29 - Trial = 27399/30000 | Total reward = 29.78
2022-01-26 14:18:39.725 | DEBUG    | __main__:trials:26 - Trial = 27400/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.726 | DEBUG    | __main__:trials:29 - Trial = 27400/30000 | Total reward = 18.10
2022-01-26 14:18:39.728 | DEBUG    | __main__:trials:26 - Trial = 27401/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.729 | DEBUG    | __main__:trials:29 - Trial = 27401/30000 | Total reward = 7.84
2022-01-26 14:18:39.732 | DEBUG    | __main__:trials:24 - Trial = 27402/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.733 | DEBUG    | __main__:trials:29 - Trial = 27402/30000 | Total reward = 57.13
2022-01-26 14:18:39.736 | DEBUG    | __main__:trials:26 - Trial = 27403/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.738 | DEBUG    | __main__:trials:29 - Trial = 27403/30000 | Total reward = 8.98
2022-01-26 14:18:39.740 | DEBUG    | __main__:trials:26 - Trial = 27404/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.741 | DEBUG    | __main__:trials:29 - Trial = 27404/30000 | Total reward = 13.29
2022-01-26 14:18:39.744 | DEBUG    | __main__:trials:26 - Trial = 27405/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.744 | DEBUG    | __main__:trials:29 - Trial = 27405/30000 | Total reward = 10.01
2022-01-26 14:18:39.748 | DEBUG    | __main__:trials:24 - Trial = 27406/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.750 | DEBUG    | __main__:trials:29 - Trial = 27406/30000 | Total reward = 26.42
2022-01-26 14:18:39.753 | DEBUG    | __main__:trials:24 - Trial = 27407/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.753 | DEBUG    | __main__:trials:29 - Trial = 27407/30000 | Total reward = 42.87
2022-01-26 14:18:39.756 | DEBUG    | __main__:trials:26 - Trial = 27408/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.758 | DEBUG    | __main__:trials:29 - Trial = 27408/30000 | Total reward = 10.12
2022-01-26 14:18:39.761 | DEBUG    | __main__:trials:26 - Trial = 27409/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.762 | DEBUG    | __main__:trials:29 - Trial = 27409/30000 | Total reward = 22.35
2022-01-26 14:18:39.766 | DEBUG    | __main__:trials:24 - Trial = 27410/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.767 | DEBUG    | __main__:trials:29 - Trial = 27410/30000 | Total reward = 23.18
2022-01-26 14:18:39.770 | DEBUG    | __main__:trials:24 - Trial = 27411/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.772 | DEBUG    | __main__:trials:29 - Trial = 27411/30000 | Total reward = 33.51
2022-01-26 14:18:39.775 | DEBUG    | __main__:trials:26 - Trial = 27412/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.777 | DEBUG    | __main__:trials:29 - Trial = 27412/30000 | Total reward = 22.07
2022-01-26 14:18:39.780 | DEBUG    | __main__:trials:26 - Trial = 27413/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.781 | DEBUG    | __main__:trials:29 - Trial = 27413/30000 | Total reward = 21.87
2022-01-26 14:18:39.785 | DEBUG    | __main__:trials:24 - Trial = 27414/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.787 | DEBUG    | __main__:trials:29 - Trial = 27414/30000 | Total reward = 29.78
2022-01-26 14:18:39.790 | DEBUG    | __main__:trials:24 - Trial = 27415/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.791 | DEBUG    | __main__:trials:29 - Trial = 27415/30000 | Total reward = 42.15
2022-01-26 14:18:39.795 | DEBUG    | __main__:trials:24 - Trial = 27416/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.796 | DEBUG    | __main__:trials:29 - Trial = 27416/30000 | Total reward = 14.65
2022-01-26 14:18:39.800 | DEBUG    | __main__:trials:24 - Trial = 27417/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.802 | DEBUG    | __main__:trials:29 - Trial = 27417/30000 | Total reward = 55.55
2022-01-26 14:18:39.805 | DEBUG    | __main__:trials:26 - Trial = 27418/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.806 | DEBUG    | __main__:trials:29 - Trial = 27418/30000 | Total reward = 26.79
2022-01-26 14:18:39.809 | DEBUG    | __main__:trials:26 - Trial = 27419/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.810 | DEBUG    | __main__:trials:29 - Trial = 27419/30000 | Total reward = 13.29
2022-01-26 14:18:39.814 | DEBUG    | __main__:trials:24 - Trial = 27420/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.816 | DEBUG    | __main__:trials:29 - Trial = 27420/30000 | Total reward = 25.94
2022-01-26 14:18:39.820 | DEBUG    | __main__:trials:24 - Trial = 27421/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.821 | DEBUG    | __main__:trials:29 - Trial = 27421/30000 | Total reward = 50.68
2022-01-26 14:18:39.825 | DEBUG    | __main__:trials:24 - Trial = 27422/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.826 | DEBUG    | __main__:trials:29 - Trial = 27422/30000 | Total reward = 26.06
2022-01-26 14:18:39.829 | DEBUG    | __main__:trials:24 - Trial = 27423/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.830 | DEBUG    | __main__:trials:29 - Trial = 27423/30000 | Total reward = 50.61
2022-01-26 14:18:39.833 | DEBUG    | __main__:trials:24 - Trial = 27424/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.835 | DEBUG    | __main__:trials:29 - Trial = 27424/30000 | Total reward = 31.21
2022-01-26 14:18:39.838 | DEBUG    | __main__:trials:24 - Trial = 27425/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.840 | DEBUG    | __main__:trials:29 - Trial = 27425/30000 | Total reward = 27.54
2022-01-26 14:18:39.842 | DEBUG    | __main__:trials:26 - Trial = 27426/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.844 | DEBUG    | __main__:trials:29 - Trial = 27426/30000 | Total reward = 18.48
2022-01-26 14:18:39.848 | DEBUG    | __main__:trials:24 - Trial = 27427/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.849 | DEBUG    | __main__:trials:29 - Trial = 27427/30000 | Total reward = 30.99
2022-01-26 14:18:39.853 | DEBUG    | __main__:trials:24 - Trial = 27428/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.854 | DEBUG    | __main__:trials:29 - Trial = 27428/30000 | Total reward = 26.12
2022-01-26 14:18:39.858 | DEBUG    | __main__:trials:24 - Trial = 27429/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.859 | DEBUG    | __main__:trials:29 - Trial = 27429/30000 | Total reward = 28.59
2022-01-26 14:18:39.862 | DEBUG    | __main__:trials:26 - Trial = 27430/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.863 | DEBUG    | __main__:trials:29 - Trial = 27430/30000 | Total reward = 19.59
2022-01-26 14:18:39.867 | DEBUG    | __main__:trials:24 - Trial = 27431/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.869 | DEBUG    | __main__:trials:29 - Trial = 27431/30000 | Total reward = 49.10
2022-01-26 14:18:39.872 | DEBUG    | __main__:trials:24 - Trial = 27432/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.873 | DEBUG    | __main__:trials:29 - Trial = 27432/30000 | Total reward = 43.53
2022-01-26 14:18:39.876 | DEBUG    | __main__:trials:24 - Trial = 27433/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.877 | DEBUG    | __main__:trials:29 - Trial = 27433/30000 | Total reward = 27.64
2022-01-26 14:18:39.881 | DEBUG    | __main__:trials:24 - Trial = 27434/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.883 | DEBUG    | __main__:trials:29 - Trial = 27434/30000 | Total reward = 27.86
2022-01-26 14:18:39.886 | DEBUG    | __main__:trials:26 - Trial = 27435/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.888 | DEBUG    | __main__:trials:29 - Trial = 27435/30000 | Total reward = 29.57
2022-01-26 14:18:39.889 | DEBUG    | __main__:trials:26 - Trial = 27436/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.890 | DEBUG    | __main__:trials:29 - Trial = 27436/30000 | Total reward = 10.12
2022-01-26 14:18:39.893 | DEBUG    | __main__:trials:24 - Trial = 27437/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.894 | DEBUG    | __main__:trials:29 - Trial = 27437/30000 | Total reward = 33.43
2022-01-26 14:18:39.897 | DEBUG    | __main__:trials:24 - Trial = 27438/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.898 | DEBUG    | __main__:trials:29 - Trial = 27438/30000 | Total reward = 45.94
2022-01-26 14:18:39.901 | DEBUG    | __main__:trials:24 - Trial = 27439/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.903 | DEBUG    | __main__:trials:29 - Trial = 27439/30000 | Total reward = 24.46
2022-01-26 14:18:39.905 | DEBUG    | __main__:trials:24 - Trial = 27440/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.907 | DEBUG    | __main__:trials:29 - Trial = 27440/30000 | Total reward = 44.85
2022-01-26 14:18:39.910 | DEBUG    | __main__:trials:26 - Trial = 27441/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.911 | DEBUG    | __main__:trials:29 - Trial = 27441/30000 | Total reward = 7.12
2022-01-26 14:18:39.915 | DEBUG    | __main__:trials:24 - Trial = 27442/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.916 | DEBUG    | __main__:trials:29 - Trial = 27442/30000 | Total reward = 22.10
2022-01-26 14:18:39.920 | DEBUG    | __main__:trials:24 - Trial = 27443/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.921 | DEBUG    | __main__:trials:29 - Trial = 27443/30000 | Total reward = 41.37
2022-01-26 14:18:39.924 | DEBUG    | __main__:trials:24 - Trial = 27444/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.926 | DEBUG    | __main__:trials:29 - Trial = 27444/30000 | Total reward = 35.67
2022-01-26 14:18:39.930 | DEBUG    | __main__:trials:24 - Trial = 27445/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.931 | DEBUG    | __main__:trials:29 - Trial = 27445/30000 | Total reward = 31.72
2022-01-26 14:18:39.935 | DEBUG    | __main__:trials:24 - Trial = 27446/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.937 | DEBUG    | __main__:trials:29 - Trial = 27446/30000 | Total reward = 32.17
2022-01-26 14:18:39.940 | DEBUG    | __main__:trials:24 - Trial = 27447/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.942 | DEBUG    | __main__:trials:29 - Trial = 27447/30000 | Total reward = 37.67
2022-01-26 14:18:39.945 | DEBUG    | __main__:trials:24 - Trial = 27448/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.947 | DEBUG    | __main__:trials:29 - Trial = 27448/30000 | Total reward = 31.31
2022-01-26 14:18:39.950 | DEBUG    | __main__:trials:24 - Trial = 27449/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.952 | DEBUG    | __main__:trials:29 - Trial = 27449/30000 | Total reward = 33.36
2022-01-26 14:18:39.955 | DEBUG    | __main__:trials:24 - Trial = 27450/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.957 | DEBUG    | __main__:trials:29 - Trial = 27450/30000 | Total reward = 36.39
2022-01-26 14:18:39.960 | DEBUG    | __main__:trials:24 - Trial = 27451/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.962 | DEBUG    | __main__:trials:29 - Trial = 27451/30000 | Total reward = 26.42
2022-01-26 14:18:39.966 | DEBUG    | __main__:trials:24 - Trial = 27452/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.967 | DEBUG    | __main__:trials:29 - Trial = 27452/30000 | Total reward = 33.94
2022-01-26 14:18:39.970 | DEBUG    | __main__:trials:26 - Trial = 27453/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.972 | DEBUG    | __main__:trials:29 - Trial = 27453/30000 | Total reward = 17.22
2022-01-26 14:18:39.975 | DEBUG    | __main__:trials:24 - Trial = 27454/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.977 | DEBUG    | __main__:trials:29 - Trial = 27454/30000 | Total reward = 25.33
2022-01-26 14:18:39.980 | DEBUG    | __main__:trials:26 - Trial = 27455/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.980 | DEBUG    | __main__:trials:29 - Trial = 27455/30000 | Total reward = 16.37
2022-01-26 14:18:39.984 | DEBUG    | __main__:trials:24 - Trial = 27456/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.985 | DEBUG    | __main__:trials:29 - Trial = 27456/30000 | Total reward = 45.68
2022-01-26 14:18:39.989 | DEBUG    | __main__:trials:24 - Trial = 27457/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.989 | DEBUG    | __main__:trials:29 - Trial = 27457/30000 | Total reward = 54.27
2022-01-26 14:18:39.993 | DEBUG    | __main__:trials:24 - Trial = 27458/30000 | Max number of steps (20) reached
2022-01-26 14:18:39.993 | DEBUG    | __main__:trials:29 - Trial = 27458/30000 | Total reward = 25.94
2022-01-26 14:18:39.998 | DEBUG    | __main__:trials:26 - Trial = 27459/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:39.999 | DEBUG    | __main__:trials:29 - Trial = 27459/30000 | Total reward = 20.00
2022-01-26 14:18:40.002 | DEBUG    | __main__:trials:26 - Trial = 27460/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.004 | DEBUG    | __main__:trials:29 - Trial = 27460/30000 | Total reward = 22.99
2022-01-26 14:18:40.008 | DEBUG    | __main__:trials:24 - Trial = 27461/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.010 | DEBUG    | __main__:trials:29 - Trial = 27461/30000 | Total reward = 27.31
2022-01-26 14:18:40.013 | DEBUG    | __main__:trials:24 - Trial = 27462/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.015 | DEBUG    | __main__:trials:29 - Trial = 27462/30000 | Total reward = 14.39
2022-01-26 14:18:40.018 | DEBUG    | __main__:trials:26 - Trial = 27463/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.019 | DEBUG    | __main__:trials:29 - Trial = 27463/30000 | Total reward = 19.30
2022-01-26 14:18:40.022 | DEBUG    | __main__:trials:26 - Trial = 27464/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.024 | DEBUG    | __main__:trials:29 - Trial = 27464/30000 | Total reward = 19.44
2022-01-26 14:18:40.027 | DEBUG    | __main__:trials:24 - Trial = 27465/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.029 | DEBUG    | __main__:trials:29 - Trial = 27465/30000 | Total reward = 34.37
2022-01-26 14:18:40.031 | DEBUG    | __main__:trials:26 - Trial = 27466/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.033 | DEBUG    | __main__:trials:29 - Trial = 27466/30000 | Total reward = 11.14
2022-01-26 14:18:40.036 | DEBUG    | __main__:trials:24 - Trial = 27467/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.038 | DEBUG    | __main__:trials:29 - Trial = 27467/30000 | Total reward = 24.14
2022-01-26 14:18:40.041 | DEBUG    | __main__:trials:26 - Trial = 27468/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.043 | DEBUG    | __main__:trials:29 - Trial = 27468/30000 | Total reward = 22.85
2022-01-26 14:18:40.047 | DEBUG    | __main__:trials:24 - Trial = 27469/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.048 | DEBUG    | __main__:trials:29 - Trial = 27469/30000 | Total reward = 26.89
2022-01-26 14:18:40.051 | DEBUG    | __main__:trials:26 - Trial = 27470/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.053 | DEBUG    | __main__:trials:29 - Trial = 27470/30000 | Total reward = 13.97
2022-01-26 14:18:40.056 | DEBUG    | __main__:trials:24 - Trial = 27471/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.057 | DEBUG    | __main__:trials:29 - Trial = 27471/30000 | Total reward = 26.56
2022-01-26 14:18:40.059 | DEBUG    | __main__:trials:26 - Trial = 27472/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.060 | DEBUG    | __main__:trials:29 - Trial = 27472/30000 | Total reward = 13.29
2022-01-26 14:18:40.064 | DEBUG    | __main__:trials:24 - Trial = 27473/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.066 | DEBUG    | __main__:trials:29 - Trial = 27473/30000 | Total reward = 25.55
2022-01-26 14:18:40.069 | DEBUG    | __main__:trials:24 - Trial = 27474/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.071 | DEBUG    | __main__:trials:29 - Trial = 27474/30000 | Total reward = 33.76
2022-01-26 14:18:40.074 | DEBUG    | __main__:trials:24 - Trial = 27475/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.076 | DEBUG    | __main__:trials:29 - Trial = 27475/30000 | Total reward = 26.61
2022-01-26 14:18:40.079 | DEBUG    | __main__:trials:24 - Trial = 27476/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.081 | DEBUG    | __main__:trials:29 - Trial = 27476/30000 | Total reward = 38.45
2022-01-26 14:18:40.084 | DEBUG    | __main__:trials:24 - Trial = 27477/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.086 | DEBUG    | __main__:trials:29 - Trial = 27477/30000 | Total reward = 49.27
2022-01-26 14:18:40.090 | DEBUG    | __main__:trials:24 - Trial = 27478/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.091 | DEBUG    | __main__:trials:29 - Trial = 27478/30000 | Total reward = 25.69
2022-01-26 14:18:40.095 | DEBUG    | __main__:trials:24 - Trial = 27479/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.096 | DEBUG    | __main__:trials:29 - Trial = 27479/30000 | Total reward = 47.97
2022-01-26 14:18:40.100 | DEBUG    | __main__:trials:24 - Trial = 27480/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.102 | DEBUG    | __main__:trials:29 - Trial = 27480/30000 | Total reward = 46.01
2022-01-26 14:18:40.106 | DEBUG    | __main__:trials:24 - Trial = 27481/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.107 | DEBUG    | __main__:trials:29 - Trial = 27481/30000 | Total reward = 23.55
2022-01-26 14:18:40.110 | DEBUG    | __main__:trials:26 - Trial = 27482/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.111 | DEBUG    | __main__:trials:29 - Trial = 27482/30000 | Total reward = 10.87
2022-01-26 14:18:40.114 | DEBUG    | __main__:trials:24 - Trial = 27483/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.116 | DEBUG    | __main__:trials:29 - Trial = 27483/30000 | Total reward = 34.49
2022-01-26 14:18:40.120 | DEBUG    | __main__:trials:24 - Trial = 27484/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.121 | DEBUG    | __main__:trials:29 - Trial = 27484/30000 | Total reward = 42.56
2022-01-26 14:18:40.124 | DEBUG    | __main__:trials:26 - Trial = 27485/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.126 | DEBUG    | __main__:trials:29 - Trial = 27485/30000 | Total reward = 29.24
2022-01-26 14:18:40.130 | DEBUG    | __main__:trials:24 - Trial = 27486/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.131 | DEBUG    | __main__:trials:29 - Trial = 27486/30000 | Total reward = 26.58
2022-01-26 14:18:40.134 | DEBUG    | __main__:trials:26 - Trial = 27487/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.135 | DEBUG    | __main__:trials:29 - Trial = 27487/30000 | Total reward = 13.29
2022-01-26 14:18:40.139 | DEBUG    | __main__:trials:24 - Trial = 27488/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.140 | DEBUG    | __main__:trials:29 - Trial = 27488/30000 | Total reward = 30.23
2022-01-26 14:18:40.144 | DEBUG    | __main__:trials:24 - Trial = 27489/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.145 | DEBUG    | __main__:trials:29 - Trial = 27489/30000 | Total reward = 27.19
2022-01-26 14:18:40.148 | DEBUG    | __main__:trials:26 - Trial = 27490/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.150 | DEBUG    | __main__:trials:29 - Trial = 27490/30000 | Total reward = 11.10
2022-01-26 14:18:40.153 | DEBUG    | __main__:trials:26 - Trial = 27491/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.155 | DEBUG    | __main__:trials:29 - Trial = 27491/30000 | Total reward = 33.07
2022-01-26 14:18:40.158 | DEBUG    | __main__:trials:24 - Trial = 27492/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.160 | DEBUG    | __main__:trials:29 - Trial = 27492/30000 | Total reward = 26.10
2022-01-26 14:18:40.163 | DEBUG    | __main__:trials:24 - Trial = 27493/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.165 | DEBUG    | __main__:trials:29 - Trial = 27493/30000 | Total reward = 23.90
2022-01-26 14:18:40.168 | DEBUG    | __main__:trials:26 - Trial = 27494/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.169 | DEBUG    | __main__:trials:29 - Trial = 27494/30000 | Total reward = 15.13
2022-01-26 14:18:40.171 | DEBUG    | __main__:trials:26 - Trial = 27495/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.173 | DEBUG    | __main__:trials:29 - Trial = 27495/30000 | Total reward = 9.22
2022-01-26 14:18:40.176 | DEBUG    | __main__:trials:24 - Trial = 27496/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.178 | DEBUG    | __main__:trials:29 - Trial = 27496/30000 | Total reward = 36.19
2022-01-26 14:18:40.180 | DEBUG    | __main__:trials:26 - Trial = 27497/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.182 | DEBUG    | __main__:trials:29 - Trial = 27497/30000 | Total reward = 11.11
2022-01-26 14:18:40.187 | DEBUG    | __main__:trials:26 - Trial = 27498/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.188 | DEBUG    | __main__:trials:29 - Trial = 27498/30000 | Total reward = 32.68
2022-01-26 14:18:40.190 | DEBUG    | __main__:trials:26 - Trial = 27499/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.192 | DEBUG    | __main__:trials:29 - Trial = 27499/30000 | Total reward = 16.97
2022-01-26 14:18:40.195 | DEBUG    | __main__:trials:26 - Trial = 27500/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.197 | DEBUG    | __main__:trials:29 - Trial = 27500/30000 | Total reward = 15.46
2022-01-26 14:18:40.201 | DEBUG    | __main__:trials:24 - Trial = 27501/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.202 | DEBUG    | __main__:trials:29 - Trial = 27501/30000 | Total reward = 26.61
2022-01-26 14:18:40.206 | DEBUG    | __main__:trials:24 - Trial = 27502/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.207 | DEBUG    | __main__:trials:29 - Trial = 27502/30000 | Total reward = 34.75
2022-01-26 14:18:40.211 | DEBUG    | __main__:trials:24 - Trial = 27503/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.213 | DEBUG    | __main__:trials:29 - Trial = 27503/30000 | Total reward = 27.54
2022-01-26 14:18:40.214 | DEBUG    | __main__:trials:26 - Trial = 27504/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.216 | DEBUG    | __main__:trials:29 - Trial = 27504/30000 | Total reward = 12.01
2022-01-26 14:18:40.219 | DEBUG    | __main__:trials:26 - Trial = 27505/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.220 | DEBUG    | __main__:trials:29 - Trial = 27505/30000 | Total reward = 14.95
2022-01-26 14:18:40.223 | DEBUG    | __main__:trials:26 - Trial = 27506/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.224 | DEBUG    | __main__:trials:29 - Trial = 27506/30000 | Total reward = 8.76
2022-01-26 14:18:40.227 | DEBUG    | __main__:trials:26 - Trial = 27507/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.228 | DEBUG    | __main__:trials:29 - Trial = 27507/30000 | Total reward = 13.29
2022-01-26 14:18:40.231 | DEBUG    | __main__:trials:26 - Trial = 27508/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.233 | DEBUG    | __main__:trials:29 - Trial = 27508/30000 | Total reward = 11.82
2022-01-26 14:18:40.236 | DEBUG    | __main__:trials:24 - Trial = 27509/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.237 | DEBUG    | __main__:trials:29 - Trial = 27509/30000 | Total reward = 50.22
2022-01-26 14:18:40.240 | DEBUG    | __main__:trials:24 - Trial = 27510/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.242 | DEBUG    | __main__:trials:29 - Trial = 27510/30000 | Total reward = 23.91
2022-01-26 14:18:40.245 | DEBUG    | __main__:trials:24 - Trial = 27511/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.246 | DEBUG    | __main__:trials:29 - Trial = 27511/30000 | Total reward = 27.87
2022-01-26 14:18:40.248 | DEBUG    | __main__:trials:26 - Trial = 27512/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.250 | DEBUG    | __main__:trials:29 - Trial = 27512/30000 | Total reward = 12.94
2022-01-26 14:18:40.253 | DEBUG    | __main__:trials:26 - Trial = 27513/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.254 | DEBUG    | __main__:trials:29 - Trial = 27513/30000 | Total reward = 18.80
2022-01-26 14:18:40.258 | DEBUG    | __main__:trials:24 - Trial = 27514/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.259 | DEBUG    | __main__:trials:29 - Trial = 27514/30000 | Total reward = 23.15
2022-01-26 14:18:40.263 | DEBUG    | __main__:trials:26 - Trial = 27515/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.264 | DEBUG    | __main__:trials:29 - Trial = 27515/30000 | Total reward = 13.58
2022-01-26 14:18:40.268 | DEBUG    | __main__:trials:24 - Trial = 27516/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.269 | DEBUG    | __main__:trials:29 - Trial = 27516/30000 | Total reward = 24.75
2022-01-26 14:18:40.271 | DEBUG    | __main__:trials:26 - Trial = 27517/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.273 | DEBUG    | __main__:trials:29 - Trial = 27517/30000 | Total reward = 6.85
2022-01-26 14:18:40.276 | DEBUG    | __main__:trials:26 - Trial = 27518/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.277 | DEBUG    | __main__:trials:29 - Trial = 27518/30000 | Total reward = 7.07
2022-01-26 14:18:40.280 | DEBUG    | __main__:trials:26 - Trial = 27519/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.282 | DEBUG    | __main__:trials:29 - Trial = 27519/30000 | Total reward = 9.77
2022-01-26 14:18:40.285 | DEBUG    | __main__:trials:26 - Trial = 27520/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.286 | DEBUG    | __main__:trials:29 - Trial = 27520/30000 | Total reward = 27.59
2022-01-26 14:18:40.288 | DEBUG    | __main__:trials:26 - Trial = 27521/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.289 | DEBUG    | __main__:trials:29 - Trial = 27521/30000 | Total reward = 11.55
2022-01-26 14:18:40.292 | DEBUG    | __main__:trials:26 - Trial = 27522/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.294 | DEBUG    | __main__:trials:29 - Trial = 27522/30000 | Total reward = 38.89
2022-01-26 14:18:40.297 | DEBUG    | __main__:trials:26 - Trial = 27523/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.298 | DEBUG    | __main__:trials:29 - Trial = 27523/30000 | Total reward = 13.29
2022-01-26 14:18:40.301 | DEBUG    | __main__:trials:24 - Trial = 27524/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.302 | DEBUG    | __main__:trials:29 - Trial = 27524/30000 | Total reward = 33.29
2022-01-26 14:18:40.305 | DEBUG    | __main__:trials:24 - Trial = 27525/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.305 | DEBUG    | __main__:trials:29 - Trial = 27525/30000 | Total reward = 48.52
2022-01-26 14:18:40.310 | DEBUG    | __main__:trials:24 - Trial = 27526/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.311 | DEBUG    | __main__:trials:29 - Trial = 27526/30000 | Total reward = 20.88
2022-01-26 14:18:40.315 | DEBUG    | __main__:trials:24 - Trial = 27527/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.316 | DEBUG    | __main__:trials:29 - Trial = 27527/30000 | Total reward = 52.34
2022-01-26 14:18:40.320 | DEBUG    | __main__:trials:24 - Trial = 27528/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.321 | DEBUG    | __main__:trials:29 - Trial = 27528/30000 | Total reward = 19.06
2022-01-26 14:18:40.324 | DEBUG    | __main__:trials:26 - Trial = 27529/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.326 | DEBUG    | __main__:trials:29 - Trial = 27529/30000 | Total reward = 12.96
2022-01-26 14:18:40.330 | DEBUG    | __main__:trials:24 - Trial = 27530/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.331 | DEBUG    | __main__:trials:29 - Trial = 27530/30000 | Total reward = 28.46
2022-01-26 14:18:40.333 | DEBUG    | __main__:trials:26 - Trial = 27531/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.335 | DEBUG    | __main__:trials:29 - Trial = 27531/30000 | Total reward = 16.03
2022-01-26 14:18:40.339 | DEBUG    | __main__:trials:24 - Trial = 27532/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.340 | DEBUG    | __main__:trials:29 - Trial = 27532/30000 | Total reward = 29.82
2022-01-26 14:18:40.344 | DEBUG    | __main__:trials:24 - Trial = 27533/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.346 | DEBUG    | __main__:trials:29 - Trial = 27533/30000 | Total reward = 49.74
2022-01-26 14:18:40.349 | DEBUG    | __main__:trials:26 - Trial = 27534/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.350 | DEBUG    | __main__:trials:29 - Trial = 27534/30000 | Total reward = 27.59
2022-01-26 14:18:40.354 | DEBUG    | __main__:trials:24 - Trial = 27535/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.356 | DEBUG    | __main__:trials:29 - Trial = 27535/30000 | Total reward = 26.94
2022-01-26 14:18:40.359 | DEBUG    | __main__:trials:24 - Trial = 27536/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.361 | DEBUG    | __main__:trials:29 - Trial = 27536/30000 | Total reward = 57.78
2022-01-26 14:18:40.363 | DEBUG    | __main__:trials:26 - Trial = 27537/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.365 | DEBUG    | __main__:trials:29 - Trial = 27537/30000 | Total reward = 12.79
2022-01-26 14:18:40.368 | DEBUG    | __main__:trials:24 - Trial = 27538/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.370 | DEBUG    | __main__:trials:29 - Trial = 27538/30000 | Total reward = 18.66
2022-01-26 14:18:40.373 | DEBUG    | __main__:trials:24 - Trial = 27539/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.374 | DEBUG    | __main__:trials:29 - Trial = 27539/30000 | Total reward = 38.86
2022-01-26 14:18:40.376 | DEBUG    | __main__:trials:26 - Trial = 27540/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.378 | DEBUG    | __main__:trials:29 - Trial = 27540/30000 | Total reward = 8.09
2022-01-26 14:18:40.382 | DEBUG    | __main__:trials:24 - Trial = 27541/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.383 | DEBUG    | __main__:trials:29 - Trial = 27541/30000 | Total reward = 19.01
2022-01-26 14:18:40.386 | DEBUG    | __main__:trials:24 - Trial = 27542/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.388 | DEBUG    | __main__:trials:29 - Trial = 27542/30000 | Total reward = 51.17
2022-01-26 14:18:40.389 | DEBUG    | __main__:trials:26 - Trial = 27543/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.391 | DEBUG    | __main__:trials:29 - Trial = 27543/30000 | Total reward = 11.01
2022-01-26 14:18:40.395 | DEBUG    | __main__:trials:24 - Trial = 27544/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.397 | DEBUG    | __main__:trials:29 - Trial = 27544/30000 | Total reward = 46.15
2022-01-26 14:18:40.399 | DEBUG    | __main__:trials:26 - Trial = 27545/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.400 | DEBUG    | __main__:trials:29 - Trial = 27545/30000 | Total reward = 10.87
2022-01-26 14:18:40.404 | DEBUG    | __main__:trials:24 - Trial = 27546/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.406 | DEBUG    | __main__:trials:29 - Trial = 27546/30000 | Total reward = 47.72
2022-01-26 14:18:40.409 | DEBUG    | __main__:trials:26 - Trial = 27547/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.409 | DEBUG    | __main__:trials:29 - Trial = 27547/30000 | Total reward = 10.75
2022-01-26 14:18:40.411 | DEBUG    | __main__:trials:26 - Trial = 27548/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.412 | DEBUG    | __main__:trials:29 - Trial = 27548/30000 | Total reward = 11.88
2022-01-26 14:18:40.414 | DEBUG    | __main__:trials:26 - Trial = 27549/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.416 | DEBUG    | __main__:trials:29 - Trial = 27549/30000 | Total reward = 13.29
2022-01-26 14:18:40.419 | DEBUG    | __main__:trials:26 - Trial = 27550/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.420 | DEBUG    | __main__:trials:29 - Trial = 27550/30000 | Total reward = 20.58
2022-01-26 14:18:40.424 | DEBUG    | __main__:trials:24 - Trial = 27551/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.425 | DEBUG    | __main__:trials:29 - Trial = 27551/30000 | Total reward = 50.60
2022-01-26 14:18:40.429 | DEBUG    | __main__:trials:26 - Trial = 27552/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.430 | DEBUG    | __main__:trials:29 - Trial = 27552/30000 | Total reward = 9.01
2022-01-26 14:18:40.433 | DEBUG    | __main__:trials:26 - Trial = 27553/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.433 | DEBUG    | __main__:trials:29 - Trial = 27553/30000 | Total reward = 11.01
2022-01-26 14:18:40.436 | DEBUG    | __main__:trials:24 - Trial = 27554/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.437 | DEBUG    | __main__:trials:29 - Trial = 27554/30000 | Total reward = 32.62
2022-01-26 14:18:40.440 | DEBUG    | __main__:trials:26 - Trial = 27555/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.442 | DEBUG    | __main__:trials:29 - Trial = 27555/30000 | Total reward = 16.30
2022-01-26 14:18:40.444 | DEBUG    | __main__:trials:26 - Trial = 27556/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.445 | DEBUG    | __main__:trials:29 - Trial = 27556/30000 | Total reward = 9.07
2022-01-26 14:18:40.449 | DEBUG    | __main__:trials:24 - Trial = 27557/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.451 | DEBUG    | __main__:trials:29 - Trial = 27557/30000 | Total reward = 29.66
2022-01-26 14:18:40.452 | DEBUG    | __main__:trials:26 - Trial = 27558/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.454 | DEBUG    | __main__:trials:29 - Trial = 27558/30000 | Total reward = 10.12
2022-01-26 14:18:40.458 | DEBUG    | __main__:trials:24 - Trial = 27559/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.459 | DEBUG    | __main__:trials:29 - Trial = 27559/30000 | Total reward = 27.86
2022-01-26 14:18:40.461 | DEBUG    | __main__:trials:26 - Trial = 27560/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.462 | DEBUG    | __main__:trials:29 - Trial = 27560/30000 | Total reward = 13.29
2022-01-26 14:18:40.464 | DEBUG    | __main__:trials:26 - Trial = 27561/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.465 | DEBUG    | __main__:trials:29 - Trial = 27561/30000 | Total reward = 12.01
2022-01-26 14:18:40.469 | DEBUG    | __main__:trials:24 - Trial = 27562/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.470 | DEBUG    | __main__:trials:29 - Trial = 27562/30000 | Total reward = 50.44
2022-01-26 14:18:40.474 | DEBUG    | __main__:trials:24 - Trial = 27563/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.475 | DEBUG    | __main__:trials:29 - Trial = 27563/30000 | Total reward = 42.06
2022-01-26 14:18:40.479 | DEBUG    | __main__:trials:26 - Trial = 27564/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.480 | DEBUG    | __main__:trials:29 - Trial = 27564/30000 | Total reward = 15.56
2022-01-26 14:18:40.482 | DEBUG    | __main__:trials:26 - Trial = 27565/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.483 | DEBUG    | __main__:trials:29 - Trial = 27565/30000 | Total reward = 10.99
2022-01-26 14:18:40.487 | DEBUG    | __main__:trials:24 - Trial = 27566/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.488 | DEBUG    | __main__:trials:29 - Trial = 27566/30000 | Total reward = 42.32
2022-01-26 14:18:40.492 | DEBUG    | __main__:trials:24 - Trial = 27567/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.494 | DEBUG    | __main__:trials:29 - Trial = 27567/30000 | Total reward = 31.57
2022-01-26 14:18:40.497 | DEBUG    | __main__:trials:24 - Trial = 27568/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.498 | DEBUG    | __main__:trials:29 - Trial = 27568/30000 | Total reward = 27.82
2022-01-26 14:18:40.501 | DEBUG    | __main__:trials:26 - Trial = 27569/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.502 | DEBUG    | __main__:trials:29 - Trial = 27569/30000 | Total reward = 12.32
2022-01-26 14:18:40.506 | DEBUG    | __main__:trials:24 - Trial = 27570/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.508 | DEBUG    | __main__:trials:29 - Trial = 27570/30000 | Total reward = 27.91
2022-01-26 14:18:40.511 | DEBUG    | __main__:trials:24 - Trial = 27571/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.513 | DEBUG    | __main__:trials:29 - Trial = 27571/30000 | Total reward = 23.73
2022-01-26 14:18:40.516 | DEBUG    | __main__:trials:24 - Trial = 27572/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.518 | DEBUG    | __main__:trials:29 - Trial = 27572/30000 | Total reward = 27.71
2022-01-26 14:18:40.522 | DEBUG    | __main__:trials:24 - Trial = 27573/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.523 | DEBUG    | __main__:trials:29 - Trial = 27573/30000 | Total reward = 29.82
2022-01-26 14:18:40.527 | DEBUG    | __main__:trials:26 - Trial = 27574/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.528 | DEBUG    | __main__:trials:29 - Trial = 27574/30000 | Total reward = 7.24
2022-01-26 14:18:40.532 | DEBUG    | __main__:trials:24 - Trial = 27575/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.534 | DEBUG    | __main__:trials:29 - Trial = 27575/30000 | Total reward = 35.68
2022-01-26 14:18:40.537 | DEBUG    | __main__:trials:24 - Trial = 27576/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.539 | DEBUG    | __main__:trials:29 - Trial = 27576/30000 | Total reward = 45.20
2022-01-26 14:18:40.542 | DEBUG    | __main__:trials:24 - Trial = 27577/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.544 | DEBUG    | __main__:trials:29 - Trial = 27577/30000 | Total reward = 25.54
2022-01-26 14:18:40.548 | DEBUG    | __main__:trials:24 - Trial = 27578/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.549 | DEBUG    | __main__:trials:29 - Trial = 27578/30000 | Total reward = 31.56
2022-01-26 14:18:40.553 | DEBUG    | __main__:trials:24 - Trial = 27579/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.554 | DEBUG    | __main__:trials:29 - Trial = 27579/30000 | Total reward = 43.31
2022-01-26 14:18:40.558 | DEBUG    | __main__:trials:24 - Trial = 27580/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.559 | DEBUG    | __main__:trials:29 - Trial = 27580/30000 | Total reward = 35.45
2022-01-26 14:18:40.563 | DEBUG    | __main__:trials:24 - Trial = 27581/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.564 | DEBUG    | __main__:trials:29 - Trial = 27581/30000 | Total reward = 51.54
2022-01-26 14:18:40.568 | DEBUG    | __main__:trials:24 - Trial = 27582/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.570 | DEBUG    | __main__:trials:29 - Trial = 27582/30000 | Total reward = 17.55
2022-01-26 14:18:40.573 | DEBUG    | __main__:trials:26 - Trial = 27583/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.575 | DEBUG    | __main__:trials:29 - Trial = 27583/30000 | Total reward = 24.26
2022-01-26 14:18:40.578 | DEBUG    | __main__:trials:24 - Trial = 27584/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.580 | DEBUG    | __main__:trials:29 - Trial = 27584/30000 | Total reward = 39.70
2022-01-26 14:18:40.583 | DEBUG    | __main__:trials:24 - Trial = 27585/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.585 | DEBUG    | __main__:trials:29 - Trial = 27585/30000 | Total reward = 34.20
2022-01-26 14:18:40.588 | DEBUG    | __main__:trials:24 - Trial = 27586/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.590 | DEBUG    | __main__:trials:29 - Trial = 27586/30000 | Total reward = 28.59
2022-01-26 14:18:40.593 | DEBUG    | __main__:trials:26 - Trial = 27587/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.595 | DEBUG    | __main__:trials:29 - Trial = 27587/30000 | Total reward = 17.75
2022-01-26 14:18:40.598 | DEBUG    | __main__:trials:24 - Trial = 27588/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.600 | DEBUG    | __main__:trials:29 - Trial = 27588/30000 | Total reward = 19.68
2022-01-26 14:18:40.604 | DEBUG    | __main__:trials:24 - Trial = 27589/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.604 | DEBUG    | __main__:trials:29 - Trial = 27589/30000 | Total reward = 21.78
2022-01-26 14:18:40.609 | DEBUG    | __main__:trials:24 - Trial = 27590/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.610 | DEBUG    | __main__:trials:29 - Trial = 27590/30000 | Total reward = 43.68
2022-01-26 14:18:40.614 | DEBUG    | __main__:trials:24 - Trial = 27591/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.616 | DEBUG    | __main__:trials:29 - Trial = 27591/30000 | Total reward = 41.08
2022-01-26 14:18:40.620 | DEBUG    | __main__:trials:24 - Trial = 27592/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.620 | DEBUG    | __main__:trials:29 - Trial = 27592/30000 | Total reward = 28.13
2022-01-26 14:18:40.624 | DEBUG    | __main__:trials:24 - Trial = 27593/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.626 | DEBUG    | __main__:trials:29 - Trial = 27593/30000 | Total reward = 27.77
2022-01-26 14:18:40.629 | DEBUG    | __main__:trials:26 - Trial = 27594/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.631 | DEBUG    | __main__:trials:29 - Trial = 27594/30000 | Total reward = 25.05
2022-01-26 14:18:40.634 | DEBUG    | __main__:trials:24 - Trial = 27595/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.636 | DEBUG    | __main__:trials:29 - Trial = 27595/30000 | Total reward = 30.71
2022-01-26 14:18:40.640 | DEBUG    | __main__:trials:24 - Trial = 27596/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.641 | DEBUG    | __main__:trials:29 - Trial = 27596/30000 | Total reward = 37.74
2022-01-26 14:18:40.645 | DEBUG    | __main__:trials:26 - Trial = 27597/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.646 | DEBUG    | __main__:trials:29 - Trial = 27597/30000 | Total reward = 24.94
2022-01-26 14:18:40.648 | DEBUG    | __main__:trials:26 - Trial = 27598/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.648 | DEBUG    | __main__:trials:29 - Trial = 27598/30000 | Total reward = 8.09
2022-01-26 14:18:40.652 | DEBUG    | __main__:trials:24 - Trial = 27599/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.654 | DEBUG    | __main__:trials:29 - Trial = 27599/30000 | Total reward = 16.80
2022-01-26 14:18:40.657 | DEBUG    | __main__:trials:24 - Trial = 27600/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.658 | DEBUG    | __main__:trials:29 - Trial = 27600/30000 | Total reward = 24.95
2022-01-26 14:18:40.662 | DEBUG    | __main__:trials:24 - Trial = 27601/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.664 | DEBUG    | __main__:trials:29 - Trial = 27601/30000 | Total reward = 36.29
2022-01-26 14:18:40.667 | DEBUG    | __main__:trials:26 - Trial = 27602/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.668 | DEBUG    | __main__:trials:29 - Trial = 27602/30000 | Total reward = 17.46
2022-01-26 14:18:40.671 | DEBUG    | __main__:trials:24 - Trial = 27603/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.673 | DEBUG    | __main__:trials:29 - Trial = 27603/30000 | Total reward = 29.85
2022-01-26 14:18:40.677 | DEBUG    | __main__:trials:24 - Trial = 27604/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.678 | DEBUG    | __main__:trials:29 - Trial = 27604/30000 | Total reward = 27.38
2022-01-26 14:18:40.681 | DEBUG    | __main__:trials:24 - Trial = 27605/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.683 | DEBUG    | __main__:trials:29 - Trial = 27605/30000 | Total reward = 38.51
2022-01-26 14:18:40.686 | DEBUG    | __main__:trials:24 - Trial = 27606/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.687 | DEBUG    | __main__:trials:29 - Trial = 27606/30000 | Total reward = 30.17
2022-01-26 14:18:40.690 | DEBUG    | __main__:trials:24 - Trial = 27607/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.692 | DEBUG    | __main__:trials:29 - Trial = 27607/30000 | Total reward = 30.93
2022-01-26 14:18:40.695 | DEBUG    | __main__:trials:26 - Trial = 27608/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.696 | DEBUG    | __main__:trials:29 - Trial = 27608/30000 | Total reward = 9.66
2022-01-26 14:18:40.699 | DEBUG    | __main__:trials:24 - Trial = 27609/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.701 | DEBUG    | __main__:trials:29 - Trial = 27609/30000 | Total reward = 50.58
2022-01-26 14:18:40.705 | DEBUG    | __main__:trials:26 - Trial = 27610/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.705 | DEBUG    | __main__:trials:29 - Trial = 27610/30000 | Total reward = 31.70
2022-01-26 14:18:40.708 | DEBUG    | __main__:trials:26 - Trial = 27611/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.710 | DEBUG    | __main__:trials:29 - Trial = 27611/30000 | Total reward = 12.62
2022-01-26 14:18:40.714 | DEBUG    | __main__:trials:24 - Trial = 27612/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.715 | DEBUG    | __main__:trials:29 - Trial = 27612/30000 | Total reward = 20.04
2022-01-26 14:18:40.719 | DEBUG    | __main__:trials:24 - Trial = 27613/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.720 | DEBUG    | __main__:trials:29 - Trial = 27613/30000 | Total reward = 52.08
2022-01-26 14:18:40.722 | DEBUG    | __main__:trials:26 - Trial = 27614/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.724 | DEBUG    | __main__:trials:29 - Trial = 27614/30000 | Total reward = 11.75
2022-01-26 14:18:40.728 | DEBUG    | __main__:trials:24 - Trial = 27615/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.730 | DEBUG    | __main__:trials:29 - Trial = 27615/30000 | Total reward = 20.29
2022-01-26 14:18:40.733 | DEBUG    | __main__:trials:24 - Trial = 27616/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.735 | DEBUG    | __main__:trials:29 - Trial = 27616/30000 | Total reward = 35.01
2022-01-26 14:18:40.739 | DEBUG    | __main__:trials:24 - Trial = 27617/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.740 | DEBUG    | __main__:trials:29 - Trial = 27617/30000 | Total reward = 28.40
2022-01-26 14:18:40.744 | DEBUG    | __main__:trials:24 - Trial = 27618/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.746 | DEBUG    | __main__:trials:29 - Trial = 27618/30000 | Total reward = 48.54
2022-01-26 14:18:40.748 | DEBUG    | __main__:trials:26 - Trial = 27619/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.749 | DEBUG    | __main__:trials:29 - Trial = 27619/30000 | Total reward = 9.07
2022-01-26 14:18:40.752 | DEBUG    | __main__:trials:24 - Trial = 27620/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.754 | DEBUG    | __main__:trials:29 - Trial = 27620/30000 | Total reward = 30.75
2022-01-26 14:18:40.757 | DEBUG    | __main__:trials:24 - Trial = 27621/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.758 | DEBUG    | __main__:trials:29 - Trial = 27621/30000 | Total reward = 53.95
2022-01-26 14:18:40.761 | DEBUG    | __main__:trials:24 - Trial = 27622/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.763 | DEBUG    | __main__:trials:29 - Trial = 27622/30000 | Total reward = 36.17
2022-01-26 14:18:40.766 | DEBUG    | __main__:trials:26 - Trial = 27623/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.768 | DEBUG    | __main__:trials:29 - Trial = 27623/30000 | Total reward = 19.30
2022-01-26 14:18:40.771 | DEBUG    | __main__:trials:26 - Trial = 27624/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.772 | DEBUG    | __main__:trials:29 - Trial = 27624/30000 | Total reward = 19.01
2022-01-26 14:18:40.776 | DEBUG    | __main__:trials:24 - Trial = 27625/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.777 | DEBUG    | __main__:trials:29 - Trial = 27625/30000 | Total reward = 23.06
2022-01-26 14:18:40.781 | DEBUG    | __main__:trials:24 - Trial = 27626/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.782 | DEBUG    | __main__:trials:29 - Trial = 27626/30000 | Total reward = 28.18
2022-01-26 14:18:40.785 | DEBUG    | __main__:trials:26 - Trial = 27627/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.787 | DEBUG    | __main__:trials:29 - Trial = 27627/30000 | Total reward = 15.84
2022-01-26 14:18:40.790 | DEBUG    | __main__:trials:26 - Trial = 27628/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.792 | DEBUG    | __main__:trials:29 - Trial = 27628/30000 | Total reward = 25.62
2022-01-26 14:18:40.795 | DEBUG    | __main__:trials:26 - Trial = 27629/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.796 | DEBUG    | __main__:trials:29 - Trial = 27629/30000 | Total reward = 10.79
2022-01-26 14:18:40.800 | DEBUG    | __main__:trials:24 - Trial = 27630/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.801 | DEBUG    | __main__:trials:29 - Trial = 27630/30000 | Total reward = 28.24
2022-01-26 14:18:40.804 | DEBUG    | __main__:trials:24 - Trial = 27631/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.806 | DEBUG    | __main__:trials:29 - Trial = 27631/30000 | Total reward = 42.29
2022-01-26 14:18:40.810 | DEBUG    | __main__:trials:24 - Trial = 27632/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.811 | DEBUG    | __main__:trials:29 - Trial = 27632/30000 | Total reward = 30.07
2022-01-26 14:18:40.815 | DEBUG    | __main__:trials:26 - Trial = 27633/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.817 | DEBUG    | __main__:trials:29 - Trial = 27633/30000 | Total reward = 19.36
2022-01-26 14:18:40.820 | DEBUG    | __main__:trials:26 - Trial = 27634/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.822 | DEBUG    | __main__:trials:29 - Trial = 27634/30000 | Total reward = 14.50
2022-01-26 14:18:40.825 | DEBUG    | __main__:trials:26 - Trial = 27635/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.826 | DEBUG    | __main__:trials:29 - Trial = 27635/30000 | Total reward = 17.58
2022-01-26 14:18:40.829 | DEBUG    | __main__:trials:24 - Trial = 27636/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.831 | DEBUG    | __main__:trials:29 - Trial = 27636/30000 | Total reward = 31.21
2022-01-26 14:18:40.834 | DEBUG    | __main__:trials:26 - Trial = 27637/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.836 | DEBUG    | __main__:trials:29 - Trial = 27637/30000 | Total reward = 6.28
2022-01-26 14:18:40.838 | DEBUG    | __main__:trials:26 - Trial = 27638/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.840 | DEBUG    | __main__:trials:29 - Trial = 27638/30000 | Total reward = 13.61
2022-01-26 14:18:40.842 | DEBUG    | __main__:trials:26 - Trial = 27639/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.843 | DEBUG    | __main__:trials:29 - Trial = 27639/30000 | Total reward = 7.70
2022-01-26 14:18:40.846 | DEBUG    | __main__:trials:26 - Trial = 27640/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.848 | DEBUG    | __main__:trials:29 - Trial = 27640/30000 | Total reward = 20.52
2022-01-26 14:18:40.852 | DEBUG    | __main__:trials:26 - Trial = 27641/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.854 | DEBUG    | __main__:trials:29 - Trial = 27641/30000 | Total reward = 23.72
2022-01-26 14:18:40.857 | DEBUG    | __main__:trials:24 - Trial = 27642/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.859 | DEBUG    | __main__:trials:29 - Trial = 27642/30000 | Total reward = 24.26
2022-01-26 14:18:40.862 | DEBUG    | __main__:trials:24 - Trial = 27643/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.864 | DEBUG    | __main__:trials:29 - Trial = 27643/30000 | Total reward = 30.21
2022-01-26 14:18:40.867 | DEBUG    | __main__:trials:24 - Trial = 27644/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.868 | DEBUG    | __main__:trials:29 - Trial = 27644/30000 | Total reward = 38.75
2022-01-26 14:18:40.873 | DEBUG    | __main__:trials:24 - Trial = 27645/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.874 | DEBUG    | __main__:trials:29 - Trial = 27645/30000 | Total reward = 36.73
2022-01-26 14:18:40.878 | DEBUG    | __main__:trials:24 - Trial = 27646/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.878 | DEBUG    | __main__:trials:29 - Trial = 27646/30000 | Total reward = 30.57
2022-01-26 14:18:40.882 | DEBUG    | __main__:trials:24 - Trial = 27647/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.884 | DEBUG    | __main__:trials:29 - Trial = 27647/30000 | Total reward = 49.61
2022-01-26 14:18:40.887 | DEBUG    | __main__:trials:24 - Trial = 27648/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.889 | DEBUG    | __main__:trials:29 - Trial = 27648/30000 | Total reward = 41.69
2022-01-26 14:18:40.892 | DEBUG    | __main__:trials:26 - Trial = 27649/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.894 | DEBUG    | __main__:trials:29 - Trial = 27649/30000 | Total reward = 20.68
2022-01-26 14:18:40.898 | DEBUG    | __main__:trials:26 - Trial = 27650/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.899 | DEBUG    | __main__:trials:29 - Trial = 27650/30000 | Total reward = 26.33
2022-01-26 14:18:40.903 | DEBUG    | __main__:trials:24 - Trial = 27651/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.905 | DEBUG    | __main__:trials:29 - Trial = 27651/30000 | Total reward = 52.51
2022-01-26 14:18:40.907 | DEBUG    | __main__:trials:26 - Trial = 27652/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.909 | DEBUG    | __main__:trials:29 - Trial = 27652/30000 | Total reward = 8.73
2022-01-26 14:18:40.912 | DEBUG    | __main__:trials:24 - Trial = 27653/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.914 | DEBUG    | __main__:trials:29 - Trial = 27653/30000 | Total reward = 23.02
2022-01-26 14:18:40.917 | DEBUG    | __main__:trials:26 - Trial = 27654/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.919 | DEBUG    | __main__:trials:29 - Trial = 27654/30000 | Total reward = 19.83
2022-01-26 14:18:40.923 | DEBUG    | __main__:trials:24 - Trial = 27655/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.924 | DEBUG    | __main__:trials:29 - Trial = 27655/30000 | Total reward = 47.51
2022-01-26 14:18:40.928 | DEBUG    | __main__:trials:24 - Trial = 27656/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.929 | DEBUG    | __main__:trials:29 - Trial = 27656/30000 | Total reward = 24.55
2022-01-26 14:18:40.934 | DEBUG    | __main__:trials:24 - Trial = 27657/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.936 | DEBUG    | __main__:trials:29 - Trial = 27657/30000 | Total reward = 24.54
2022-01-26 14:18:40.939 | DEBUG    | __main__:trials:26 - Trial = 27658/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.941 | DEBUG    | __main__:trials:29 - Trial = 27658/30000 | Total reward = 18.77
2022-01-26 14:18:40.944 | DEBUG    | __main__:trials:24 - Trial = 27659/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.946 | DEBUG    | __main__:trials:29 - Trial = 27659/30000 | Total reward = 40.79
2022-01-26 14:18:40.948 | DEBUG    | __main__:trials:26 - Trial = 27660/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.950 | DEBUG    | __main__:trials:29 - Trial = 27660/30000 | Total reward = 14.95
2022-01-26 14:18:40.953 | DEBUG    | __main__:trials:24 - Trial = 27661/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.955 | DEBUG    | __main__:trials:29 - Trial = 27661/30000 | Total reward = 46.38
2022-01-26 14:18:40.959 | DEBUG    | __main__:trials:24 - Trial = 27662/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.960 | DEBUG    | __main__:trials:29 - Trial = 27662/30000 | Total reward = 32.94
2022-01-26 14:18:40.964 | DEBUG    | __main__:trials:26 - Trial = 27663/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.965 | DEBUG    | __main__:trials:29 - Trial = 27663/30000 | Total reward = 20.61
2022-01-26 14:18:40.968 | DEBUG    | __main__:trials:26 - Trial = 27664/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.969 | DEBUG    | __main__:trials:29 - Trial = 27664/30000 | Total reward = 7.80
2022-01-26 14:18:40.971 | DEBUG    | __main__:trials:26 - Trial = 27665/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.973 | DEBUG    | __main__:trials:29 - Trial = 27665/30000 | Total reward = 13.29
2022-01-26 14:18:40.976 | DEBUG    | __main__:trials:26 - Trial = 27666/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.978 | DEBUG    | __main__:trials:29 - Trial = 27666/30000 | Total reward = 24.48
2022-01-26 14:18:40.981 | DEBUG    | __main__:trials:24 - Trial = 27667/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.983 | DEBUG    | __main__:trials:29 - Trial = 27667/30000 | Total reward = 40.76
2022-01-26 14:18:40.985 | DEBUG    | __main__:trials:26 - Trial = 27668/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.986 | DEBUG    | __main__:trials:29 - Trial = 27668/30000 | Total reward = 18.04
2022-01-26 14:18:40.989 | DEBUG    | __main__:trials:26 - Trial = 27669/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.990 | DEBUG    | __main__:trials:29 - Trial = 27669/30000 | Total reward = 15.57
2022-01-26 14:18:40.993 | DEBUG    | __main__:trials:24 - Trial = 27670/30000 | Max number of steps (20) reached
2022-01-26 14:18:40.994 | DEBUG    | __main__:trials:29 - Trial = 27670/30000 | Total reward = 31.83
2022-01-26 14:18:40.997 | DEBUG    | __main__:trials:26 - Trial = 27671/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:40.998 | DEBUG    | __main__:trials:29 - Trial = 27671/30000 | Total reward = 17.89
2022-01-26 14:18:41.002 | DEBUG    | __main__:trials:24 - Trial = 27672/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.004 | DEBUG    | __main__:trials:29 - Trial = 27672/30000 | Total reward = 31.27
2022-01-26 14:18:41.007 | DEBUG    | __main__:trials:24 - Trial = 27673/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.009 | DEBUG    | __main__:trials:29 - Trial = 27673/30000 | Total reward = 22.49
2022-01-26 14:18:41.012 | DEBUG    | __main__:trials:24 - Trial = 27674/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.014 | DEBUG    | __main__:trials:29 - Trial = 27674/30000 | Total reward = 24.22
2022-01-26 14:18:41.017 | DEBUG    | __main__:trials:26 - Trial = 27675/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.019 | DEBUG    | __main__:trials:29 - Trial = 27675/30000 | Total reward = 22.12
2022-01-26 14:18:41.021 | DEBUG    | __main__:trials:26 - Trial = 27676/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.023 | DEBUG    | __main__:trials:29 - Trial = 27676/30000 | Total reward = 10.75
2022-01-26 14:18:41.026 | DEBUG    | __main__:trials:24 - Trial = 27677/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.028 | DEBUG    | __main__:trials:29 - Trial = 27677/30000 | Total reward = 28.64
2022-01-26 14:18:41.032 | DEBUG    | __main__:trials:24 - Trial = 27678/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.033 | DEBUG    | __main__:trials:29 - Trial = 27678/30000 | Total reward = 35.28
2022-01-26 14:18:41.036 | DEBUG    | __main__:trials:26 - Trial = 27679/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.038 | DEBUG    | __main__:trials:29 - Trial = 27679/30000 | Total reward = 8.92
2022-01-26 14:18:41.042 | DEBUG    | __main__:trials:24 - Trial = 27680/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.043 | DEBUG    | __main__:trials:29 - Trial = 27680/30000 | Total reward = 47.58
2022-01-26 14:18:41.047 | DEBUG    | __main__:trials:26 - Trial = 27681/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.049 | DEBUG    | __main__:trials:29 - Trial = 27681/30000 | Total reward = 27.24
2022-01-26 14:18:41.052 | DEBUG    | __main__:trials:24 - Trial = 27682/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.053 | DEBUG    | __main__:trials:29 - Trial = 27682/30000 | Total reward = 24.70
2022-01-26 14:18:41.057 | DEBUG    | __main__:trials:26 - Trial = 27683/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.058 | DEBUG    | __main__:trials:29 - Trial = 27683/30000 | Total reward = 27.08
2022-01-26 14:18:41.062 | DEBUG    | __main__:trials:24 - Trial = 27684/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.063 | DEBUG    | __main__:trials:29 - Trial = 27684/30000 | Total reward = 43.41
2022-01-26 14:18:41.067 | DEBUG    | __main__:trials:24 - Trial = 27685/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.069 | DEBUG    | __main__:trials:29 - Trial = 27685/30000 | Total reward = 25.41
2022-01-26 14:18:41.072 | DEBUG    | __main__:trials:24 - Trial = 27686/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.074 | DEBUG    | __main__:trials:29 - Trial = 27686/30000 | Total reward = 25.71
2022-01-26 14:18:41.078 | DEBUG    | __main__:trials:24 - Trial = 27687/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.079 | DEBUG    | __main__:trials:29 - Trial = 27687/30000 | Total reward = 41.49
2022-01-26 14:18:41.083 | DEBUG    | __main__:trials:24 - Trial = 27688/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.084 | DEBUG    | __main__:trials:29 - Trial = 27688/30000 | Total reward = 24.24
2022-01-26 14:18:41.088 | DEBUG    | __main__:trials:24 - Trial = 27689/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.089 | DEBUG    | __main__:trials:29 - Trial = 27689/30000 | Total reward = 24.41
2022-01-26 14:18:41.093 | DEBUG    | __main__:trials:24 - Trial = 27690/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.094 | DEBUG    | __main__:trials:29 - Trial = 27690/30000 | Total reward = 34.30
2022-01-26 14:18:41.098 | DEBUG    | __main__:trials:24 - Trial = 27691/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.099 | DEBUG    | __main__:trials:29 - Trial = 27691/30000 | Total reward = 25.97
2022-01-26 14:18:41.102 | DEBUG    | __main__:trials:26 - Trial = 27692/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.104 | DEBUG    | __main__:trials:29 - Trial = 27692/30000 | Total reward = 16.76
2022-01-26 14:18:41.107 | DEBUG    | __main__:trials:24 - Trial = 27693/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.109 | DEBUG    | __main__:trials:29 - Trial = 27693/30000 | Total reward = 26.25
2022-01-26 14:18:41.112 | DEBUG    | __main__:trials:26 - Trial = 27694/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.113 | DEBUG    | __main__:trials:29 - Trial = 27694/30000 | Total reward = 13.69
2022-01-26 14:18:41.117 | DEBUG    | __main__:trials:26 - Trial = 27695/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.117 | DEBUG    | __main__:trials:29 - Trial = 27695/30000 | Total reward = 23.94
2022-01-26 14:18:41.119 | DEBUG    | __main__:trials:26 - Trial = 27696/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.120 | DEBUG    | __main__:trials:29 - Trial = 27696/30000 | Total reward = 8.08
2022-01-26 14:18:41.124 | DEBUG    | __main__:trials:24 - Trial = 27697/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.124 | DEBUG    | __main__:trials:29 - Trial = 27697/30000 | Total reward = 26.10
2022-01-26 14:18:41.128 | DEBUG    | __main__:trials:26 - Trial = 27698/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.130 | DEBUG    | __main__:trials:29 - Trial = 27698/30000 | Total reward = 11.10
2022-01-26 14:18:41.133 | DEBUG    | __main__:trials:24 - Trial = 27699/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.134 | DEBUG    | __main__:trials:29 - Trial = 27699/30000 | Total reward = 30.47
2022-01-26 14:18:41.138 | DEBUG    | __main__:trials:26 - Trial = 27700/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.140 | DEBUG    | __main__:trials:29 - Trial = 27700/30000 | Total reward = 21.27
2022-01-26 14:18:41.144 | DEBUG    | __main__:trials:24 - Trial = 27701/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.144 | DEBUG    | __main__:trials:29 - Trial = 27701/30000 | Total reward = 20.63
2022-01-26 14:18:41.149 | DEBUG    | __main__:trials:24 - Trial = 27702/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.149 | DEBUG    | __main__:trials:29 - Trial = 27702/30000 | Total reward = 42.65
2022-01-26 14:18:41.153 | DEBUG    | __main__:trials:24 - Trial = 27703/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.154 | DEBUG    | __main__:trials:29 - Trial = 27703/30000 | Total reward = 29.36
2022-01-26 14:18:41.157 | DEBUG    | __main__:trials:24 - Trial = 27704/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.158 | DEBUG    | __main__:trials:29 - Trial = 27704/30000 | Total reward = 21.00
2022-01-26 14:18:41.161 | DEBUG    | __main__:trials:24 - Trial = 27705/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.162 | DEBUG    | __main__:trials:29 - Trial = 27705/30000 | Total reward = 32.80
2022-01-26 14:18:41.165 | DEBUG    | __main__:trials:24 - Trial = 27706/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.167 | DEBUG    | __main__:trials:29 - Trial = 27706/30000 | Total reward = 38.34
2022-01-26 14:18:41.170 | DEBUG    | __main__:trials:24 - Trial = 27707/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.171 | DEBUG    | __main__:trials:29 - Trial = 27707/30000 | Total reward = 36.99
2022-01-26 14:18:41.174 | DEBUG    | __main__:trials:24 - Trial = 27708/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.176 | DEBUG    | __main__:trials:29 - Trial = 27708/30000 | Total reward = 35.19
2022-01-26 14:18:41.179 | DEBUG    | __main__:trials:24 - Trial = 27709/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.182 | DEBUG    | __main__:trials:29 - Trial = 27709/30000 | Total reward = 27.11
2022-01-26 14:18:41.184 | DEBUG    | __main__:trials:24 - Trial = 27710/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.186 | DEBUG    | __main__:trials:29 - Trial = 27710/30000 | Total reward = 32.37
2022-01-26 14:18:41.189 | DEBUG    | __main__:trials:24 - Trial = 27711/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.191 | DEBUG    | __main__:trials:29 - Trial = 27711/30000 | Total reward = 34.59
2022-01-26 14:18:41.194 | DEBUG    | __main__:trials:24 - Trial = 27712/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.195 | DEBUG    | __main__:trials:29 - Trial = 27712/30000 | Total reward = 37.86
2022-01-26 14:18:41.198 | DEBUG    | __main__:trials:24 - Trial = 27713/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.200 | DEBUG    | __main__:trials:29 - Trial = 27713/30000 | Total reward = 33.32
2022-01-26 14:18:41.203 | DEBUG    | __main__:trials:24 - Trial = 27714/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.204 | DEBUG    | __main__:trials:29 - Trial = 27714/30000 | Total reward = 37.21
2022-01-26 14:18:41.208 | DEBUG    | __main__:trials:24 - Trial = 27715/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.209 | DEBUG    | __main__:trials:29 - Trial = 27715/30000 | Total reward = 35.21
2022-01-26 14:18:41.213 | DEBUG    | __main__:trials:24 - Trial = 27716/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.213 | DEBUG    | __main__:trials:29 - Trial = 27716/30000 | Total reward = 26.12
2022-01-26 14:18:41.217 | DEBUG    | __main__:trials:24 - Trial = 27717/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.217 | DEBUG    | __main__:trials:29 - Trial = 27717/30000 | Total reward = 17.63
2022-01-26 14:18:41.221 | DEBUG    | __main__:trials:24 - Trial = 27718/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.221 | DEBUG    | __main__:trials:29 - Trial = 27718/30000 | Total reward = 37.52
2022-01-26 14:18:41.224 | DEBUG    | __main__:trials:26 - Trial = 27719/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.226 | DEBUG    | __main__:trials:29 - Trial = 27719/30000 | Total reward = 11.68
2022-01-26 14:18:41.228 | DEBUG    | __main__:trials:26 - Trial = 27720/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.229 | DEBUG    | __main__:trials:29 - Trial = 27720/30000 | Total reward = 9.01
2022-01-26 14:18:41.232 | DEBUG    | __main__:trials:24 - Trial = 27721/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.233 | DEBUG    | __main__:trials:29 - Trial = 27721/30000 | Total reward = 34.78
2022-01-26 14:18:41.236 | DEBUG    | __main__:trials:24 - Trial = 27722/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.237 | DEBUG    | __main__:trials:29 - Trial = 27722/30000 | Total reward = 51.74
2022-01-26 14:18:41.240 | DEBUG    | __main__:trials:26 - Trial = 27723/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.241 | DEBUG    | __main__:trials:29 - Trial = 27723/30000 | Total reward = 21.21
2022-01-26 14:18:41.245 | DEBUG    | __main__:trials:24 - Trial = 27724/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.247 | DEBUG    | __main__:trials:29 - Trial = 27724/30000 | Total reward = 34.09
2022-01-26 14:18:41.249 | DEBUG    | __main__:trials:26 - Trial = 27725/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.250 | DEBUG    | __main__:trials:29 - Trial = 27725/30000 | Total reward = 16.57
2022-01-26 14:18:41.252 | DEBUG    | __main__:trials:26 - Trial = 27726/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.252 | DEBUG    | __main__:trials:29 - Trial = 27726/30000 | Total reward = 9.35
2022-01-26 14:18:41.256 | DEBUG    | __main__:trials:26 - Trial = 27727/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.257 | DEBUG    | __main__:trials:29 - Trial = 27727/30000 | Total reward = 21.54
2022-01-26 14:18:41.260 | DEBUG    | __main__:trials:26 - Trial = 27728/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.261 | DEBUG    | __main__:trials:29 - Trial = 27728/30000 | Total reward = 11.71
2022-01-26 14:18:41.263 | DEBUG    | __main__:trials:26 - Trial = 27729/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.264 | DEBUG    | __main__:trials:29 - Trial = 27729/30000 | Total reward = 12.01
2022-01-26 14:18:41.266 | DEBUG    | __main__:trials:26 - Trial = 27730/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.267 | DEBUG    | __main__:trials:29 - Trial = 27730/30000 | Total reward = 19.99
2022-01-26 14:18:41.270 | DEBUG    | __main__:trials:24 - Trial = 27731/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.271 | DEBUG    | __main__:trials:29 - Trial = 27731/30000 | Total reward = 24.42
2022-01-26 14:18:41.274 | DEBUG    | __main__:trials:26 - Trial = 27732/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.275 | DEBUG    | __main__:trials:29 - Trial = 27732/30000 | Total reward = 19.96
2022-01-26 14:18:41.278 | DEBUG    | __main__:trials:24 - Trial = 27733/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.280 | DEBUG    | __main__:trials:29 - Trial = 27733/30000 | Total reward = 41.02
2022-01-26 14:18:41.283 | DEBUG    | __main__:trials:26 - Trial = 27734/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.285 | DEBUG    | __main__:trials:29 - Trial = 27734/30000 | Total reward = 12.95
2022-01-26 14:18:41.288 | DEBUG    | __main__:trials:24 - Trial = 27735/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.290 | DEBUG    | __main__:trials:29 - Trial = 27735/30000 | Total reward = 29.14
2022-01-26 14:18:41.293 | DEBUG    | __main__:trials:26 - Trial = 27736/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.294 | DEBUG    | __main__:trials:29 - Trial = 27736/30000 | Total reward = 17.86
2022-01-26 14:18:41.296 | DEBUG    | __main__:trials:26 - Trial = 27737/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.297 | DEBUG    | __main__:trials:29 - Trial = 27737/30000 | Total reward = 15.42
2022-01-26 14:18:41.300 | DEBUG    | __main__:trials:26 - Trial = 27738/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.302 | DEBUG    | __main__:trials:29 - Trial = 27738/30000 | Total reward = 7.63
2022-01-26 14:18:41.305 | DEBUG    | __main__:trials:26 - Trial = 27739/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.307 | DEBUG    | __main__:trials:29 - Trial = 27739/30000 | Total reward = 18.62
2022-01-26 14:18:41.311 | DEBUG    | __main__:trials:24 - Trial = 27740/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.312 | DEBUG    | __main__:trials:29 - Trial = 27740/30000 | Total reward = 25.61
2022-01-26 14:18:41.315 | DEBUG    | __main__:trials:26 - Trial = 27741/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.316 | DEBUG    | __main__:trials:29 - Trial = 27741/30000 | Total reward = 13.54
2022-01-26 14:18:41.320 | DEBUG    | __main__:trials:24 - Trial = 27742/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.321 | DEBUG    | __main__:trials:29 - Trial = 27742/30000 | Total reward = 34.64
2022-01-26 14:18:41.324 | DEBUG    | __main__:trials:24 - Trial = 27743/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.326 | DEBUG    | __main__:trials:29 - Trial = 27743/30000 | Total reward = 26.56
2022-01-26 14:18:41.328 | DEBUG    | __main__:trials:26 - Trial = 27744/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.330 | DEBUG    | __main__:trials:29 - Trial = 27744/30000 | Total reward = 13.29
2022-01-26 14:18:41.334 | DEBUG    | __main__:trials:26 - Trial = 27745/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.335 | DEBUG    | __main__:trials:29 - Trial = 27745/30000 | Total reward = 23.04
2022-01-26 14:18:41.338 | DEBUG    | __main__:trials:26 - Trial = 27746/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.339 | DEBUG    | __main__:trials:29 - Trial = 27746/30000 | Total reward = 13.29
2022-01-26 14:18:41.342 | DEBUG    | __main__:trials:26 - Trial = 27747/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.344 | DEBUG    | __main__:trials:29 - Trial = 27747/30000 | Total reward = 19.81
2022-01-26 14:18:41.348 | DEBUG    | __main__:trials:24 - Trial = 27748/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.349 | DEBUG    | __main__:trials:29 - Trial = 27748/30000 | Total reward = 27.86
2022-01-26 14:18:41.352 | DEBUG    | __main__:trials:24 - Trial = 27749/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.354 | DEBUG    | __main__:trials:29 - Trial = 27749/30000 | Total reward = 27.96
2022-01-26 14:18:41.356 | DEBUG    | __main__:trials:26 - Trial = 27750/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.358 | DEBUG    | __main__:trials:29 - Trial = 27750/30000 | Total reward = 10.75
2022-01-26 14:18:41.362 | DEBUG    | __main__:trials:24 - Trial = 27751/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.363 | DEBUG    | __main__:trials:29 - Trial = 27751/30000 | Total reward = 30.57
2022-01-26 14:18:41.366 | DEBUG    | __main__:trials:26 - Trial = 27752/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.368 | DEBUG    | __main__:trials:29 - Trial = 27752/30000 | Total reward = 18.63
2022-01-26 14:18:41.372 | DEBUG    | __main__:trials:24 - Trial = 27753/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.373 | DEBUG    | __main__:trials:29 - Trial = 27753/30000 | Total reward = 36.40
2022-01-26 14:18:41.377 | DEBUG    | __main__:trials:26 - Trial = 27754/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.378 | DEBUG    | __main__:trials:29 - Trial = 27754/30000 | Total reward = 16.63
2022-01-26 14:18:41.381 | DEBUG    | __main__:trials:26 - Trial = 27755/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.383 | DEBUG    | __main__:trials:29 - Trial = 27755/30000 | Total reward = 15.33
2022-01-26 14:18:41.386 | DEBUG    | __main__:trials:24 - Trial = 27756/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.388 | DEBUG    | __main__:trials:29 - Trial = 27756/30000 | Total reward = 25.64
2022-01-26 14:18:41.391 | DEBUG    | __main__:trials:24 - Trial = 27757/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.393 | DEBUG    | __main__:trials:29 - Trial = 27757/30000 | Total reward = 23.91
2022-01-26 14:18:41.397 | DEBUG    | __main__:trials:26 - Trial = 27758/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.398 | DEBUG    | __main__:trials:29 - Trial = 27758/30000 | Total reward = 19.38
2022-01-26 14:18:41.402 | DEBUG    | __main__:trials:24 - Trial = 27759/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.403 | DEBUG    | __main__:trials:29 - Trial = 27759/30000 | Total reward = 23.09
2022-01-26 14:18:41.407 | DEBUG    | __main__:trials:24 - Trial = 27760/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.409 | DEBUG    | __main__:trials:29 - Trial = 27760/30000 | Total reward = 29.38
2022-01-26 14:18:41.412 | DEBUG    | __main__:trials:26 - Trial = 27761/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.413 | DEBUG    | __main__:trials:29 - Trial = 27761/30000 | Total reward = 14.24
2022-01-26 14:18:41.417 | DEBUG    | __main__:trials:24 - Trial = 27762/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.418 | DEBUG    | __main__:trials:29 - Trial = 27762/30000 | Total reward = 25.05
2022-01-26 14:18:41.422 | DEBUG    | __main__:trials:24 - Trial = 27763/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.424 | DEBUG    | __main__:trials:29 - Trial = 27763/30000 | Total reward = 32.50
2022-01-26 14:18:41.428 | DEBUG    | __main__:trials:24 - Trial = 27764/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.429 | DEBUG    | __main__:trials:29 - Trial = 27764/30000 | Total reward = 27.36
2022-01-26 14:18:41.432 | DEBUG    | __main__:trials:24 - Trial = 27765/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.434 | DEBUG    | __main__:trials:29 - Trial = 27765/30000 | Total reward = 27.69
2022-01-26 14:18:41.438 | DEBUG    | __main__:trials:24 - Trial = 27766/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.439 | DEBUG    | __main__:trials:29 - Trial = 27766/30000 | Total reward = 27.66
2022-01-26 14:18:41.442 | DEBUG    | __main__:trials:24 - Trial = 27767/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.444 | DEBUG    | __main__:trials:29 - Trial = 27767/30000 | Total reward = 31.55
2022-01-26 14:18:41.447 | DEBUG    | __main__:trials:24 - Trial = 27768/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.449 | DEBUG    | __main__:trials:29 - Trial = 27768/30000 | Total reward = 54.11
2022-01-26 14:18:41.452 | DEBUG    | __main__:trials:24 - Trial = 27769/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.454 | DEBUG    | __main__:trials:29 - Trial = 27769/30000 | Total reward = 33.71
2022-01-26 14:18:41.458 | DEBUG    | __main__:trials:24 - Trial = 27770/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.459 | DEBUG    | __main__:trials:29 - Trial = 27770/30000 | Total reward = 22.95
2022-01-26 14:18:41.462 | DEBUG    | __main__:trials:26 - Trial = 27771/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.464 | DEBUG    | __main__:trials:29 - Trial = 27771/30000 | Total reward = 12.60
2022-01-26 14:18:41.467 | DEBUG    | __main__:trials:24 - Trial = 27772/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.469 | DEBUG    | __main__:trials:29 - Trial = 27772/30000 | Total reward = 39.85
2022-01-26 14:18:41.472 | DEBUG    | __main__:trials:24 - Trial = 27773/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.474 | DEBUG    | __main__:trials:29 - Trial = 27773/30000 | Total reward = 35.29
2022-01-26 14:18:41.478 | DEBUG    | __main__:trials:24 - Trial = 27774/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.479 | DEBUG    | __main__:trials:29 - Trial = 27774/30000 | Total reward = 25.96
2022-01-26 14:18:41.483 | DEBUG    | __main__:trials:24 - Trial = 27775/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.483 | DEBUG    | __main__:trials:29 - Trial = 27775/30000 | Total reward = 23.15
2022-01-26 14:18:41.488 | DEBUG    | __main__:trials:24 - Trial = 27776/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.489 | DEBUG    | __main__:trials:29 - Trial = 27776/30000 | Total reward = 29.60
2022-01-26 14:18:41.492 | DEBUG    | __main__:trials:24 - Trial = 27777/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.494 | DEBUG    | __main__:trials:29 - Trial = 27777/30000 | Total reward = 26.73
2022-01-26 14:18:41.498 | DEBUG    | __main__:trials:24 - Trial = 27778/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.499 | DEBUG    | __main__:trials:29 - Trial = 27778/30000 | Total reward = 36.04
2022-01-26 14:18:41.502 | DEBUG    | __main__:trials:24 - Trial = 27779/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.504 | DEBUG    | __main__:trials:29 - Trial = 27779/30000 | Total reward = 36.17
2022-01-26 14:18:41.507 | DEBUG    | __main__:trials:24 - Trial = 27780/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.509 | DEBUG    | __main__:trials:29 - Trial = 27780/30000 | Total reward = 37.06
2022-01-26 14:18:41.512 | DEBUG    | __main__:trials:24 - Trial = 27781/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.514 | DEBUG    | __main__:trials:29 - Trial = 27781/30000 | Total reward = 35.44
2022-01-26 14:18:41.517 | DEBUG    | __main__:trials:24 - Trial = 27782/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.519 | DEBUG    | __main__:trials:29 - Trial = 27782/30000 | Total reward = 27.24
2022-01-26 14:18:41.523 | DEBUG    | __main__:trials:24 - Trial = 27783/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.524 | DEBUG    | __main__:trials:29 - Trial = 27783/30000 | Total reward = 25.01
2022-01-26 14:18:41.528 | DEBUG    | __main__:trials:24 - Trial = 27784/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.530 | DEBUG    | __main__:trials:29 - Trial = 27784/30000 | Total reward = 43.36
2022-01-26 14:18:41.533 | DEBUG    | __main__:trials:26 - Trial = 27785/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.534 | DEBUG    | __main__:trials:29 - Trial = 27785/30000 | Total reward = 15.41
2022-01-26 14:18:41.537 | DEBUG    | __main__:trials:24 - Trial = 27786/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.539 | DEBUG    | __main__:trials:29 - Trial = 27786/30000 | Total reward = 24.34
2022-01-26 14:18:41.543 | DEBUG    | __main__:trials:24 - Trial = 27787/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.544 | DEBUG    | __main__:trials:29 - Trial = 27787/30000 | Total reward = 33.18
2022-01-26 14:18:41.548 | DEBUG    | __main__:trials:24 - Trial = 27788/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.550 | DEBUG    | __main__:trials:29 - Trial = 27788/30000 | Total reward = 33.85
2022-01-26 14:18:41.553 | DEBUG    | __main__:trials:24 - Trial = 27789/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.555 | DEBUG    | __main__:trials:29 - Trial = 27789/30000 | Total reward = 41.62
2022-01-26 14:18:41.558 | DEBUG    | __main__:trials:24 - Trial = 27790/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.560 | DEBUG    | __main__:trials:29 - Trial = 27790/30000 | Total reward = 37.59
2022-01-26 14:18:41.564 | DEBUG    | __main__:trials:24 - Trial = 27791/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.565 | DEBUG    | __main__:trials:29 - Trial = 27791/30000 | Total reward = 36.04
2022-01-26 14:18:41.569 | DEBUG    | __main__:trials:24 - Trial = 27792/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.570 | DEBUG    | __main__:trials:29 - Trial = 27792/30000 | Total reward = 26.38
2022-01-26 14:18:41.574 | DEBUG    | __main__:trials:24 - Trial = 27793/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.575 | DEBUG    | __main__:trials:29 - Trial = 27793/30000 | Total reward = 28.20
2022-01-26 14:18:41.579 | DEBUG    | __main__:trials:24 - Trial = 27794/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.581 | DEBUG    | __main__:trials:29 - Trial = 27794/30000 | Total reward = 46.40
2022-01-26 14:18:41.584 | DEBUG    | __main__:trials:26 - Trial = 27795/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.585 | DEBUG    | __main__:trials:29 - Trial = 27795/30000 | Total reward = 13.35
2022-01-26 14:18:41.588 | DEBUG    | __main__:trials:24 - Trial = 27796/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.590 | DEBUG    | __main__:trials:29 - Trial = 27796/30000 | Total reward = 36.09
2022-01-26 14:18:41.594 | DEBUG    | __main__:trials:24 - Trial = 27797/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.595 | DEBUG    | __main__:trials:29 - Trial = 27797/30000 | Total reward = 27.41
2022-01-26 14:18:41.599 | DEBUG    | __main__:trials:24 - Trial = 27798/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.601 | DEBUG    | __main__:trials:29 - Trial = 27798/30000 | Total reward = 30.77
2022-01-26 14:18:41.604 | DEBUG    | __main__:trials:24 - Trial = 27799/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.606 | DEBUG    | __main__:trials:29 - Trial = 27799/30000 | Total reward = 31.35
2022-01-26 14:18:41.610 | DEBUG    | __main__:trials:24 - Trial = 27800/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.611 | DEBUG    | __main__:trials:29 - Trial = 27800/30000 | Total reward = 27.71
2022-01-26 14:18:41.615 | DEBUG    | __main__:trials:24 - Trial = 27801/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.616 | DEBUG    | __main__:trials:29 - Trial = 27801/30000 | Total reward = 36.27
2022-01-26 14:18:41.620 | DEBUG    | __main__:trials:24 - Trial = 27802/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.622 | DEBUG    | __main__:trials:29 - Trial = 27802/30000 | Total reward = 38.93
2022-01-26 14:18:41.625 | DEBUG    | __main__:trials:26 - Trial = 27803/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.627 | DEBUG    | __main__:trials:29 - Trial = 27803/30000 | Total reward = 11.90
2022-01-26 14:18:41.630 | DEBUG    | __main__:trials:24 - Trial = 27804/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.632 | DEBUG    | __main__:trials:29 - Trial = 27804/30000 | Total reward = 26.10
2022-01-26 14:18:41.635 | DEBUG    | __main__:trials:26 - Trial = 27805/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.636 | DEBUG    | __main__:trials:29 - Trial = 27805/30000 | Total reward = 13.29
2022-01-26 14:18:41.638 | DEBUG    | __main__:trials:26 - Trial = 27806/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.640 | DEBUG    | __main__:trials:29 - Trial = 27806/30000 | Total reward = 12.17
2022-01-26 14:18:41.643 | DEBUG    | __main__:trials:24 - Trial = 27807/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.645 | DEBUG    | __main__:trials:29 - Trial = 27807/30000 | Total reward = 28.68
2022-01-26 14:18:41.649 | DEBUG    | __main__:trials:24 - Trial = 27808/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.651 | DEBUG    | __main__:trials:29 - Trial = 27808/30000 | Total reward = 25.48
2022-01-26 14:18:41.655 | DEBUG    | __main__:trials:24 - Trial = 27809/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.657 | DEBUG    | __main__:trials:29 - Trial = 27809/30000 | Total reward = 23.15
2022-01-26 14:18:41.659 | DEBUG    | __main__:trials:26 - Trial = 27810/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.660 | DEBUG    | __main__:trials:29 - Trial = 27810/30000 | Total reward = 13.29
2022-01-26 14:18:41.663 | DEBUG    | __main__:trials:26 - Trial = 27811/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.665 | DEBUG    | __main__:trials:29 - Trial = 27811/30000 | Total reward = 13.29
2022-01-26 14:18:41.668 | DEBUG    | __main__:trials:24 - Trial = 27812/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.670 | DEBUG    | __main__:trials:29 - Trial = 27812/30000 | Total reward = 36.41
2022-01-26 14:18:41.673 | DEBUG    | __main__:trials:24 - Trial = 27813/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.675 | DEBUG    | __main__:trials:29 - Trial = 27813/30000 | Total reward = 17.46
2022-01-26 14:18:41.679 | DEBUG    | __main__:trials:24 - Trial = 27814/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.680 | DEBUG    | __main__:trials:29 - Trial = 27814/30000 | Total reward = 46.11
2022-01-26 14:18:41.684 | DEBUG    | __main__:trials:24 - Trial = 27815/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.685 | DEBUG    | __main__:trials:29 - Trial = 27815/30000 | Total reward = 42.17
2022-01-26 14:18:41.688 | DEBUG    | __main__:trials:24 - Trial = 27816/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.690 | DEBUG    | __main__:trials:29 - Trial = 27816/30000 | Total reward = 26.84
2022-01-26 14:18:41.694 | DEBUG    | __main__:trials:24 - Trial = 27817/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.694 | DEBUG    | __main__:trials:29 - Trial = 27817/30000 | Total reward = 46.56
2022-01-26 14:18:41.698 | DEBUG    | __main__:trials:26 - Trial = 27818/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.700 | DEBUG    | __main__:trials:29 - Trial = 27818/30000 | Total reward = 16.77
2022-01-26 14:18:41.702 | DEBUG    | __main__:trials:26 - Trial = 27819/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.704 | DEBUG    | __main__:trials:29 - Trial = 27819/30000 | Total reward = 13.29
2022-01-26 14:18:41.707 | DEBUG    | __main__:trials:24 - Trial = 27820/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.708 | DEBUG    | __main__:trials:29 - Trial = 27820/30000 | Total reward = 47.15
2022-01-26 14:18:41.712 | DEBUG    | __main__:trials:24 - Trial = 27821/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.714 | DEBUG    | __main__:trials:29 - Trial = 27821/30000 | Total reward = 22.60
2022-01-26 14:18:41.717 | DEBUG    | __main__:trials:26 - Trial = 27822/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.718 | DEBUG    | __main__:trials:29 - Trial = 27822/30000 | Total reward = 15.71
2022-01-26 14:18:41.721 | DEBUG    | __main__:trials:26 - Trial = 27823/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.723 | DEBUG    | __main__:trials:29 - Trial = 27823/30000 | Total reward = 18.33
2022-01-26 14:18:41.727 | DEBUG    | __main__:trials:24 - Trial = 27824/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.728 | DEBUG    | __main__:trials:29 - Trial = 27824/30000 | Total reward = 27.39
2022-01-26 14:18:41.732 | DEBUG    | __main__:trials:24 - Trial = 27825/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.734 | DEBUG    | __main__:trials:29 - Trial = 27825/30000 | Total reward = 35.42
2022-01-26 14:18:41.737 | DEBUG    | __main__:trials:24 - Trial = 27826/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.739 | DEBUG    | __main__:trials:29 - Trial = 27826/30000 | Total reward = 35.45
2022-01-26 14:18:41.743 | DEBUG    | __main__:trials:24 - Trial = 27827/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.744 | DEBUG    | __main__:trials:29 - Trial = 27827/30000 | Total reward = 42.55
2022-01-26 14:18:41.748 | DEBUG    | __main__:trials:24 - Trial = 27828/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.750 | DEBUG    | __main__:trials:29 - Trial = 27828/30000 | Total reward = 30.16
2022-01-26 14:18:41.753 | DEBUG    | __main__:trials:24 - Trial = 27829/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.755 | DEBUG    | __main__:trials:29 - Trial = 27829/30000 | Total reward = 27.33
2022-01-26 14:18:41.759 | DEBUG    | __main__:trials:24 - Trial = 27830/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.760 | DEBUG    | __main__:trials:29 - Trial = 27830/30000 | Total reward = 58.38
2022-01-26 14:18:41.762 | DEBUG    | __main__:trials:26 - Trial = 27831/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.764 | DEBUG    | __main__:trials:29 - Trial = 27831/30000 | Total reward = 15.57
2022-01-26 14:18:41.768 | DEBUG    | __main__:trials:24 - Trial = 27832/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.770 | DEBUG    | __main__:trials:29 - Trial = 27832/30000 | Total reward = 30.51
2022-01-26 14:18:41.772 | DEBUG    | __main__:trials:26 - Trial = 27833/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.774 | DEBUG    | __main__:trials:29 - Trial = 27833/30000 | Total reward = 13.83
2022-01-26 14:18:41.778 | DEBUG    | __main__:trials:24 - Trial = 27834/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.779 | DEBUG    | __main__:trials:29 - Trial = 27834/30000 | Total reward = 39.23
2022-01-26 14:18:41.783 | DEBUG    | __main__:trials:24 - Trial = 27835/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.785 | DEBUG    | __main__:trials:29 - Trial = 27835/30000 | Total reward = 20.45
2022-01-26 14:18:41.789 | DEBUG    | __main__:trials:24 - Trial = 27836/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.790 | DEBUG    | __main__:trials:29 - Trial = 27836/30000 | Total reward = 28.06
2022-01-26 14:18:41.793 | DEBUG    | __main__:trials:24 - Trial = 27837/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.793 | DEBUG    | __main__:trials:29 - Trial = 27837/30000 | Total reward = 35.98
2022-01-26 14:18:41.798 | DEBUG    | __main__:trials:24 - Trial = 27838/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.799 | DEBUG    | __main__:trials:29 - Trial = 27838/30000 | Total reward = 29.27
2022-01-26 14:18:41.801 | DEBUG    | __main__:trials:26 - Trial = 27839/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.803 | DEBUG    | __main__:trials:29 - Trial = 27839/30000 | Total reward = 11.11
2022-01-26 14:18:41.807 | DEBUG    | __main__:trials:24 - Trial = 27840/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.808 | DEBUG    | __main__:trials:29 - Trial = 27840/30000 | Total reward = 35.35
2022-01-26 14:18:41.812 | DEBUG    | __main__:trials:24 - Trial = 27841/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.814 | DEBUG    | __main__:trials:29 - Trial = 27841/30000 | Total reward = 36.41
2022-01-26 14:18:41.817 | DEBUG    | __main__:trials:26 - Trial = 27842/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.817 | DEBUG    | __main__:trials:29 - Trial = 27842/30000 | Total reward = 16.57
2022-01-26 14:18:41.820 | DEBUG    | __main__:trials:26 - Trial = 27843/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.821 | DEBUG    | __main__:trials:29 - Trial = 27843/30000 | Total reward = 14.45
2022-01-26 14:18:41.824 | DEBUG    | __main__:trials:24 - Trial = 27844/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.825 | DEBUG    | __main__:trials:29 - Trial = 27844/30000 | Total reward = 26.92
2022-01-26 14:18:41.828 | DEBUG    | __main__:trials:24 - Trial = 27845/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.830 | DEBUG    | __main__:trials:29 - Trial = 27845/30000 | Total reward = 35.08
2022-01-26 14:18:41.834 | DEBUG    | __main__:trials:24 - Trial = 27846/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.834 | DEBUG    | __main__:trials:29 - Trial = 27846/30000 | Total reward = 22.52
2022-01-26 14:18:41.838 | DEBUG    | __main__:trials:24 - Trial = 27847/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.840 | DEBUG    | __main__:trials:29 - Trial = 27847/30000 | Total reward = 23.72
2022-01-26 14:18:41.843 | DEBUG    | __main__:trials:24 - Trial = 27848/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.845 | DEBUG    | __main__:trials:29 - Trial = 27848/30000 | Total reward = 27.22
2022-01-26 14:18:41.848 | DEBUG    | __main__:trials:24 - Trial = 27849/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.849 | DEBUG    | __main__:trials:29 - Trial = 27849/30000 | Total reward = 29.92
2022-01-26 14:18:41.853 | DEBUG    | __main__:trials:24 - Trial = 27850/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.855 | DEBUG    | __main__:trials:29 - Trial = 27850/30000 | Total reward = 24.70
2022-01-26 14:18:41.858 | DEBUG    | __main__:trials:24 - Trial = 27851/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.859 | DEBUG    | __main__:trials:29 - Trial = 27851/30000 | Total reward = 26.54
2022-01-26 14:18:41.863 | DEBUG    | __main__:trials:24 - Trial = 27852/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.865 | DEBUG    | __main__:trials:29 - Trial = 27852/30000 | Total reward = 27.77
2022-01-26 14:18:41.869 | DEBUG    | __main__:trials:24 - Trial = 27853/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.869 | DEBUG    | __main__:trials:29 - Trial = 27853/30000 | Total reward = 37.87
2022-01-26 14:18:41.872 | DEBUG    | __main__:trials:24 - Trial = 27854/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.874 | DEBUG    | __main__:trials:29 - Trial = 27854/30000 | Total reward = 35.35
2022-01-26 14:18:41.878 | DEBUG    | __main__:trials:24 - Trial = 27855/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.879 | DEBUG    | __main__:trials:29 - Trial = 27855/30000 | Total reward = 31.59
2022-01-26 14:18:41.882 | DEBUG    | __main__:trials:24 - Trial = 27856/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.884 | DEBUG    | __main__:trials:29 - Trial = 27856/30000 | Total reward = 42.64
2022-01-26 14:18:41.888 | DEBUG    | __main__:trials:24 - Trial = 27857/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.889 | DEBUG    | __main__:trials:29 - Trial = 27857/30000 | Total reward = 32.35
2022-01-26 14:18:41.892 | DEBUG    | __main__:trials:26 - Trial = 27858/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.893 | DEBUG    | __main__:trials:29 - Trial = 27858/30000 | Total reward = 11.13
2022-01-26 14:18:41.896 | DEBUG    | __main__:trials:26 - Trial = 27859/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.898 | DEBUG    | __main__:trials:29 - Trial = 27859/30000 | Total reward = 13.22
2022-01-26 14:18:41.901 | DEBUG    | __main__:trials:24 - Trial = 27860/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.902 | DEBUG    | __main__:trials:29 - Trial = 27860/30000 | Total reward = 37.07
2022-01-26 14:18:41.905 | DEBUG    | __main__:trials:26 - Trial = 27861/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.906 | DEBUG    | __main__:trials:29 - Trial = 27861/30000 | Total reward = 36.88
2022-01-26 14:18:41.908 | DEBUG    | __main__:trials:26 - Trial = 27862/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.910 | DEBUG    | __main__:trials:29 - Trial = 27862/30000 | Total reward = 9.57
2022-01-26 14:18:41.914 | DEBUG    | __main__:trials:24 - Trial = 27863/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.915 | DEBUG    | __main__:trials:29 - Trial = 27863/30000 | Total reward = 49.58
2022-01-26 14:18:41.919 | DEBUG    | __main__:trials:26 - Trial = 27864/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.921 | DEBUG    | __main__:trials:29 - Trial = 27864/30000 | Total reward = 30.13
2022-01-26 14:18:41.923 | DEBUG    | __main__:trials:26 - Trial = 27865/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.925 | DEBUG    | __main__:trials:29 - Trial = 27865/30000 | Total reward = 19.15
2022-01-26 14:18:41.928 | DEBUG    | __main__:trials:24 - Trial = 27866/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.929 | DEBUG    | __main__:trials:29 - Trial = 27866/30000 | Total reward = 25.82
2022-01-26 14:18:41.933 | DEBUG    | __main__:trials:26 - Trial = 27867/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.934 | DEBUG    | __main__:trials:29 - Trial = 27867/30000 | Total reward = 16.09
2022-01-26 14:18:41.937 | DEBUG    | __main__:trials:26 - Trial = 27868/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.940 | DEBUG    | __main__:trials:29 - Trial = 27868/30000 | Total reward = 16.36
2022-01-26 14:18:41.944 | DEBUG    | __main__:trials:24 - Trial = 27869/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.946 | DEBUG    | __main__:trials:29 - Trial = 27869/30000 | Total reward = 26.20
2022-01-26 14:18:41.949 | DEBUG    | __main__:trials:24 - Trial = 27870/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.951 | DEBUG    | __main__:trials:29 - Trial = 27870/30000 | Total reward = 50.25
2022-01-26 14:18:41.954 | DEBUG    | __main__:trials:24 - Trial = 27871/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.955 | DEBUG    | __main__:trials:29 - Trial = 27871/30000 | Total reward = 25.78
2022-01-26 14:18:41.959 | DEBUG    | __main__:trials:24 - Trial = 27872/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.961 | DEBUG    | __main__:trials:29 - Trial = 27872/30000 | Total reward = 33.94
2022-01-26 14:18:41.964 | DEBUG    | __main__:trials:26 - Trial = 27873/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:41.965 | DEBUG    | __main__:trials:29 - Trial = 27873/30000 | Total reward = 17.12
2022-01-26 14:18:41.968 | DEBUG    | __main__:trials:24 - Trial = 27874/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.970 | DEBUG    | __main__:trials:29 - Trial = 27874/30000 | Total reward = 27.51
2022-01-26 14:18:41.973 | DEBUG    | __main__:trials:24 - Trial = 27875/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.975 | DEBUG    | __main__:trials:29 - Trial = 27875/30000 | Total reward = 26.26
2022-01-26 14:18:41.978 | DEBUG    | __main__:trials:24 - Trial = 27876/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.979 | DEBUG    | __main__:trials:29 - Trial = 27876/30000 | Total reward = 22.56
2022-01-26 14:18:41.982 | DEBUG    | __main__:trials:24 - Trial = 27877/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.983 | DEBUG    | __main__:trials:29 - Trial = 27877/30000 | Total reward = 37.74
2022-01-26 14:18:41.987 | DEBUG    | __main__:trials:24 - Trial = 27878/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.989 | DEBUG    | __main__:trials:29 - Trial = 27878/30000 | Total reward = 37.85
2022-01-26 14:18:41.992 | DEBUG    | __main__:trials:24 - Trial = 27879/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.994 | DEBUG    | __main__:trials:29 - Trial = 27879/30000 | Total reward = 38.30
2022-01-26 14:18:41.997 | DEBUG    | __main__:trials:24 - Trial = 27880/30000 | Max number of steps (20) reached
2022-01-26 14:18:41.998 | DEBUG    | __main__:trials:29 - Trial = 27880/30000 | Total reward = 26.33
2022-01-26 14:18:42.002 | DEBUG    | __main__:trials:24 - Trial = 27881/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.003 | DEBUG    | __main__:trials:29 - Trial = 27881/30000 | Total reward = 43.30
2022-01-26 14:18:42.007 | DEBUG    | __main__:trials:24 - Trial = 27882/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.008 | DEBUG    | __main__:trials:29 - Trial = 27882/30000 | Total reward = 31.10
2022-01-26 14:18:42.012 | DEBUG    | __main__:trials:24 - Trial = 27883/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.014 | DEBUG    | __main__:trials:29 - Trial = 27883/30000 | Total reward = 38.22
2022-01-26 14:18:42.017 | DEBUG    | __main__:trials:24 - Trial = 27884/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.019 | DEBUG    | __main__:trials:29 - Trial = 27884/30000 | Total reward = 37.48
2022-01-26 14:18:42.022 | DEBUG    | __main__:trials:24 - Trial = 27885/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.024 | DEBUG    | __main__:trials:29 - Trial = 27885/30000 | Total reward = 26.00
2022-01-26 14:18:42.027 | DEBUG    | __main__:trials:24 - Trial = 27886/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.029 | DEBUG    | __main__:trials:29 - Trial = 27886/30000 | Total reward = 29.00
2022-01-26 14:18:42.032 | DEBUG    | __main__:trials:24 - Trial = 27887/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.034 | DEBUG    | __main__:trials:29 - Trial = 27887/30000 | Total reward = 48.43
2022-01-26 14:18:42.038 | DEBUG    | __main__:trials:24 - Trial = 27888/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.038 | DEBUG    | __main__:trials:29 - Trial = 27888/30000 | Total reward = 37.45
2022-01-26 14:18:42.042 | DEBUG    | __main__:trials:24 - Trial = 27889/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.044 | DEBUG    | __main__:trials:29 - Trial = 27889/30000 | Total reward = 36.23
2022-01-26 14:18:42.048 | DEBUG    | __main__:trials:24 - Trial = 27890/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.049 | DEBUG    | __main__:trials:29 - Trial = 27890/30000 | Total reward = 35.10
2022-01-26 14:18:42.053 | DEBUG    | __main__:trials:24 - Trial = 27891/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.055 | DEBUG    | __main__:trials:29 - Trial = 27891/30000 | Total reward = 30.34
2022-01-26 14:18:42.058 | DEBUG    | __main__:trials:24 - Trial = 27892/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.060 | DEBUG    | __main__:trials:29 - Trial = 27892/30000 | Total reward = 37.62
2022-01-26 14:18:42.063 | DEBUG    | __main__:trials:24 - Trial = 27893/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.065 | DEBUG    | __main__:trials:29 - Trial = 27893/30000 | Total reward = 48.38
2022-01-26 14:18:42.068 | DEBUG    | __main__:trials:24 - Trial = 27894/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.069 | DEBUG    | __main__:trials:29 - Trial = 27894/30000 | Total reward = 42.11
2022-01-26 14:18:42.072 | DEBUG    | __main__:trials:24 - Trial = 27895/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.073 | DEBUG    | __main__:trials:29 - Trial = 27895/30000 | Total reward = 40.10
2022-01-26 14:18:42.077 | DEBUG    | __main__:trials:24 - Trial = 27896/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.079 | DEBUG    | __main__:trials:29 - Trial = 27896/30000 | Total reward = 40.06
2022-01-26 14:18:42.082 | DEBUG    | __main__:trials:24 - Trial = 27897/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.084 | DEBUG    | __main__:trials:29 - Trial = 27897/30000 | Total reward = 41.90
2022-01-26 14:18:42.088 | DEBUG    | __main__:trials:24 - Trial = 27898/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.089 | DEBUG    | __main__:trials:29 - Trial = 27898/30000 | Total reward = 24.12
2022-01-26 14:18:42.093 | DEBUG    | __main__:trials:24 - Trial = 27899/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.094 | DEBUG    | __main__:trials:29 - Trial = 27899/30000 | Total reward = 46.12
2022-01-26 14:18:42.098 | DEBUG    | __main__:trials:24 - Trial = 27900/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.100 | DEBUG    | __main__:trials:29 - Trial = 27900/30000 | Total reward = 23.68
2022-01-26 14:18:42.104 | DEBUG    | __main__:trials:24 - Trial = 27901/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.105 | DEBUG    | __main__:trials:29 - Trial = 27901/30000 | Total reward = 39.75
2022-01-26 14:18:42.109 | DEBUG    | __main__:trials:24 - Trial = 27902/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.110 | DEBUG    | __main__:trials:29 - Trial = 27902/30000 | Total reward = 36.71
2022-01-26 14:18:42.114 | DEBUG    | __main__:trials:24 - Trial = 27903/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.116 | DEBUG    | __main__:trials:29 - Trial = 27903/30000 | Total reward = 54.66
2022-01-26 14:18:42.120 | DEBUG    | __main__:trials:24 - Trial = 27904/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.121 | DEBUG    | __main__:trials:29 - Trial = 27904/30000 | Total reward = 35.40
2022-01-26 14:18:42.125 | DEBUG    | __main__:trials:24 - Trial = 27905/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.127 | DEBUG    | __main__:trials:29 - Trial = 27905/30000 | Total reward = 46.63
2022-01-26 14:18:42.130 | DEBUG    | __main__:trials:24 - Trial = 27906/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.132 | DEBUG    | __main__:trials:29 - Trial = 27906/30000 | Total reward = 32.31
2022-01-26 14:18:42.136 | DEBUG    | __main__:trials:24 - Trial = 27907/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.137 | DEBUG    | __main__:trials:29 - Trial = 27907/30000 | Total reward = 38.41
2022-01-26 14:18:42.140 | DEBUG    | __main__:trials:24 - Trial = 27908/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.141 | DEBUG    | __main__:trials:29 - Trial = 27908/30000 | Total reward = 30.97
2022-01-26 14:18:42.145 | DEBUG    | __main__:trials:24 - Trial = 27909/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.147 | DEBUG    | __main__:trials:29 - Trial = 27909/30000 | Total reward = 24.13
2022-01-26 14:18:42.150 | DEBUG    | __main__:trials:24 - Trial = 27910/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.152 | DEBUG    | __main__:trials:29 - Trial = 27910/30000 | Total reward = 41.77
2022-01-26 14:18:42.155 | DEBUG    | __main__:trials:24 - Trial = 27911/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.156 | DEBUG    | __main__:trials:29 - Trial = 27911/30000 | Total reward = 27.05
2022-01-26 14:18:42.160 | DEBUG    | __main__:trials:24 - Trial = 27912/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.161 | DEBUG    | __main__:trials:29 - Trial = 27912/30000 | Total reward = 33.89
2022-01-26 14:18:42.165 | DEBUG    | __main__:trials:24 - Trial = 27913/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.166 | DEBUG    | __main__:trials:29 - Trial = 27913/30000 | Total reward = 55.68
2022-01-26 14:18:42.170 | DEBUG    | __main__:trials:24 - Trial = 27914/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.171 | DEBUG    | __main__:trials:29 - Trial = 27914/30000 | Total reward = 36.89
2022-01-26 14:18:42.175 | DEBUG    | __main__:trials:24 - Trial = 27915/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.177 | DEBUG    | __main__:trials:29 - Trial = 27915/30000 | Total reward = 42.86
2022-01-26 14:18:42.180 | DEBUG    | __main__:trials:24 - Trial = 27916/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.182 | DEBUG    | __main__:trials:29 - Trial = 27916/30000 | Total reward = 46.04
2022-01-26 14:18:42.185 | DEBUG    | __main__:trials:24 - Trial = 27917/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.187 | DEBUG    | __main__:trials:29 - Trial = 27917/30000 | Total reward = 37.18
2022-01-26 14:18:42.191 | DEBUG    | __main__:trials:24 - Trial = 27918/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.192 | DEBUG    | __main__:trials:29 - Trial = 27918/30000 | Total reward = 29.94
2022-01-26 14:18:42.196 | DEBUG    | __main__:trials:24 - Trial = 27919/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.198 | DEBUG    | __main__:trials:29 - Trial = 27919/30000 | Total reward = 46.09
2022-01-26 14:18:42.201 | DEBUG    | __main__:trials:24 - Trial = 27920/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.202 | DEBUG    | __main__:trials:29 - Trial = 27920/30000 | Total reward = 45.13
2022-01-26 14:18:42.206 | DEBUG    | __main__:trials:24 - Trial = 27921/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.208 | DEBUG    | __main__:trials:29 - Trial = 27921/30000 | Total reward = 35.57
2022-01-26 14:18:42.211 | DEBUG    | __main__:trials:24 - Trial = 27922/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.213 | DEBUG    | __main__:trials:29 - Trial = 27922/30000 | Total reward = 49.04
2022-01-26 14:18:42.217 | DEBUG    | __main__:trials:24 - Trial = 27923/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.218 | DEBUG    | __main__:trials:29 - Trial = 27923/30000 | Total reward = 39.64
2022-01-26 14:18:42.222 | DEBUG    | __main__:trials:24 - Trial = 27924/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.223 | DEBUG    | __main__:trials:29 - Trial = 27924/30000 | Total reward = 42.65
2022-01-26 14:18:42.227 | DEBUG    | __main__:trials:24 - Trial = 27925/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.229 | DEBUG    | __main__:trials:29 - Trial = 27925/30000 | Total reward = 41.82
2022-01-26 14:18:42.233 | DEBUG    | __main__:trials:24 - Trial = 27926/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.233 | DEBUG    | __main__:trials:29 - Trial = 27926/30000 | Total reward = 40.91
2022-01-26 14:18:42.237 | DEBUG    | __main__:trials:24 - Trial = 27927/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.238 | DEBUG    | __main__:trials:29 - Trial = 27927/30000 | Total reward = 47.03
2022-01-26 14:18:42.241 | DEBUG    | __main__:trials:24 - Trial = 27928/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.242 | DEBUG    | __main__:trials:29 - Trial = 27928/30000 | Total reward = 36.91
2022-01-26 14:18:42.245 | DEBUG    | __main__:trials:24 - Trial = 27929/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.247 | DEBUG    | __main__:trials:29 - Trial = 27929/30000 | Total reward = 44.08
2022-01-26 14:18:42.250 | DEBUG    | __main__:trials:24 - Trial = 27930/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.251 | DEBUG    | __main__:trials:29 - Trial = 27930/30000 | Total reward = 44.82
2022-01-26 14:18:42.254 | DEBUG    | __main__:trials:24 - Trial = 27931/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.256 | DEBUG    | __main__:trials:29 - Trial = 27931/30000 | Total reward = 45.48
2022-01-26 14:18:42.259 | DEBUG    | __main__:trials:24 - Trial = 27932/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.261 | DEBUG    | __main__:trials:29 - Trial = 27932/30000 | Total reward = 41.89
2022-01-26 14:18:42.265 | DEBUG    | __main__:trials:24 - Trial = 27933/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.267 | DEBUG    | __main__:trials:29 - Trial = 27933/30000 | Total reward = 52.62
2022-01-26 14:18:42.270 | DEBUG    | __main__:trials:24 - Trial = 27934/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.272 | DEBUG    | __main__:trials:29 - Trial = 27934/30000 | Total reward = 36.59
2022-01-26 14:18:42.276 | DEBUG    | __main__:trials:24 - Trial = 27935/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.278 | DEBUG    | __main__:trials:29 - Trial = 27935/30000 | Total reward = 36.81
2022-01-26 14:18:42.281 | DEBUG    | __main__:trials:24 - Trial = 27936/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.283 | DEBUG    | __main__:trials:29 - Trial = 27936/30000 | Total reward = 41.84
2022-01-26 14:18:42.287 | DEBUG    | __main__:trials:24 - Trial = 27937/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.289 | DEBUG    | __main__:trials:29 - Trial = 27937/30000 | Total reward = 39.68
2022-01-26 14:18:42.293 | DEBUG    | __main__:trials:24 - Trial = 27938/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.294 | DEBUG    | __main__:trials:29 - Trial = 27938/30000 | Total reward = 43.82
2022-01-26 14:18:42.297 | DEBUG    | __main__:trials:24 - Trial = 27939/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.299 | DEBUG    | __main__:trials:29 - Trial = 27939/30000 | Total reward = 44.08
2022-01-26 14:18:42.302 | DEBUG    | __main__:trials:24 - Trial = 27940/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.304 | DEBUG    | __main__:trials:29 - Trial = 27940/30000 | Total reward = 31.14
2022-01-26 14:18:42.307 | DEBUG    | __main__:trials:24 - Trial = 27941/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.309 | DEBUG    | __main__:trials:29 - Trial = 27941/30000 | Total reward = 31.19
2022-01-26 14:18:42.312 | DEBUG    | __main__:trials:24 - Trial = 27942/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.313 | DEBUG    | __main__:trials:29 - Trial = 27942/30000 | Total reward = 41.47
2022-01-26 14:18:42.317 | DEBUG    | __main__:trials:24 - Trial = 27943/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.318 | DEBUG    | __main__:trials:29 - Trial = 27943/30000 | Total reward = 42.15
2022-01-26 14:18:42.321 | DEBUG    | __main__:trials:24 - Trial = 27944/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.322 | DEBUG    | __main__:trials:29 - Trial = 27944/30000 | Total reward = 30.07
2022-01-26 14:18:42.326 | DEBUG    | __main__:trials:24 - Trial = 27945/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.327 | DEBUG    | __main__:trials:29 - Trial = 27945/30000 | Total reward = 34.64
2022-01-26 14:18:42.330 | DEBUG    | __main__:trials:24 - Trial = 27946/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.332 | DEBUG    | __main__:trials:29 - Trial = 27946/30000 | Total reward = 42.35
2022-01-26 14:18:42.335 | DEBUG    | __main__:trials:24 - Trial = 27947/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.337 | DEBUG    | __main__:trials:29 - Trial = 27947/30000 | Total reward = 33.87
2022-01-26 14:18:42.340 | DEBUG    | __main__:trials:24 - Trial = 27948/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.342 | DEBUG    | __main__:trials:29 - Trial = 27948/30000 | Total reward = 41.47
2022-01-26 14:18:42.345 | DEBUG    | __main__:trials:24 - Trial = 27949/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.347 | DEBUG    | __main__:trials:29 - Trial = 27949/30000 | Total reward = 42.07
2022-01-26 14:18:42.351 | DEBUG    | __main__:trials:24 - Trial = 27950/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.353 | DEBUG    | __main__:trials:29 - Trial = 27950/30000 | Total reward = 26.91
2022-01-26 14:18:42.356 | DEBUG    | __main__:trials:24 - Trial = 27951/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.358 | DEBUG    | __main__:trials:29 - Trial = 27951/30000 | Total reward = 38.55
2022-01-26 14:18:42.361 | DEBUG    | __main__:trials:24 - Trial = 27952/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.361 | DEBUG    | __main__:trials:29 - Trial = 27952/30000 | Total reward = 47.08
2022-01-26 14:18:42.365 | DEBUG    | __main__:trials:24 - Trial = 27953/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.366 | DEBUG    | __main__:trials:29 - Trial = 27953/30000 | Total reward = 37.80
2022-01-26 14:18:42.369 | DEBUG    | __main__:trials:24 - Trial = 27954/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.370 | DEBUG    | __main__:trials:29 - Trial = 27954/30000 | Total reward = 33.14
2022-01-26 14:18:42.373 | DEBUG    | __main__:trials:24 - Trial = 27955/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.374 | DEBUG    | __main__:trials:29 - Trial = 27955/30000 | Total reward = 43.99
2022-01-26 14:18:42.377 | DEBUG    | __main__:trials:24 - Trial = 27956/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.378 | DEBUG    | __main__:trials:29 - Trial = 27956/30000 | Total reward = 34.36
2022-01-26 14:18:42.381 | DEBUG    | __main__:trials:24 - Trial = 27957/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.382 | DEBUG    | __main__:trials:29 - Trial = 27957/30000 | Total reward = 26.63
2022-01-26 14:18:42.385 | DEBUG    | __main__:trials:24 - Trial = 27958/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.387 | DEBUG    | __main__:trials:29 - Trial = 27958/30000 | Total reward = 40.62
2022-01-26 14:18:42.390 | DEBUG    | __main__:trials:24 - Trial = 27959/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.391 | DEBUG    | __main__:trials:29 - Trial = 27959/30000 | Total reward = 39.53
2022-01-26 14:18:42.394 | DEBUG    | __main__:trials:24 - Trial = 27960/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.395 | DEBUG    | __main__:trials:29 - Trial = 27960/30000 | Total reward = 33.87
2022-01-26 14:18:42.399 | DEBUG    | __main__:trials:24 - Trial = 27961/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.400 | DEBUG    | __main__:trials:29 - Trial = 27961/30000 | Total reward = 44.44
2022-01-26 14:18:42.404 | DEBUG    | __main__:trials:24 - Trial = 27962/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.405 | DEBUG    | __main__:trials:29 - Trial = 27962/30000 | Total reward = 42.92
2022-01-26 14:18:42.408 | DEBUG    | __main__:trials:24 - Trial = 27963/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.410 | DEBUG    | __main__:trials:29 - Trial = 27963/30000 | Total reward = 35.86
2022-01-26 14:18:42.413 | DEBUG    | __main__:trials:24 - Trial = 27964/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.414 | DEBUG    | __main__:trials:29 - Trial = 27964/30000 | Total reward = 24.71
2022-01-26 14:18:42.417 | DEBUG    | __main__:trials:24 - Trial = 27965/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.419 | DEBUG    | __main__:trials:29 - Trial = 27965/30000 | Total reward = 47.56
2022-01-26 14:18:42.423 | DEBUG    | __main__:trials:24 - Trial = 27966/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.425 | DEBUG    | __main__:trials:29 - Trial = 27966/30000 | Total reward = 49.51
2022-01-26 14:18:42.429 | DEBUG    | __main__:trials:24 - Trial = 27967/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.430 | DEBUG    | __main__:trials:29 - Trial = 27967/30000 | Total reward = 45.03
2022-01-26 14:18:42.433 | DEBUG    | __main__:trials:24 - Trial = 27968/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.435 | DEBUG    | __main__:trials:29 - Trial = 27968/30000 | Total reward = 42.73
2022-01-26 14:18:42.439 | DEBUG    | __main__:trials:24 - Trial = 27969/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.440 | DEBUG    | __main__:trials:29 - Trial = 27969/30000 | Total reward = 29.58
2022-01-26 14:18:42.443 | DEBUG    | __main__:trials:24 - Trial = 27970/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.445 | DEBUG    | __main__:trials:29 - Trial = 27970/30000 | Total reward = 37.02
2022-01-26 14:18:42.449 | DEBUG    | __main__:trials:24 - Trial = 27971/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.451 | DEBUG    | __main__:trials:29 - Trial = 27971/30000 | Total reward = 42.15
2022-01-26 14:18:42.454 | DEBUG    | __main__:trials:24 - Trial = 27972/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.455 | DEBUG    | __main__:trials:29 - Trial = 27972/30000 | Total reward = 43.85
2022-01-26 14:18:42.459 | DEBUG    | __main__:trials:24 - Trial = 27973/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.460 | DEBUG    | __main__:trials:29 - Trial = 27973/30000 | Total reward = 41.04
2022-01-26 14:18:42.464 | DEBUG    | __main__:trials:24 - Trial = 27974/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.466 | DEBUG    | __main__:trials:29 - Trial = 27974/30000 | Total reward = 49.46
2022-01-26 14:18:42.470 | DEBUG    | __main__:trials:24 - Trial = 27975/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.471 | DEBUG    | __main__:trials:29 - Trial = 27975/30000 | Total reward = 55.78
2022-01-26 14:18:42.475 | DEBUG    | __main__:trials:24 - Trial = 27976/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.476 | DEBUG    | __main__:trials:29 - Trial = 27976/30000 | Total reward = 41.83
2022-01-26 14:18:42.480 | DEBUG    | __main__:trials:24 - Trial = 27977/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.482 | DEBUG    | __main__:trials:29 - Trial = 27977/30000 | Total reward = 52.08
2022-01-26 14:18:42.485 | DEBUG    | __main__:trials:24 - Trial = 27978/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.487 | DEBUG    | __main__:trials:29 - Trial = 27978/30000 | Total reward = 32.88
2022-01-26 14:18:42.491 | DEBUG    | __main__:trials:24 - Trial = 27979/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.492 | DEBUG    | __main__:trials:29 - Trial = 27979/30000 | Total reward = 40.45
2022-01-26 14:18:42.495 | DEBUG    | __main__:trials:24 - Trial = 27980/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.497 | DEBUG    | __main__:trials:29 - Trial = 27980/30000 | Total reward = 49.63
2022-01-26 14:18:42.500 | DEBUG    | __main__:trials:24 - Trial = 27981/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.502 | DEBUG    | __main__:trials:29 - Trial = 27981/30000 | Total reward = 42.15
2022-01-26 14:18:42.506 | DEBUG    | __main__:trials:24 - Trial = 27982/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.507 | DEBUG    | __main__:trials:29 - Trial = 27982/30000 | Total reward = 44.62
2022-01-26 14:18:42.511 | DEBUG    | __main__:trials:24 - Trial = 27983/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.513 | DEBUG    | __main__:trials:29 - Trial = 27983/30000 | Total reward = 44.17
2022-01-26 14:18:42.516 | DEBUG    | __main__:trials:24 - Trial = 27984/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.518 | DEBUG    | __main__:trials:29 - Trial = 27984/30000 | Total reward = 42.50
2022-01-26 14:18:42.522 | DEBUG    | __main__:trials:24 - Trial = 27985/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.522 | DEBUG    | __main__:trials:29 - Trial = 27985/30000 | Total reward = 34.55
2022-01-26 14:18:42.526 | DEBUG    | __main__:trials:24 - Trial = 27986/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.528 | DEBUG    | __main__:trials:29 - Trial = 27986/30000 | Total reward = 40.22
2022-01-26 14:18:42.532 | DEBUG    | __main__:trials:24 - Trial = 27987/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.533 | DEBUG    | __main__:trials:29 - Trial = 27987/30000 | Total reward = 37.66
2022-01-26 14:18:42.537 | DEBUG    | __main__:trials:24 - Trial = 27988/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.539 | DEBUG    | __main__:trials:29 - Trial = 27988/30000 | Total reward = 45.54
2022-01-26 14:18:42.541 | DEBUG    | __main__:trials:26 - Trial = 27989/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.543 | DEBUG    | __main__:trials:29 - Trial = 27989/30000 | Total reward = 17.91
2022-01-26 14:18:42.546 | DEBUG    | __main__:trials:24 - Trial = 27990/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.548 | DEBUG    | __main__:trials:29 - Trial = 27990/30000 | Total reward = 30.23
2022-01-26 14:18:42.551 | DEBUG    | __main__:trials:24 - Trial = 27991/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.552 | DEBUG    | __main__:trials:29 - Trial = 27991/30000 | Total reward = 40.64
2022-01-26 14:18:42.556 | DEBUG    | __main__:trials:24 - Trial = 27992/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.558 | DEBUG    | __main__:trials:29 - Trial = 27992/30000 | Total reward = 28.41
2022-01-26 14:18:42.562 | DEBUG    | __main__:trials:24 - Trial = 27993/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.563 | DEBUG    | __main__:trials:29 - Trial = 27993/30000 | Total reward = 38.93
2022-01-26 14:18:42.567 | DEBUG    | __main__:trials:24 - Trial = 27994/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.568 | DEBUG    | __main__:trials:29 - Trial = 27994/30000 | Total reward = 22.18
2022-01-26 14:18:42.572 | DEBUG    | __main__:trials:24 - Trial = 27995/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.573 | DEBUG    | __main__:trials:29 - Trial = 27995/30000 | Total reward = 43.73
2022-01-26 14:18:42.577 | DEBUG    | __main__:trials:24 - Trial = 27996/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.578 | DEBUG    | __main__:trials:29 - Trial = 27996/30000 | Total reward = 49.63
2022-01-26 14:18:42.581 | DEBUG    | __main__:trials:26 - Trial = 27997/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.581 | DEBUG    | __main__:trials:29 - Trial = 27997/30000 | Total reward = 14.80
2022-01-26 14:18:42.585 | DEBUG    | __main__:trials:24 - Trial = 27998/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.587 | DEBUG    | __main__:trials:29 - Trial = 27998/30000 | Total reward = 40.93
2022-01-26 14:18:42.591 | DEBUG    | __main__:trials:24 - Trial = 27999/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.592 | DEBUG    | __main__:trials:29 - Trial = 27999/30000 | Total reward = 43.20
2022-01-26 14:18:42.596 | DEBUG    | __main__:trials:24 - Trial = 28000/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.598 | DEBUG    | __main__:trials:29 - Trial = 28000/30000 | Total reward = 40.45
2022-01-26 14:18:42.600 | DEBUG    | __main__:trials:24 - Trial = 28001/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.602 | DEBUG    | __main__:trials:29 - Trial = 28001/30000 | Total reward = 35.02
2022-01-26 14:18:42.605 | DEBUG    | __main__:trials:24 - Trial = 28002/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.606 | DEBUG    | __main__:trials:29 - Trial = 28002/30000 | Total reward = 35.32
2022-01-26 14:18:42.611 | DEBUG    | __main__:trials:24 - Trial = 28003/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.612 | DEBUG    | __main__:trials:29 - Trial = 28003/30000 | Total reward = 25.30
2022-01-26 14:18:42.616 | DEBUG    | __main__:trials:24 - Trial = 28004/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.618 | DEBUG    | __main__:trials:29 - Trial = 28004/30000 | Total reward = 34.45
2022-01-26 14:18:42.620 | DEBUG    | __main__:trials:26 - Trial = 28005/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.622 | DEBUG    | __main__:trials:29 - Trial = 28005/30000 | Total reward = 24.07
2022-01-26 14:18:42.625 | DEBUG    | __main__:trials:26 - Trial = 28006/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.626 | DEBUG    | __main__:trials:29 - Trial = 28006/30000 | Total reward = 16.32
2022-01-26 14:18:42.628 | DEBUG    | __main__:trials:26 - Trial = 28007/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.630 | DEBUG    | __main__:trials:29 - Trial = 28007/30000 | Total reward = 12.90
2022-01-26 14:18:42.633 | DEBUG    | __main__:trials:24 - Trial = 28008/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.635 | DEBUG    | __main__:trials:29 - Trial = 28008/30000 | Total reward = 36.39
2022-01-26 14:18:42.638 | DEBUG    | __main__:trials:24 - Trial = 28009/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.640 | DEBUG    | __main__:trials:29 - Trial = 28009/30000 | Total reward = 31.06
2022-01-26 14:18:42.644 | DEBUG    | __main__:trials:24 - Trial = 28010/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.645 | DEBUG    | __main__:trials:29 - Trial = 28010/30000 | Total reward = 40.69
2022-01-26 14:18:42.649 | DEBUG    | __main__:trials:24 - Trial = 28011/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.651 | DEBUG    | __main__:trials:29 - Trial = 28011/30000 | Total reward = 38.50
2022-01-26 14:18:42.653 | DEBUG    | __main__:trials:24 - Trial = 28012/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.655 | DEBUG    | __main__:trials:29 - Trial = 28012/30000 | Total reward = 44.04
2022-01-26 14:18:42.658 | DEBUG    | __main__:trials:24 - Trial = 28013/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.660 | DEBUG    | __main__:trials:29 - Trial = 28013/30000 | Total reward = 40.82
2022-01-26 14:18:42.663 | DEBUG    | __main__:trials:24 - Trial = 28014/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.665 | DEBUG    | __main__:trials:29 - Trial = 28014/30000 | Total reward = 47.84
2022-01-26 14:18:42.668 | DEBUG    | __main__:trials:24 - Trial = 28015/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.670 | DEBUG    | __main__:trials:29 - Trial = 28015/30000 | Total reward = 52.46
2022-01-26 14:18:42.674 | DEBUG    | __main__:trials:24 - Trial = 28016/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.674 | DEBUG    | __main__:trials:29 - Trial = 28016/30000 | Total reward = 48.55
2022-01-26 14:18:42.678 | DEBUG    | __main__:trials:24 - Trial = 28017/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.679 | DEBUG    | __main__:trials:29 - Trial = 28017/30000 | Total reward = 33.65
2022-01-26 14:18:42.682 | DEBUG    | __main__:trials:26 - Trial = 28018/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.683 | DEBUG    | __main__:trials:29 - Trial = 28018/30000 | Total reward = 19.36
2022-01-26 14:18:42.687 | DEBUG    | __main__:trials:24 - Trial = 28019/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.688 | DEBUG    | __main__:trials:29 - Trial = 28019/30000 | Total reward = 42.56
2022-01-26 14:18:42.692 | DEBUG    | __main__:trials:24 - Trial = 28020/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.693 | DEBUG    | __main__:trials:29 - Trial = 28020/30000 | Total reward = 46.09
2022-01-26 14:18:42.697 | DEBUG    | __main__:trials:24 - Trial = 28021/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.698 | DEBUG    | __main__:trials:29 - Trial = 28021/30000 | Total reward = 45.78
2022-01-26 14:18:42.702 | DEBUG    | __main__:trials:24 - Trial = 28022/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.704 | DEBUG    | __main__:trials:29 - Trial = 28022/30000 | Total reward = 39.87
2022-01-26 14:18:42.706 | DEBUG    | __main__:trials:24 - Trial = 28023/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.708 | DEBUG    | __main__:trials:29 - Trial = 28023/30000 | Total reward = 36.09
2022-01-26 14:18:42.712 | DEBUG    | __main__:trials:24 - Trial = 28024/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.714 | DEBUG    | __main__:trials:29 - Trial = 28024/30000 | Total reward = 30.33
2022-01-26 14:18:42.717 | DEBUG    | __main__:trials:26 - Trial = 28025/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.718 | DEBUG    | __main__:trials:29 - Trial = 28025/30000 | Total reward = 17.96
2022-01-26 14:18:42.722 | DEBUG    | __main__:trials:24 - Trial = 28026/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.723 | DEBUG    | __main__:trials:29 - Trial = 28026/30000 | Total reward = 36.42
2022-01-26 14:18:42.726 | DEBUG    | __main__:trials:24 - Trial = 28027/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.728 | DEBUG    | __main__:trials:29 - Trial = 28027/30000 | Total reward = 38.83
2022-01-26 14:18:42.732 | DEBUG    | __main__:trials:24 - Trial = 28028/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.733 | DEBUG    | __main__:trials:29 - Trial = 28028/30000 | Total reward = 33.63
2022-01-26 14:18:42.736 | DEBUG    | __main__:trials:26 - Trial = 28029/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.738 | DEBUG    | __main__:trials:29 - Trial = 28029/30000 | Total reward = 17.08
2022-01-26 14:18:42.742 | DEBUG    | __main__:trials:24 - Trial = 28030/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.743 | DEBUG    | __main__:trials:29 - Trial = 28030/30000 | Total reward = 28.58
2022-01-26 14:18:42.747 | DEBUG    | __main__:trials:24 - Trial = 28031/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.748 | DEBUG    | __main__:trials:29 - Trial = 28031/30000 | Total reward = 37.76
2022-01-26 14:18:42.752 | DEBUG    | __main__:trials:24 - Trial = 28032/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.754 | DEBUG    | __main__:trials:29 - Trial = 28032/30000 | Total reward = 37.27
2022-01-26 14:18:42.757 | DEBUG    | __main__:trials:24 - Trial = 28033/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.759 | DEBUG    | __main__:trials:29 - Trial = 28033/30000 | Total reward = 34.42
2022-01-26 14:18:42.762 | DEBUG    | __main__:trials:26 - Trial = 28034/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.764 | DEBUG    | __main__:trials:29 - Trial = 28034/30000 | Total reward = 29.58
2022-01-26 14:18:42.767 | DEBUG    | __main__:trials:24 - Trial = 28035/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.769 | DEBUG    | __main__:trials:29 - Trial = 28035/30000 | Total reward = 25.92
2022-01-26 14:18:42.772 | DEBUG    | __main__:trials:24 - Trial = 28036/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.774 | DEBUG    | __main__:trials:29 - Trial = 28036/30000 | Total reward = 42.70
2022-01-26 14:18:42.778 | DEBUG    | __main__:trials:24 - Trial = 28037/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.779 | DEBUG    | __main__:trials:29 - Trial = 28037/30000 | Total reward = 39.36
2022-01-26 14:18:42.783 | DEBUG    | __main__:trials:24 - Trial = 28038/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.784 | DEBUG    | __main__:trials:29 - Trial = 28038/30000 | Total reward = 42.24
2022-01-26 14:18:42.787 | DEBUG    | __main__:trials:24 - Trial = 28039/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.789 | DEBUG    | __main__:trials:29 - Trial = 28039/30000 | Total reward = 50.15
2022-01-26 14:18:42.793 | DEBUG    | __main__:trials:24 - Trial = 28040/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.795 | DEBUG    | __main__:trials:29 - Trial = 28040/30000 | Total reward = 39.23
2022-01-26 14:18:42.798 | DEBUG    | __main__:trials:24 - Trial = 28041/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.800 | DEBUG    | __main__:trials:29 - Trial = 28041/30000 | Total reward = 45.80
2022-01-26 14:18:42.804 | DEBUG    | __main__:trials:24 - Trial = 28042/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.805 | DEBUG    | __main__:trials:29 - Trial = 28042/30000 | Total reward = 37.18
2022-01-26 14:18:42.808 | DEBUG    | __main__:trials:24 - Trial = 28043/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.810 | DEBUG    | __main__:trials:29 - Trial = 28043/30000 | Total reward = 43.49
2022-01-26 14:18:42.814 | DEBUG    | __main__:trials:24 - Trial = 28044/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.816 | DEBUG    | __main__:trials:29 - Trial = 28044/30000 | Total reward = 44.44
2022-01-26 14:18:42.819 | DEBUG    | __main__:trials:24 - Trial = 28045/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.821 | DEBUG    | __main__:trials:29 - Trial = 28045/30000 | Total reward = 50.31
2022-01-26 14:18:42.824 | DEBUG    | __main__:trials:24 - Trial = 28046/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.826 | DEBUG    | __main__:trials:29 - Trial = 28046/30000 | Total reward = 47.73
2022-01-26 14:18:42.829 | DEBUG    | __main__:trials:24 - Trial = 28047/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.831 | DEBUG    | __main__:trials:29 - Trial = 28047/30000 | Total reward = 60.65
2022-01-26 14:18:42.835 | DEBUG    | __main__:trials:24 - Trial = 28048/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.836 | DEBUG    | __main__:trials:29 - Trial = 28048/30000 | Total reward = 36.00
2022-01-26 14:18:42.840 | DEBUG    | __main__:trials:24 - Trial = 28049/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.841 | DEBUG    | __main__:trials:29 - Trial = 28049/30000 | Total reward = 43.21
2022-01-26 14:18:42.845 | DEBUG    | __main__:trials:24 - Trial = 28050/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.846 | DEBUG    | __main__:trials:29 - Trial = 28050/30000 | Total reward = 31.96
2022-01-26 14:18:42.850 | DEBUG    | __main__:trials:24 - Trial = 28051/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.852 | DEBUG    | __main__:trials:29 - Trial = 28051/30000 | Total reward = 54.76
2022-01-26 14:18:42.856 | DEBUG    | __main__:trials:24 - Trial = 28052/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.857 | DEBUG    | __main__:trials:29 - Trial = 28052/30000 | Total reward = 29.88
2022-01-26 14:18:42.860 | DEBUG    | __main__:trials:24 - Trial = 28053/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.862 | DEBUG    | __main__:trials:29 - Trial = 28053/30000 | Total reward = 36.89
2022-01-26 14:18:42.866 | DEBUG    | __main__:trials:24 - Trial = 28054/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.867 | DEBUG    | __main__:trials:29 - Trial = 28054/30000 | Total reward = 35.77
2022-01-26 14:18:42.870 | DEBUG    | __main__:trials:24 - Trial = 28055/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.872 | DEBUG    | __main__:trials:29 - Trial = 28055/30000 | Total reward = 36.64
2022-01-26 14:18:42.876 | DEBUG    | __main__:trials:26 - Trial = 28056/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.877 | DEBUG    | __main__:trials:29 - Trial = 28056/30000 | Total reward = 26.43
2022-01-26 14:18:42.880 | DEBUG    | __main__:trials:24 - Trial = 28057/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.882 | DEBUG    | __main__:trials:29 - Trial = 28057/30000 | Total reward = 39.87
2022-01-26 14:18:42.886 | DEBUG    | __main__:trials:24 - Trial = 28058/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.886 | DEBUG    | __main__:trials:29 - Trial = 28058/30000 | Total reward = 38.03
2022-01-26 14:18:42.890 | DEBUG    | __main__:trials:24 - Trial = 28059/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.892 | DEBUG    | __main__:trials:29 - Trial = 28059/30000 | Total reward = 39.63
2022-01-26 14:18:42.896 | DEBUG    | __main__:trials:24 - Trial = 28060/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.897 | DEBUG    | __main__:trials:29 - Trial = 28060/30000 | Total reward = 40.29
2022-01-26 14:18:42.901 | DEBUG    | __main__:trials:24 - Trial = 28061/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.903 | DEBUG    | __main__:trials:29 - Trial = 28061/30000 | Total reward = 36.16
2022-01-26 14:18:42.906 | DEBUG    | __main__:trials:24 - Trial = 28062/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.908 | DEBUG    | __main__:trials:29 - Trial = 28062/30000 | Total reward = 46.80
2022-01-26 14:18:42.912 | DEBUG    | __main__:trials:24 - Trial = 28063/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.912 | DEBUG    | __main__:trials:29 - Trial = 28063/30000 | Total reward = 49.06
2022-01-26 14:18:42.916 | DEBUG    | __main__:trials:24 - Trial = 28064/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.918 | DEBUG    | __main__:trials:29 - Trial = 28064/30000 | Total reward = 53.11
2022-01-26 14:18:42.921 | DEBUG    | __main__:trials:24 - Trial = 28065/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.923 | DEBUG    | __main__:trials:29 - Trial = 28065/30000 | Total reward = 41.33
2022-01-26 14:18:42.927 | DEBUG    | __main__:trials:24 - Trial = 28066/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.928 | DEBUG    | __main__:trials:29 - Trial = 28066/30000 | Total reward = 37.98
2022-01-26 14:18:42.932 | DEBUG    | __main__:trials:24 - Trial = 28067/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.933 | DEBUG    | __main__:trials:29 - Trial = 28067/30000 | Total reward = 39.62
2022-01-26 14:18:42.937 | DEBUG    | __main__:trials:24 - Trial = 28068/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.939 | DEBUG    | __main__:trials:29 - Trial = 28068/30000 | Total reward = 35.45
2022-01-26 14:18:42.942 | DEBUG    | __main__:trials:24 - Trial = 28069/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.944 | DEBUG    | __main__:trials:29 - Trial = 28069/30000 | Total reward = 44.86
2022-01-26 14:18:42.947 | DEBUG    | __main__:trials:24 - Trial = 28070/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.949 | DEBUG    | __main__:trials:29 - Trial = 28070/30000 | Total reward = 47.45
2022-01-26 14:18:42.953 | DEBUG    | __main__:trials:26 - Trial = 28071/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.954 | DEBUG    | __main__:trials:29 - Trial = 28071/30000 | Total reward = 22.62
2022-01-26 14:18:42.957 | DEBUG    | __main__:trials:24 - Trial = 28072/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.958 | DEBUG    | __main__:trials:29 - Trial = 28072/30000 | Total reward = 42.25
2022-01-26 14:18:42.962 | DEBUG    | __main__:trials:24 - Trial = 28073/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.963 | DEBUG    | __main__:trials:29 - Trial = 28073/30000 | Total reward = 37.23
2022-01-26 14:18:42.966 | DEBUG    | __main__:trials:26 - Trial = 28074/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.968 | DEBUG    | __main__:trials:29 - Trial = 28074/30000 | Total reward = 17.83
2022-01-26 14:18:42.972 | DEBUG    | __main__:trials:24 - Trial = 28075/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.973 | DEBUG    | __main__:trials:29 - Trial = 28075/30000 | Total reward = 35.14
2022-01-26 14:18:42.977 | DEBUG    | __main__:trials:24 - Trial = 28076/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.979 | DEBUG    | __main__:trials:29 - Trial = 28076/30000 | Total reward = 41.18
2022-01-26 14:18:42.982 | DEBUG    | __main__:trials:26 - Trial = 28077/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:42.984 | DEBUG    | __main__:trials:29 - Trial = 28077/30000 | Total reward = 21.61
2022-01-26 14:18:42.987 | DEBUG    | __main__:trials:24 - Trial = 28078/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.989 | DEBUG    | __main__:trials:29 - Trial = 28078/30000 | Total reward = 41.78
2022-01-26 14:18:42.996 | DEBUG    | __main__:trials:24 - Trial = 28079/30000 | Max number of steps (20) reached
2022-01-26 14:18:42.998 | DEBUG    | __main__:trials:29 - Trial = 28079/30000 | Total reward = 42.15
2022-01-26 14:18:43.001 | DEBUG    | __main__:trials:24 - Trial = 28080/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.003 | DEBUG    | __main__:trials:29 - Trial = 28080/30000 | Total reward = 39.14
2022-01-26 14:18:43.006 | DEBUG    | __main__:trials:24 - Trial = 28081/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.008 | DEBUG    | __main__:trials:29 - Trial = 28081/30000 | Total reward = 46.05
2022-01-26 14:18:43.012 | DEBUG    | __main__:trials:24 - Trial = 28082/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.013 | DEBUG    | __main__:trials:29 - Trial = 28082/30000 | Total reward = 41.37
2022-01-26 14:18:43.017 | DEBUG    | __main__:trials:24 - Trial = 28083/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.018 | DEBUG    | __main__:trials:29 - Trial = 28083/30000 | Total reward = 39.01
2022-01-26 14:18:43.022 | DEBUG    | __main__:trials:24 - Trial = 28084/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.023 | DEBUG    | __main__:trials:29 - Trial = 28084/30000 | Total reward = 33.21
2022-01-26 14:18:43.026 | DEBUG    | __main__:trials:24 - Trial = 28085/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.028 | DEBUG    | __main__:trials:29 - Trial = 28085/30000 | Total reward = 41.34
2022-01-26 14:18:43.032 | DEBUG    | __main__:trials:24 - Trial = 28086/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.033 | DEBUG    | __main__:trials:29 - Trial = 28086/30000 | Total reward = 42.95
2022-01-26 14:18:43.037 | DEBUG    | __main__:trials:24 - Trial = 28087/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.038 | DEBUG    | __main__:trials:29 - Trial = 28087/30000 | Total reward = 28.43
2022-01-26 14:18:43.042 | DEBUG    | __main__:trials:24 - Trial = 28088/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.044 | DEBUG    | __main__:trials:29 - Trial = 28088/30000 | Total reward = 47.32
2022-01-26 14:18:43.048 | DEBUG    | __main__:trials:24 - Trial = 28089/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.049 | DEBUG    | __main__:trials:29 - Trial = 28089/30000 | Total reward = 22.42
2022-01-26 14:18:43.053 | DEBUG    | __main__:trials:24 - Trial = 28090/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.054 | DEBUG    | __main__:trials:29 - Trial = 28090/30000 | Total reward = 42.59
2022-01-26 14:18:43.058 | DEBUG    | __main__:trials:24 - Trial = 28091/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.060 | DEBUG    | __main__:trials:29 - Trial = 28091/30000 | Total reward = 35.65
2022-01-26 14:18:43.063 | DEBUG    | __main__:trials:24 - Trial = 28092/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.065 | DEBUG    | __main__:trials:29 - Trial = 28092/30000 | Total reward = 38.68
2022-01-26 14:18:43.068 | DEBUG    | __main__:trials:24 - Trial = 28093/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.069 | DEBUG    | __main__:trials:29 - Trial = 28093/30000 | Total reward = 39.19
2022-01-26 14:18:43.073 | DEBUG    | __main__:trials:24 - Trial = 28094/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.075 | DEBUG    | __main__:trials:29 - Trial = 28094/30000 | Total reward = 49.74
2022-01-26 14:18:43.078 | DEBUG    | __main__:trials:24 - Trial = 28095/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.080 | DEBUG    | __main__:trials:29 - Trial = 28095/30000 | Total reward = 41.85
2022-01-26 14:18:43.083 | DEBUG    | __main__:trials:24 - Trial = 28096/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.084 | DEBUG    | __main__:trials:29 - Trial = 28096/30000 | Total reward = 44.83
2022-01-26 14:18:43.088 | DEBUG    | __main__:trials:24 - Trial = 28097/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.090 | DEBUG    | __main__:trials:29 - Trial = 28097/30000 | Total reward = 33.29
2022-01-26 14:18:43.093 | DEBUG    | __main__:trials:24 - Trial = 28098/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.095 | DEBUG    | __main__:trials:29 - Trial = 28098/30000 | Total reward = 49.01
2022-01-26 14:18:43.099 | DEBUG    | __main__:trials:24 - Trial = 28099/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.100 | DEBUG    | __main__:trials:29 - Trial = 28099/30000 | Total reward = 35.35
2022-01-26 14:18:43.104 | DEBUG    | __main__:trials:24 - Trial = 28100/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.106 | DEBUG    | __main__:trials:29 - Trial = 28100/30000 | Total reward = 27.32
2022-01-26 14:18:43.109 | DEBUG    | __main__:trials:24 - Trial = 28101/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.111 | DEBUG    | __main__:trials:29 - Trial = 28101/30000 | Total reward = 42.34
2022-01-26 14:18:43.114 | DEBUG    | __main__:trials:26 - Trial = 28102/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.116 | DEBUG    | __main__:trials:29 - Trial = 28102/30000 | Total reward = 23.08
2022-01-26 14:18:43.120 | DEBUG    | __main__:trials:24 - Trial = 28103/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.121 | DEBUG    | __main__:trials:29 - Trial = 28103/30000 | Total reward = 47.09
2022-01-26 14:18:43.124 | DEBUG    | __main__:trials:24 - Trial = 28104/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.126 | DEBUG    | __main__:trials:29 - Trial = 28104/30000 | Total reward = 36.15
2022-01-26 14:18:43.130 | DEBUG    | __main__:trials:24 - Trial = 28105/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.131 | DEBUG    | __main__:trials:29 - Trial = 28105/30000 | Total reward = 42.76
2022-01-26 14:18:43.134 | DEBUG    | __main__:trials:24 - Trial = 28106/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.136 | DEBUG    | __main__:trials:29 - Trial = 28106/30000 | Total reward = 42.24
2022-01-26 14:18:43.140 | DEBUG    | __main__:trials:24 - Trial = 28107/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.142 | DEBUG    | __main__:trials:29 - Trial = 28107/30000 | Total reward = 48.66
2022-01-26 14:18:43.145 | DEBUG    | __main__:trials:24 - Trial = 28108/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.147 | DEBUG    | __main__:trials:29 - Trial = 28108/30000 | Total reward = 52.10
2022-01-26 14:18:43.150 | DEBUG    | __main__:trials:24 - Trial = 28109/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.152 | DEBUG    | __main__:trials:29 - Trial = 28109/30000 | Total reward = 41.28
2022-01-26 14:18:43.155 | DEBUG    | __main__:trials:24 - Trial = 28110/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.158 | DEBUG    | __main__:trials:29 - Trial = 28110/30000 | Total reward = 49.99
2022-01-26 14:18:43.162 | DEBUG    | __main__:trials:24 - Trial = 28111/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.164 | DEBUG    | __main__:trials:29 - Trial = 28111/30000 | Total reward = 43.74
2022-01-26 14:18:43.168 | DEBUG    | __main__:trials:24 - Trial = 28112/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.169 | DEBUG    | __main__:trials:29 - Trial = 28112/30000 | Total reward = 33.16
2022-01-26 14:18:43.173 | DEBUG    | __main__:trials:24 - Trial = 28113/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.175 | DEBUG    | __main__:trials:29 - Trial = 28113/30000 | Total reward = 39.76
2022-01-26 14:18:43.178 | DEBUG    | __main__:trials:24 - Trial = 28114/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.180 | DEBUG    | __main__:trials:29 - Trial = 28114/30000 | Total reward = 34.13
2022-01-26 14:18:43.183 | DEBUG    | __main__:trials:24 - Trial = 28115/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.185 | DEBUG    | __main__:trials:29 - Trial = 28115/30000 | Total reward = 34.30
2022-01-26 14:18:43.188 | DEBUG    | __main__:trials:26 - Trial = 28116/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.190 | DEBUG    | __main__:trials:29 - Trial = 28116/30000 | Total reward = 20.66
2022-01-26 14:18:43.194 | DEBUG    | __main__:trials:24 - Trial = 28117/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.195 | DEBUG    | __main__:trials:29 - Trial = 28117/30000 | Total reward = 42.56
2022-01-26 14:18:43.199 | DEBUG    | __main__:trials:24 - Trial = 28118/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.201 | DEBUG    | __main__:trials:29 - Trial = 28118/30000 | Total reward = 50.90
2022-01-26 14:18:43.204 | DEBUG    | __main__:trials:26 - Trial = 28119/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.205 | DEBUG    | __main__:trials:29 - Trial = 28119/30000 | Total reward = 12.77
2022-01-26 14:18:43.209 | DEBUG    | __main__:trials:24 - Trial = 28120/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.210 | DEBUG    | __main__:trials:29 - Trial = 28120/30000 | Total reward = 40.81
2022-01-26 14:18:43.214 | DEBUG    | __main__:trials:24 - Trial = 28121/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.216 | DEBUG    | __main__:trials:29 - Trial = 28121/30000 | Total reward = 37.59
2022-01-26 14:18:43.220 | DEBUG    | __main__:trials:24 - Trial = 28122/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.221 | DEBUG    | __main__:trials:29 - Trial = 28122/30000 | Total reward = 36.48
2022-01-26 14:18:43.225 | DEBUG    | __main__:trials:26 - Trial = 28123/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.225 | DEBUG    | __main__:trials:29 - Trial = 28123/30000 | Total reward = 32.66
2022-01-26 14:18:43.229 | DEBUG    | __main__:trials:24 - Trial = 28124/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.229 | DEBUG    | __main__:trials:29 - Trial = 28124/30000 | Total reward = 43.30
2022-01-26 14:18:43.234 | DEBUG    | __main__:trials:24 - Trial = 28125/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.235 | DEBUG    | __main__:trials:29 - Trial = 28125/30000 | Total reward = 39.02
2022-01-26 14:18:43.239 | DEBUG    | __main__:trials:24 - Trial = 28126/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.240 | DEBUG    | __main__:trials:29 - Trial = 28126/30000 | Total reward = 36.95
2022-01-26 14:18:43.244 | DEBUG    | __main__:trials:24 - Trial = 28127/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.246 | DEBUG    | __main__:trials:29 - Trial = 28127/30000 | Total reward = 35.35
2022-01-26 14:18:43.248 | DEBUG    | __main__:trials:24 - Trial = 28128/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.250 | DEBUG    | __main__:trials:29 - Trial = 28128/30000 | Total reward = 33.64
2022-01-26 14:18:43.254 | DEBUG    | __main__:trials:24 - Trial = 28129/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.256 | DEBUG    | __main__:trials:29 - Trial = 28129/30000 | Total reward = 46.45
2022-01-26 14:18:43.259 | DEBUG    | __main__:trials:24 - Trial = 28130/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.261 | DEBUG    | __main__:trials:29 - Trial = 28130/30000 | Total reward = 40.32
2022-01-26 14:18:43.265 | DEBUG    | __main__:trials:24 - Trial = 28131/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.265 | DEBUG    | __main__:trials:29 - Trial = 28131/30000 | Total reward = 44.76
2022-01-26 14:18:43.269 | DEBUG    | __main__:trials:24 - Trial = 28132/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.270 | DEBUG    | __main__:trials:29 - Trial = 28132/30000 | Total reward = 36.03
2022-01-26 14:18:43.274 | DEBUG    | __main__:trials:24 - Trial = 28133/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.274 | DEBUG    | __main__:trials:29 - Trial = 28133/30000 | Total reward = 42.20
2022-01-26 14:18:43.278 | DEBUG    | __main__:trials:24 - Trial = 28134/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.280 | DEBUG    | __main__:trials:29 - Trial = 28134/30000 | Total reward = 45.66
2022-01-26 14:18:43.284 | DEBUG    | __main__:trials:24 - Trial = 28135/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.284 | DEBUG    | __main__:trials:29 - Trial = 28135/30000 | Total reward = 37.62
2022-01-26 14:18:43.288 | DEBUG    | __main__:trials:24 - Trial = 28136/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.289 | DEBUG    | __main__:trials:29 - Trial = 28136/30000 | Total reward = 41.26
2022-01-26 14:18:43.293 | DEBUG    | __main__:trials:24 - Trial = 28137/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.293 | DEBUG    | __main__:trials:29 - Trial = 28137/30000 | Total reward = 45.76
2022-01-26 14:18:43.298 | DEBUG    | __main__:trials:24 - Trial = 28138/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.299 | DEBUG    | __main__:trials:29 - Trial = 28138/30000 | Total reward = 36.50
2022-01-26 14:18:43.303 | DEBUG    | __main__:trials:24 - Trial = 28139/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.304 | DEBUG    | __main__:trials:29 - Trial = 28139/30000 | Total reward = 28.33
2022-01-26 14:18:43.307 | DEBUG    | __main__:trials:24 - Trial = 28140/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.309 | DEBUG    | __main__:trials:29 - Trial = 28140/30000 | Total reward = 41.22
2022-01-26 14:18:43.313 | DEBUG    | __main__:trials:24 - Trial = 28141/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.315 | DEBUG    | __main__:trials:29 - Trial = 28141/30000 | Total reward = 41.91
2022-01-26 14:18:43.317 | DEBUG    | __main__:trials:24 - Trial = 28142/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.319 | DEBUG    | __main__:trials:29 - Trial = 28142/30000 | Total reward = 42.15
2022-01-26 14:18:43.323 | DEBUG    | __main__:trials:24 - Trial = 28143/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.325 | DEBUG    | __main__:trials:29 - Trial = 28143/30000 | Total reward = 42.27
2022-01-26 14:18:43.328 | DEBUG    | __main__:trials:24 - Trial = 28144/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.330 | DEBUG    | __main__:trials:29 - Trial = 28144/30000 | Total reward = 62.52
2022-01-26 14:18:43.333 | DEBUG    | __main__:trials:26 - Trial = 28145/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.334 | DEBUG    | __main__:trials:29 - Trial = 28145/30000 | Total reward = 18.80
2022-01-26 14:18:43.337 | DEBUG    | __main__:trials:26 - Trial = 28146/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.338 | DEBUG    | __main__:trials:29 - Trial = 28146/30000 | Total reward = 15.74
2022-01-26 14:18:43.341 | DEBUG    | __main__:trials:24 - Trial = 28147/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.343 | DEBUG    | __main__:trials:29 - Trial = 28147/30000 | Total reward = 42.90
2022-01-26 14:18:43.346 | DEBUG    | __main__:trials:24 - Trial = 28148/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.347 | DEBUG    | __main__:trials:29 - Trial = 28148/30000 | Total reward = 35.35
2022-01-26 14:18:43.350 | DEBUG    | __main__:trials:24 - Trial = 28149/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.352 | DEBUG    | __main__:trials:29 - Trial = 28149/30000 | Total reward = 37.65
2022-01-26 14:18:43.355 | DEBUG    | __main__:trials:24 - Trial = 28150/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.356 | DEBUG    | __main__:trials:29 - Trial = 28150/30000 | Total reward = 38.22
2022-01-26 14:18:43.360 | DEBUG    | __main__:trials:24 - Trial = 28151/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.360 | DEBUG    | __main__:trials:29 - Trial = 28151/30000 | Total reward = 56.16
2022-01-26 14:18:43.364 | DEBUG    | __main__:trials:24 - Trial = 28152/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.365 | DEBUG    | __main__:trials:29 - Trial = 28152/30000 | Total reward = 47.21
2022-01-26 14:18:43.369 | DEBUG    | __main__:trials:24 - Trial = 28153/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.369 | DEBUG    | __main__:trials:29 - Trial = 28153/30000 | Total reward = 37.98
2022-01-26 14:18:43.373 | DEBUG    | __main__:trials:24 - Trial = 28154/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.375 | DEBUG    | __main__:trials:29 - Trial = 28154/30000 | Total reward = 41.05
2022-01-26 14:18:43.379 | DEBUG    | __main__:trials:24 - Trial = 28155/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.380 | DEBUG    | __main__:trials:29 - Trial = 28155/30000 | Total reward = 40.44
2022-01-26 14:18:43.384 | DEBUG    | __main__:trials:24 - Trial = 28156/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.385 | DEBUG    | __main__:trials:29 - Trial = 28156/30000 | Total reward = 37.38
2022-01-26 14:18:43.389 | DEBUG    | __main__:trials:24 - Trial = 28157/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.391 | DEBUG    | __main__:trials:29 - Trial = 28157/30000 | Total reward = 42.34
2022-01-26 14:18:43.394 | DEBUG    | __main__:trials:24 - Trial = 28158/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.396 | DEBUG    | __main__:trials:29 - Trial = 28158/30000 | Total reward = 27.70
2022-01-26 14:18:43.400 | DEBUG    | __main__:trials:24 - Trial = 28159/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.401 | DEBUG    | __main__:trials:29 - Trial = 28159/30000 | Total reward = 49.68
2022-01-26 14:18:43.405 | DEBUG    | __main__:trials:24 - Trial = 28160/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.406 | DEBUG    | __main__:trials:29 - Trial = 28160/30000 | Total reward = 36.71
2022-01-26 14:18:43.409 | DEBUG    | __main__:trials:24 - Trial = 28161/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.411 | DEBUG    | __main__:trials:29 - Trial = 28161/30000 | Total reward = 36.01
2022-01-26 14:18:43.414 | DEBUG    | __main__:trials:26 - Trial = 28162/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.416 | DEBUG    | __main__:trials:29 - Trial = 28162/30000 | Total reward = 26.94
2022-01-26 14:18:43.419 | DEBUG    | __main__:trials:24 - Trial = 28163/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.421 | DEBUG    | __main__:trials:29 - Trial = 28163/30000 | Total reward = 46.54
2022-01-26 14:18:43.424 | DEBUG    | __main__:trials:24 - Trial = 28164/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.426 | DEBUG    | __main__:trials:29 - Trial = 28164/30000 | Total reward = 50.84
2022-01-26 14:18:43.429 | DEBUG    | __main__:trials:24 - Trial = 28165/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.430 | DEBUG    | __main__:trials:29 - Trial = 28165/30000 | Total reward = 35.60
2022-01-26 14:18:43.433 | DEBUG    | __main__:trials:24 - Trial = 28166/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.434 | DEBUG    | __main__:trials:29 - Trial = 28166/30000 | Total reward = 45.96
2022-01-26 14:18:43.437 | DEBUG    | __main__:trials:24 - Trial = 28167/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.438 | DEBUG    | __main__:trials:29 - Trial = 28167/30000 | Total reward = 50.40
2022-01-26 14:18:43.442 | DEBUG    | __main__:trials:24 - Trial = 28168/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.443 | DEBUG    | __main__:trials:29 - Trial = 28168/30000 | Total reward = 31.45
2022-01-26 14:18:43.447 | DEBUG    | __main__:trials:24 - Trial = 28169/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.447 | DEBUG    | __main__:trials:29 - Trial = 28169/30000 | Total reward = 38.70
2022-01-26 14:18:43.451 | DEBUG    | __main__:trials:26 - Trial = 28170/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.453 | DEBUG    | __main__:trials:29 - Trial = 28170/30000 | Total reward = 33.84
2022-01-26 14:18:43.456 | DEBUG    | __main__:trials:24 - Trial = 28171/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.458 | DEBUG    | __main__:trials:29 - Trial = 28171/30000 | Total reward = 45.21
2022-01-26 14:18:43.460 | DEBUG    | __main__:trials:26 - Trial = 28172/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.462 | DEBUG    | __main__:trials:29 - Trial = 28172/30000 | Total reward = 23.04
2022-01-26 14:18:43.466 | DEBUG    | __main__:trials:24 - Trial = 28173/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.467 | DEBUG    | __main__:trials:29 - Trial = 28173/30000 | Total reward = 45.71
2022-01-26 14:18:43.471 | DEBUG    | __main__:trials:24 - Trial = 28174/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.473 | DEBUG    | __main__:trials:29 - Trial = 28174/30000 | Total reward = 41.76
2022-01-26 14:18:43.476 | DEBUG    | __main__:trials:24 - Trial = 28175/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.478 | DEBUG    | __main__:trials:29 - Trial = 28175/30000 | Total reward = 35.77
2022-01-26 14:18:43.481 | DEBUG    | __main__:trials:24 - Trial = 28176/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.483 | DEBUG    | __main__:trials:29 - Trial = 28176/30000 | Total reward = 45.87
2022-01-26 14:18:43.487 | DEBUG    | __main__:trials:24 - Trial = 28177/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.488 | DEBUG    | __main__:trials:29 - Trial = 28177/30000 | Total reward = 43.43
2022-01-26 14:18:43.492 | DEBUG    | __main__:trials:24 - Trial = 28178/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.494 | DEBUG    | __main__:trials:29 - Trial = 28178/30000 | Total reward = 47.66
2022-01-26 14:18:43.497 | DEBUG    | __main__:trials:24 - Trial = 28179/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.499 | DEBUG    | __main__:trials:29 - Trial = 28179/30000 | Total reward = 45.60
2022-01-26 14:18:43.502 | DEBUG    | __main__:trials:24 - Trial = 28180/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.504 | DEBUG    | __main__:trials:29 - Trial = 28180/30000 | Total reward = 45.95
2022-01-26 14:18:43.507 | DEBUG    | __main__:trials:24 - Trial = 28181/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.509 | DEBUG    | __main__:trials:29 - Trial = 28181/30000 | Total reward = 45.87
2022-01-26 14:18:43.512 | DEBUG    | __main__:trials:24 - Trial = 28182/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.513 | DEBUG    | __main__:trials:29 - Trial = 28182/30000 | Total reward = 39.53
2022-01-26 14:18:43.516 | DEBUG    | __main__:trials:24 - Trial = 28183/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.518 | DEBUG    | __main__:trials:29 - Trial = 28183/30000 | Total reward = 32.31
2022-01-26 14:18:43.521 | DEBUG    | __main__:trials:26 - Trial = 28184/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.523 | DEBUG    | __main__:trials:29 - Trial = 28184/30000 | Total reward = 22.32
2022-01-26 14:18:43.526 | DEBUG    | __main__:trials:24 - Trial = 28185/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.527 | DEBUG    | __main__:trials:29 - Trial = 28185/30000 | Total reward = 45.48
2022-01-26 14:18:43.530 | DEBUG    | __main__:trials:24 - Trial = 28186/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.532 | DEBUG    | __main__:trials:29 - Trial = 28186/30000 | Total reward = 38.98
2022-01-26 14:18:43.534 | DEBUG    | __main__:trials:26 - Trial = 28187/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.536 | DEBUG    | __main__:trials:29 - Trial = 28187/30000 | Total reward = 13.00
2022-01-26 14:18:43.540 | DEBUG    | __main__:trials:24 - Trial = 28188/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.542 | DEBUG    | __main__:trials:29 - Trial = 28188/30000 | Total reward = 45.54
2022-01-26 14:18:43.545 | DEBUG    | __main__:trials:24 - Trial = 28189/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.546 | DEBUG    | __main__:trials:29 - Trial = 28189/30000 | Total reward = 38.77
2022-01-26 14:18:43.550 | DEBUG    | __main__:trials:24 - Trial = 28190/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.552 | DEBUG    | __main__:trials:29 - Trial = 28190/30000 | Total reward = 25.59
2022-01-26 14:18:43.555 | DEBUG    | __main__:trials:26 - Trial = 28191/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.557 | DEBUG    | __main__:trials:29 - Trial = 28191/30000 | Total reward = 23.32
2022-01-26 14:18:43.560 | DEBUG    | __main__:trials:26 - Trial = 28192/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.562 | DEBUG    | __main__:trials:29 - Trial = 28192/30000 | Total reward = 19.31
2022-01-26 14:18:43.566 | DEBUG    | __main__:trials:24 - Trial = 28193/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.567 | DEBUG    | __main__:trials:29 - Trial = 28193/30000 | Total reward = 38.24
2022-01-26 14:18:43.571 | DEBUG    | __main__:trials:24 - Trial = 28194/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.573 | DEBUG    | __main__:trials:29 - Trial = 28194/30000 | Total reward = 27.78
2022-01-26 14:18:43.577 | DEBUG    | __main__:trials:24 - Trial = 28195/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.578 | DEBUG    | __main__:trials:29 - Trial = 28195/30000 | Total reward = 47.53
2022-01-26 14:18:43.582 | DEBUG    | __main__:trials:24 - Trial = 28196/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.584 | DEBUG    | __main__:trials:29 - Trial = 28196/30000 | Total reward = 50.02
2022-01-26 14:18:43.587 | DEBUG    | __main__:trials:24 - Trial = 28197/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.589 | DEBUG    | __main__:trials:29 - Trial = 28197/30000 | Total reward = 30.59
2022-01-26 14:18:43.592 | DEBUG    | __main__:trials:24 - Trial = 28198/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.594 | DEBUG    | __main__:trials:29 - Trial = 28198/30000 | Total reward = 41.14
2022-01-26 14:18:43.598 | DEBUG    | __main__:trials:24 - Trial = 28199/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.599 | DEBUG    | __main__:trials:29 - Trial = 28199/30000 | Total reward = 50.28
2022-01-26 14:18:43.603 | DEBUG    | __main__:trials:24 - Trial = 28200/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.604 | DEBUG    | __main__:trials:29 - Trial = 28200/30000 | Total reward = 44.11
2022-01-26 14:18:43.608 | DEBUG    | __main__:trials:24 - Trial = 28201/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.610 | DEBUG    | __main__:trials:29 - Trial = 28201/30000 | Total reward = 47.20
2022-01-26 14:18:43.614 | DEBUG    | __main__:trials:24 - Trial = 28202/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.615 | DEBUG    | __main__:trials:29 - Trial = 28202/30000 | Total reward = 34.43
2022-01-26 14:18:43.619 | DEBUG    | __main__:trials:24 - Trial = 28203/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.619 | DEBUG    | __main__:trials:29 - Trial = 28203/30000 | Total reward = 47.20
2022-01-26 14:18:43.624 | DEBUG    | __main__:trials:24 - Trial = 28204/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.625 | DEBUG    | __main__:trials:29 - Trial = 28204/30000 | Total reward = 44.59
2022-01-26 14:18:43.629 | DEBUG    | __main__:trials:24 - Trial = 28205/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.630 | DEBUG    | __main__:trials:29 - Trial = 28205/30000 | Total reward = 46.81
2022-01-26 14:18:43.634 | DEBUG    | __main__:trials:24 - Trial = 28206/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.634 | DEBUG    | __main__:trials:29 - Trial = 28206/30000 | Total reward = 47.20
2022-01-26 14:18:43.638 | DEBUG    | __main__:trials:24 - Trial = 28207/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.641 | DEBUG    | __main__:trials:29 - Trial = 28207/30000 | Total reward = 38.71
2022-01-26 14:18:43.643 | DEBUG    | __main__:trials:24 - Trial = 28208/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.645 | DEBUG    | __main__:trials:29 - Trial = 28208/30000 | Total reward = 35.95
2022-01-26 14:18:43.648 | DEBUG    | __main__:trials:24 - Trial = 28209/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.649 | DEBUG    | __main__:trials:29 - Trial = 28209/30000 | Total reward = 41.04
2022-01-26 14:18:43.652 | DEBUG    | __main__:trials:24 - Trial = 28210/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.654 | DEBUG    | __main__:trials:29 - Trial = 28210/30000 | Total reward = 42.11
2022-01-26 14:18:43.657 | DEBUG    | __main__:trials:24 - Trial = 28211/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.658 | DEBUG    | __main__:trials:29 - Trial = 28211/30000 | Total reward = 38.53
2022-01-26 14:18:43.663 | DEBUG    | __main__:trials:24 - Trial = 28212/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.664 | DEBUG    | __main__:trials:29 - Trial = 28212/30000 | Total reward = 36.09
2022-01-26 14:18:43.667 | DEBUG    | __main__:trials:24 - Trial = 28213/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.669 | DEBUG    | __main__:trials:29 - Trial = 28213/30000 | Total reward = 47.20
2022-01-26 14:18:43.673 | DEBUG    | __main__:trials:24 - Trial = 28214/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.675 | DEBUG    | __main__:trials:29 - Trial = 28214/30000 | Total reward = 34.39
2022-01-26 14:18:43.678 | DEBUG    | __main__:trials:24 - Trial = 28215/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.680 | DEBUG    | __main__:trials:29 - Trial = 28215/30000 | Total reward = 39.61
2022-01-26 14:18:43.684 | DEBUG    | __main__:trials:24 - Trial = 28216/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.685 | DEBUG    | __main__:trials:29 - Trial = 28216/30000 | Total reward = 42.90
2022-01-26 14:18:43.689 | DEBUG    | __main__:trials:24 - Trial = 28217/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.691 | DEBUG    | __main__:trials:29 - Trial = 28217/30000 | Total reward = 36.19
2022-01-26 14:18:43.694 | DEBUG    | __main__:trials:26 - Trial = 28218/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.694 | DEBUG    | __main__:trials:29 - Trial = 28218/30000 | Total reward = 16.69
2022-01-26 14:18:43.698 | DEBUG    | __main__:trials:24 - Trial = 28219/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.700 | DEBUG    | __main__:trials:29 - Trial = 28219/30000 | Total reward = 50.84
2022-01-26 14:18:43.703 | DEBUG    | __main__:trials:24 - Trial = 28220/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.704 | DEBUG    | __main__:trials:29 - Trial = 28220/30000 | Total reward = 45.66
2022-01-26 14:18:43.708 | DEBUG    | __main__:trials:24 - Trial = 28221/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.710 | DEBUG    | __main__:trials:29 - Trial = 28221/30000 | Total reward = 42.64
2022-01-26 14:18:43.713 | DEBUG    | __main__:trials:24 - Trial = 28222/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.715 | DEBUG    | __main__:trials:29 - Trial = 28222/30000 | Total reward = 37.36
2022-01-26 14:18:43.719 | DEBUG    | __main__:trials:24 - Trial = 28223/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.720 | DEBUG    | __main__:trials:29 - Trial = 28223/30000 | Total reward = 29.15
2022-01-26 14:18:43.723 | DEBUG    | __main__:trials:24 - Trial = 28224/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.725 | DEBUG    | __main__:trials:29 - Trial = 28224/30000 | Total reward = 47.47
2022-01-26 14:18:43.729 | DEBUG    | __main__:trials:24 - Trial = 28225/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.731 | DEBUG    | __main__:trials:29 - Trial = 28225/30000 | Total reward = 42.46
2022-01-26 14:18:43.735 | DEBUG    | __main__:trials:24 - Trial = 28226/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.736 | DEBUG    | __main__:trials:29 - Trial = 28226/30000 | Total reward = 39.05
2022-01-26 14:18:43.740 | DEBUG    | __main__:trials:24 - Trial = 28227/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.741 | DEBUG    | __main__:trials:29 - Trial = 28227/30000 | Total reward = 46.83
2022-01-26 14:18:43.745 | DEBUG    | __main__:trials:24 - Trial = 28228/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.747 | DEBUG    | __main__:trials:29 - Trial = 28228/30000 | Total reward = 51.97
2022-01-26 14:18:43.750 | DEBUG    | __main__:trials:24 - Trial = 28229/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.752 | DEBUG    | __main__:trials:29 - Trial = 28229/30000 | Total reward = 46.64
2022-01-26 14:18:43.756 | DEBUG    | __main__:trials:24 - Trial = 28230/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.757 | DEBUG    | __main__:trials:29 - Trial = 28230/30000 | Total reward = 45.16
2022-01-26 14:18:43.761 | DEBUG    | __main__:trials:24 - Trial = 28231/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.761 | DEBUG    | __main__:trials:29 - Trial = 28231/30000 | Total reward = 26.17
2022-01-26 14:18:43.764 | DEBUG    | __main__:trials:24 - Trial = 28232/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.766 | DEBUG    | __main__:trials:29 - Trial = 28232/30000 | Total reward = 47.61
2022-01-26 14:18:43.770 | DEBUG    | __main__:trials:24 - Trial = 28233/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.771 | DEBUG    | __main__:trials:29 - Trial = 28233/30000 | Total reward = 45.68
2022-01-26 14:18:43.775 | DEBUG    | __main__:trials:24 - Trial = 28234/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.776 | DEBUG    | __main__:trials:29 - Trial = 28234/30000 | Total reward = 48.55
2022-01-26 14:18:43.783 | DEBUG    | __main__:trials:24 - Trial = 28235/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.785 | DEBUG    | __main__:trials:29 - Trial = 28235/30000 | Total reward = 41.27
2022-01-26 14:18:43.788 | DEBUG    | __main__:trials:24 - Trial = 28236/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.790 | DEBUG    | __main__:trials:29 - Trial = 28236/30000 | Total reward = 42.07
2022-01-26 14:18:43.794 | DEBUG    | __main__:trials:24 - Trial = 28237/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.795 | DEBUG    | __main__:trials:29 - Trial = 28237/30000 | Total reward = 46.21
2022-01-26 14:18:43.798 | DEBUG    | __main__:trials:24 - Trial = 28238/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.800 | DEBUG    | __main__:trials:29 - Trial = 28238/30000 | Total reward = 45.79
2022-01-26 14:18:43.804 | DEBUG    | __main__:trials:24 - Trial = 28239/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.805 | DEBUG    | __main__:trials:29 - Trial = 28239/30000 | Total reward = 34.53
2022-01-26 14:18:43.809 | DEBUG    | __main__:trials:24 - Trial = 28240/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.810 | DEBUG    | __main__:trials:29 - Trial = 28240/30000 | Total reward = 28.21
2022-01-26 14:18:43.814 | DEBUG    | __main__:trials:24 - Trial = 28241/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.814 | DEBUG    | __main__:trials:29 - Trial = 28241/30000 | Total reward = 34.00
2022-01-26 14:18:43.818 | DEBUG    | __main__:trials:24 - Trial = 28242/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.820 | DEBUG    | __main__:trials:29 - Trial = 28242/30000 | Total reward = 47.34
2022-01-26 14:18:43.824 | DEBUG    | __main__:trials:24 - Trial = 28243/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.825 | DEBUG    | __main__:trials:29 - Trial = 28243/30000 | Total reward = 48.30
2022-01-26 14:18:43.829 | DEBUG    | __main__:trials:24 - Trial = 28244/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.831 | DEBUG    | __main__:trials:29 - Trial = 28244/30000 | Total reward = 51.11
2022-01-26 14:18:43.834 | DEBUG    | __main__:trials:24 - Trial = 28245/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.836 | DEBUG    | __main__:trials:29 - Trial = 28245/30000 | Total reward = 27.31
2022-01-26 14:18:43.839 | DEBUG    | __main__:trials:24 - Trial = 28246/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.841 | DEBUG    | __main__:trials:29 - Trial = 28246/30000 | Total reward = 53.52
2022-01-26 14:18:43.844 | DEBUG    | __main__:trials:24 - Trial = 28247/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.846 | DEBUG    | __main__:trials:29 - Trial = 28247/30000 | Total reward = 42.01
2022-01-26 14:18:43.849 | DEBUG    | __main__:trials:24 - Trial = 28248/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.851 | DEBUG    | __main__:trials:29 - Trial = 28248/30000 | Total reward = 44.24
2022-01-26 14:18:43.855 | DEBUG    | __main__:trials:24 - Trial = 28249/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.857 | DEBUG    | __main__:trials:29 - Trial = 28249/30000 | Total reward = 35.94
2022-01-26 14:18:43.860 | DEBUG    | __main__:trials:24 - Trial = 28250/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.862 | DEBUG    | __main__:trials:29 - Trial = 28250/30000 | Total reward = 43.86
2022-01-26 14:18:43.866 | DEBUG    | __main__:trials:24 - Trial = 28251/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.867 | DEBUG    | __main__:trials:29 - Trial = 28251/30000 | Total reward = 42.18
2022-01-26 14:18:43.870 | DEBUG    | __main__:trials:26 - Trial = 28252/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.871 | DEBUG    | __main__:trials:29 - Trial = 28252/30000 | Total reward = 11.69
2022-01-26 14:18:43.875 | DEBUG    | __main__:trials:24 - Trial = 28253/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.877 | DEBUG    | __main__:trials:29 - Trial = 28253/30000 | Total reward = 26.66
2022-01-26 14:18:43.880 | DEBUG    | __main__:trials:24 - Trial = 28254/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.882 | DEBUG    | __main__:trials:29 - Trial = 28254/30000 | Total reward = 50.49
2022-01-26 14:18:43.886 | DEBUG    | __main__:trials:24 - Trial = 28255/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.887 | DEBUG    | __main__:trials:29 - Trial = 28255/30000 | Total reward = 46.05
2022-01-26 14:18:43.891 | DEBUG    | __main__:trials:24 - Trial = 28256/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.892 | DEBUG    | __main__:trials:29 - Trial = 28256/30000 | Total reward = 41.26
2022-01-26 14:18:43.896 | DEBUG    | __main__:trials:24 - Trial = 28257/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.898 | DEBUG    | __main__:trials:29 - Trial = 28257/30000 | Total reward = 44.89
2022-01-26 14:18:43.901 | DEBUG    | __main__:trials:24 - Trial = 28258/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.903 | DEBUG    | __main__:trials:29 - Trial = 28258/30000 | Total reward = 48.95
2022-01-26 14:18:43.906 | DEBUG    | __main__:trials:26 - Trial = 28259/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.908 | DEBUG    | __main__:trials:29 - Trial = 28259/30000 | Total reward = 27.28
2022-01-26 14:18:43.911 | DEBUG    | __main__:trials:26 - Trial = 28260/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.913 | DEBUG    | __main__:trials:29 - Trial = 28260/30000 | Total reward = 28.37
2022-01-26 14:18:43.916 | DEBUG    | __main__:trials:24 - Trial = 28261/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.918 | DEBUG    | __main__:trials:29 - Trial = 28261/30000 | Total reward = 46.85
2022-01-26 14:18:43.921 | DEBUG    | __main__:trials:24 - Trial = 28262/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.923 | DEBUG    | __main__:trials:29 - Trial = 28262/30000 | Total reward = 34.84
2022-01-26 14:18:43.927 | DEBUG    | __main__:trials:24 - Trial = 28263/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.928 | DEBUG    | __main__:trials:29 - Trial = 28263/30000 | Total reward = 38.24
2022-01-26 14:18:43.931 | DEBUG    | __main__:trials:26 - Trial = 28264/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.933 | DEBUG    | __main__:trials:29 - Trial = 28264/30000 | Total reward = 15.40
2022-01-26 14:18:43.936 | DEBUG    | __main__:trials:24 - Trial = 28265/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.938 | DEBUG    | __main__:trials:29 - Trial = 28265/30000 | Total reward = 47.18
2022-01-26 14:18:43.941 | DEBUG    | __main__:trials:24 - Trial = 28266/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.943 | DEBUG    | __main__:trials:29 - Trial = 28266/30000 | Total reward = 38.37
2022-01-26 14:18:43.946 | DEBUG    | __main__:trials:24 - Trial = 28267/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.948 | DEBUG    | __main__:trials:29 - Trial = 28267/30000 | Total reward = 42.46
2022-01-26 14:18:43.952 | DEBUG    | __main__:trials:24 - Trial = 28268/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.953 | DEBUG    | __main__:trials:29 - Trial = 28268/30000 | Total reward = 42.10
2022-01-26 14:18:43.956 | DEBUG    | __main__:trials:24 - Trial = 28269/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.958 | DEBUG    | __main__:trials:29 - Trial = 28269/30000 | Total reward = 35.14
2022-01-26 14:18:43.961 | DEBUG    | __main__:trials:24 - Trial = 28270/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.962 | DEBUG    | __main__:trials:29 - Trial = 28270/30000 | Total reward = 47.94
2022-01-26 14:18:43.965 | DEBUG    | __main__:trials:24 - Trial = 28271/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.966 | DEBUG    | __main__:trials:29 - Trial = 28271/30000 | Total reward = 37.50
2022-01-26 14:18:43.970 | DEBUG    | __main__:trials:24 - Trial = 28272/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.971 | DEBUG    | __main__:trials:29 - Trial = 28272/30000 | Total reward = 45.41
2022-01-26 14:18:43.975 | DEBUG    | __main__:trials:24 - Trial = 28273/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.975 | DEBUG    | __main__:trials:29 - Trial = 28273/30000 | Total reward = 47.32
2022-01-26 14:18:43.980 | DEBUG    | __main__:trials:24 - Trial = 28274/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.981 | DEBUG    | __main__:trials:29 - Trial = 28274/30000 | Total reward = 24.11
2022-01-26 14:18:43.985 | DEBUG    | __main__:trials:24 - Trial = 28275/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.987 | DEBUG    | __main__:trials:29 - Trial = 28275/30000 | Total reward = 44.53
2022-01-26 14:18:43.991 | DEBUG    | __main__:trials:24 - Trial = 28276/30000 | Max number of steps (20) reached
2022-01-26 14:18:43.992 | DEBUG    | __main__:trials:29 - Trial = 28276/30000 | Total reward = 51.96
2022-01-26 14:18:43.995 | DEBUG    | __main__:trials:26 - Trial = 28277/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:43.996 | DEBUG    | __main__:trials:29 - Trial = 28277/30000 | Total reward = 9.12
2022-01-26 14:18:44.000 | DEBUG    | __main__:trials:24 - Trial = 28278/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.000 | DEBUG    | __main__:trials:29 - Trial = 28278/30000 | Total reward = 41.97
2022-01-26 14:18:44.004 | DEBUG    | __main__:trials:24 - Trial = 28279/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.005 | DEBUG    | __main__:trials:29 - Trial = 28279/30000 | Total reward = 39.38
2022-01-26 14:18:44.009 | DEBUG    | __main__:trials:24 - Trial = 28280/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.009 | DEBUG    | __main__:trials:29 - Trial = 28280/30000 | Total reward = 48.77
2022-01-26 14:18:44.013 | DEBUG    | __main__:trials:24 - Trial = 28281/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.014 | DEBUG    | __main__:trials:29 - Trial = 28281/30000 | Total reward = 30.19
2022-01-26 14:18:44.018 | DEBUG    | __main__:trials:24 - Trial = 28282/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.019 | DEBUG    | __main__:trials:29 - Trial = 28282/30000 | Total reward = 42.96
2022-01-26 14:18:44.022 | DEBUG    | __main__:trials:24 - Trial = 28283/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.024 | DEBUG    | __main__:trials:29 - Trial = 28283/30000 | Total reward = 44.40
2022-01-26 14:18:44.028 | DEBUG    | __main__:trials:24 - Trial = 28284/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.029 | DEBUG    | __main__:trials:29 - Trial = 28284/30000 | Total reward = 31.71
2022-01-26 14:18:44.033 | DEBUG    | __main__:trials:24 - Trial = 28285/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.034 | DEBUG    | __main__:trials:29 - Trial = 28285/30000 | Total reward = 37.97
2022-01-26 14:18:44.038 | DEBUG    | __main__:trials:24 - Trial = 28286/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.040 | DEBUG    | __main__:trials:29 - Trial = 28286/30000 | Total reward = 39.85
2022-01-26 14:18:44.043 | DEBUG    | __main__:trials:24 - Trial = 28287/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.044 | DEBUG    | __main__:trials:29 - Trial = 28287/30000 | Total reward = 35.89
2022-01-26 14:18:44.048 | DEBUG    | __main__:trials:24 - Trial = 28288/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.050 | DEBUG    | __main__:trials:29 - Trial = 28288/30000 | Total reward = 17.99
2022-01-26 14:18:44.053 | DEBUG    | __main__:trials:24 - Trial = 28289/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.055 | DEBUG    | __main__:trials:29 - Trial = 28289/30000 | Total reward = 45.41
2022-01-26 14:18:44.059 | DEBUG    | __main__:trials:24 - Trial = 28290/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.060 | DEBUG    | __main__:trials:29 - Trial = 28290/30000 | Total reward = 42.01
2022-01-26 14:18:44.064 | DEBUG    | __main__:trials:24 - Trial = 28291/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.065 | DEBUG    | __main__:trials:29 - Trial = 28291/30000 | Total reward = 29.30
2022-01-26 14:18:44.069 | DEBUG    | __main__:trials:24 - Trial = 28292/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.071 | DEBUG    | __main__:trials:29 - Trial = 28292/30000 | Total reward = 52.61
2022-01-26 14:18:44.074 | DEBUG    | __main__:trials:24 - Trial = 28293/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.076 | DEBUG    | __main__:trials:29 - Trial = 28293/30000 | Total reward = 40.14
2022-01-26 14:18:44.079 | DEBUG    | __main__:trials:24 - Trial = 28294/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.080 | DEBUG    | __main__:trials:29 - Trial = 28294/30000 | Total reward = 43.29
2022-01-26 14:18:44.084 | DEBUG    | __main__:trials:24 - Trial = 28295/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.086 | DEBUG    | __main__:trials:29 - Trial = 28295/30000 | Total reward = 41.64
2022-01-26 14:18:44.089 | DEBUG    | __main__:trials:24 - Trial = 28296/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.091 | DEBUG    | __main__:trials:29 - Trial = 28296/30000 | Total reward = 45.86
2022-01-26 14:18:44.094 | DEBUG    | __main__:trials:24 - Trial = 28297/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.096 | DEBUG    | __main__:trials:29 - Trial = 28297/30000 | Total reward = 30.39
2022-01-26 14:18:44.099 | DEBUG    | __main__:trials:24 - Trial = 28298/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.101 | DEBUG    | __main__:trials:29 - Trial = 28298/30000 | Total reward = 51.16
2022-01-26 14:18:44.104 | DEBUG    | __main__:trials:24 - Trial = 28299/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.105 | DEBUG    | __main__:trials:29 - Trial = 28299/30000 | Total reward = 41.49
2022-01-26 14:18:44.109 | DEBUG    | __main__:trials:24 - Trial = 28300/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.109 | DEBUG    | __main__:trials:29 - Trial = 28300/30000 | Total reward = 22.98
2022-01-26 14:18:44.112 | DEBUG    | __main__:trials:26 - Trial = 28301/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.113 | DEBUG    | __main__:trials:29 - Trial = 28301/30000 | Total reward = 34.61
2022-01-26 14:18:44.116 | DEBUG    | __main__:trials:24 - Trial = 28302/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.118 | DEBUG    | __main__:trials:29 - Trial = 28302/30000 | Total reward = 48.06
2022-01-26 14:18:44.121 | DEBUG    | __main__:trials:26 - Trial = 28303/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.123 | DEBUG    | __main__:trials:29 - Trial = 28303/30000 | Total reward = 34.61
2022-01-26 14:18:44.126 | DEBUG    | __main__:trials:24 - Trial = 28304/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.128 | DEBUG    | __main__:trials:29 - Trial = 28304/30000 | Total reward = 47.20
2022-01-26 14:18:44.131 | DEBUG    | __main__:trials:24 - Trial = 28305/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.133 | DEBUG    | __main__:trials:29 - Trial = 28305/30000 | Total reward = 47.20
2022-01-26 14:18:44.135 | DEBUG    | __main__:trials:26 - Trial = 28306/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.136 | DEBUG    | __main__:trials:29 - Trial = 28306/30000 | Total reward = 10.89
2022-01-26 14:18:44.140 | DEBUG    | __main__:trials:24 - Trial = 28307/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.141 | DEBUG    | __main__:trials:29 - Trial = 28307/30000 | Total reward = 30.99
2022-01-26 14:18:44.144 | DEBUG    | __main__:trials:24 - Trial = 28308/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.146 | DEBUG    | __main__:trials:29 - Trial = 28308/30000 | Total reward = 41.13
2022-01-26 14:18:44.150 | DEBUG    | __main__:trials:24 - Trial = 28309/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.151 | DEBUG    | __main__:trials:29 - Trial = 28309/30000 | Total reward = 42.76
2022-01-26 14:18:44.155 | DEBUG    | __main__:trials:24 - Trial = 28310/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.157 | DEBUG    | __main__:trials:29 - Trial = 28310/30000 | Total reward = 40.95
2022-01-26 14:18:44.161 | DEBUG    | __main__:trials:24 - Trial = 28311/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.161 | DEBUG    | __main__:trials:29 - Trial = 28311/30000 | Total reward = 51.10
2022-01-26 14:18:44.165 | DEBUG    | __main__:trials:24 - Trial = 28312/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.165 | DEBUG    | __main__:trials:29 - Trial = 28312/30000 | Total reward = 44.94
2022-01-26 14:18:44.168 | DEBUG    | __main__:trials:24 - Trial = 28313/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.169 | DEBUG    | __main__:trials:29 - Trial = 28313/30000 | Total reward = 48.87
2022-01-26 14:18:44.172 | DEBUG    | __main__:trials:24 - Trial = 28314/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.173 | DEBUG    | __main__:trials:29 - Trial = 28314/30000 | Total reward = 52.63
2022-01-26 14:18:44.177 | DEBUG    | __main__:trials:24 - Trial = 28315/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.178 | DEBUG    | __main__:trials:29 - Trial = 28315/30000 | Total reward = 44.11
2022-01-26 14:18:44.182 | DEBUG    | __main__:trials:24 - Trial = 28316/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.183 | DEBUG    | __main__:trials:29 - Trial = 28316/30000 | Total reward = 45.94
2022-01-26 14:18:44.186 | DEBUG    | __main__:trials:24 - Trial = 28317/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.188 | DEBUG    | __main__:trials:29 - Trial = 28317/30000 | Total reward = 45.79
2022-01-26 14:18:44.192 | DEBUG    | __main__:trials:26 - Trial = 28318/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.193 | DEBUG    | __main__:trials:29 - Trial = 28318/30000 | Total reward = 19.73
2022-01-26 14:18:44.197 | DEBUG    | __main__:trials:24 - Trial = 28319/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.199 | DEBUG    | __main__:trials:29 - Trial = 28319/30000 | Total reward = 45.89
2022-01-26 14:18:44.203 | DEBUG    | __main__:trials:24 - Trial = 28320/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.205 | DEBUG    | __main__:trials:29 - Trial = 28320/30000 | Total reward = 44.89
2022-01-26 14:18:44.208 | DEBUG    | __main__:trials:24 - Trial = 28321/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.210 | DEBUG    | __main__:trials:29 - Trial = 28321/30000 | Total reward = 33.39
2022-01-26 14:18:44.214 | DEBUG    | __main__:trials:24 - Trial = 28322/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.215 | DEBUG    | __main__:trials:29 - Trial = 28322/30000 | Total reward = 54.27
2022-01-26 14:18:44.219 | DEBUG    | __main__:trials:24 - Trial = 28323/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.221 | DEBUG    | __main__:trials:29 - Trial = 28323/30000 | Total reward = 46.58
2022-01-26 14:18:44.224 | DEBUG    | __main__:trials:24 - Trial = 28324/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.226 | DEBUG    | __main__:trials:29 - Trial = 28324/30000 | Total reward = 45.59
2022-01-26 14:18:44.229 | DEBUG    | __main__:trials:26 - Trial = 28325/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.230 | DEBUG    | __main__:trials:29 - Trial = 28325/30000 | Total reward = 27.85
2022-01-26 14:18:44.233 | DEBUG    | __main__:trials:24 - Trial = 28326/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.234 | DEBUG    | __main__:trials:29 - Trial = 28326/30000 | Total reward = 23.21
2022-01-26 14:18:44.237 | DEBUG    | __main__:trials:24 - Trial = 28327/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.238 | DEBUG    | __main__:trials:29 - Trial = 28327/30000 | Total reward = 46.19
2022-01-26 14:18:44.241 | DEBUG    | __main__:trials:24 - Trial = 28328/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.243 | DEBUG    | __main__:trials:29 - Trial = 28328/30000 | Total reward = 45.94
2022-01-26 14:18:44.246 | DEBUG    | __main__:trials:24 - Trial = 28329/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.248 | DEBUG    | __main__:trials:29 - Trial = 28329/30000 | Total reward = 39.08
2022-01-26 14:18:44.252 | DEBUG    | __main__:trials:24 - Trial = 28330/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.252 | DEBUG    | __main__:trials:29 - Trial = 28330/30000 | Total reward = 57.17
2022-01-26 14:18:44.256 | DEBUG    | __main__:trials:24 - Trial = 28331/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.258 | DEBUG    | __main__:trials:29 - Trial = 28331/30000 | Total reward = 51.00
2022-01-26 14:18:44.262 | DEBUG    | __main__:trials:24 - Trial = 28332/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.263 | DEBUG    | __main__:trials:29 - Trial = 28332/30000 | Total reward = 32.19
2022-01-26 14:18:44.267 | DEBUG    | __main__:trials:24 - Trial = 28333/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.268 | DEBUG    | __main__:trials:29 - Trial = 28333/30000 | Total reward = 39.85
2022-01-26 14:18:44.272 | DEBUG    | __main__:trials:24 - Trial = 28334/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.274 | DEBUG    | __main__:trials:29 - Trial = 28334/30000 | Total reward = 28.77
2022-01-26 14:18:44.278 | DEBUG    | __main__:trials:24 - Trial = 28335/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.280 | DEBUG    | __main__:trials:29 - Trial = 28335/30000 | Total reward = 32.65
2022-01-26 14:18:44.283 | DEBUG    | __main__:trials:24 - Trial = 28336/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.285 | DEBUG    | __main__:trials:29 - Trial = 28336/30000 | Total reward = 49.60
2022-01-26 14:18:44.288 | DEBUG    | __main__:trials:24 - Trial = 28337/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.290 | DEBUG    | __main__:trials:29 - Trial = 28337/30000 | Total reward = 42.82
2022-01-26 14:18:44.293 | DEBUG    | __main__:trials:24 - Trial = 28338/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.294 | DEBUG    | __main__:trials:29 - Trial = 28338/30000 | Total reward = 30.99
2022-01-26 14:18:44.297 | DEBUG    | __main__:trials:24 - Trial = 28339/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.299 | DEBUG    | __main__:trials:29 - Trial = 28339/30000 | Total reward = 59.85
2022-01-26 14:18:44.302 | DEBUG    | __main__:trials:24 - Trial = 28340/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.304 | DEBUG    | __main__:trials:29 - Trial = 28340/30000 | Total reward = 45.99
2022-01-26 14:18:44.308 | DEBUG    | __main__:trials:24 - Trial = 28341/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.309 | DEBUG    | __main__:trials:29 - Trial = 28341/30000 | Total reward = 61.09
2022-01-26 14:18:44.312 | DEBUG    | __main__:trials:24 - Trial = 28342/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.314 | DEBUG    | __main__:trials:29 - Trial = 28342/30000 | Total reward = 46.03
2022-01-26 14:18:44.318 | DEBUG    | __main__:trials:24 - Trial = 28343/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.320 | DEBUG    | __main__:trials:29 - Trial = 28343/30000 | Total reward = 26.32
2022-01-26 14:18:44.323 | DEBUG    | __main__:trials:26 - Trial = 28344/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.325 | DEBUG    | __main__:trials:29 - Trial = 28344/30000 | Total reward = 22.02
2022-01-26 14:18:44.328 | DEBUG    | __main__:trials:24 - Trial = 28345/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.330 | DEBUG    | __main__:trials:29 - Trial = 28345/30000 | Total reward = 29.61
2022-01-26 14:18:44.334 | DEBUG    | __main__:trials:24 - Trial = 28346/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.335 | DEBUG    | __main__:trials:29 - Trial = 28346/30000 | Total reward = 54.62
2022-01-26 14:18:44.339 | DEBUG    | __main__:trials:24 - Trial = 28347/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.341 | DEBUG    | __main__:trials:29 - Trial = 28347/30000 | Total reward = 40.77
2022-01-26 14:18:44.344 | DEBUG    | __main__:trials:24 - Trial = 28348/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.345 | DEBUG    | __main__:trials:29 - Trial = 28348/30000 | Total reward = 44.45
2022-01-26 14:18:44.348 | DEBUG    | __main__:trials:24 - Trial = 28349/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.350 | DEBUG    | __main__:trials:29 - Trial = 28349/30000 | Total reward = 43.87
2022-01-26 14:18:44.353 | DEBUG    | __main__:trials:24 - Trial = 28350/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.355 | DEBUG    | __main__:trials:29 - Trial = 28350/30000 | Total reward = 29.17
2022-01-26 14:18:44.359 | DEBUG    | __main__:trials:24 - Trial = 28351/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.360 | DEBUG    | __main__:trials:29 - Trial = 28351/30000 | Total reward = 40.50
2022-01-26 14:18:44.364 | DEBUG    | __main__:trials:24 - Trial = 28352/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.365 | DEBUG    | __main__:trials:29 - Trial = 28352/30000 | Total reward = 26.09
2022-01-26 14:18:44.369 | DEBUG    | __main__:trials:24 - Trial = 28353/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.370 | DEBUG    | __main__:trials:29 - Trial = 28353/30000 | Total reward = 25.77
2022-01-26 14:18:44.373 | DEBUG    | __main__:trials:24 - Trial = 28354/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.374 | DEBUG    | __main__:trials:29 - Trial = 28354/30000 | Total reward = 45.18
2022-01-26 14:18:44.377 | DEBUG    | __main__:trials:24 - Trial = 28355/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.378 | DEBUG    | __main__:trials:29 - Trial = 28355/30000 | Total reward = 27.67
2022-01-26 14:18:44.381 | DEBUG    | __main__:trials:24 - Trial = 28356/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.382 | DEBUG    | __main__:trials:29 - Trial = 28356/30000 | Total reward = 52.46
2022-01-26 14:18:44.385 | DEBUG    | __main__:trials:24 - Trial = 28357/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.387 | DEBUG    | __main__:trials:29 - Trial = 28357/30000 | Total reward = 43.86
2022-01-26 14:18:44.390 | DEBUG    | __main__:trials:24 - Trial = 28358/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.392 | DEBUG    | __main__:trials:29 - Trial = 28358/30000 | Total reward = 42.18
2022-01-26 14:18:44.396 | DEBUG    | __main__:trials:24 - Trial = 28359/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.397 | DEBUG    | __main__:trials:29 - Trial = 28359/30000 | Total reward = 48.69
2022-01-26 14:18:44.400 | DEBUG    | __main__:trials:24 - Trial = 28360/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.402 | DEBUG    | __main__:trials:29 - Trial = 28360/30000 | Total reward = 46.40
2022-01-26 14:18:44.405 | DEBUG    | __main__:trials:24 - Trial = 28361/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.407 | DEBUG    | __main__:trials:29 - Trial = 28361/30000 | Total reward = 45.15
2022-01-26 14:18:44.411 | DEBUG    | __main__:trials:24 - Trial = 28362/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.412 | DEBUG    | __main__:trials:29 - Trial = 28362/30000 | Total reward = 45.76
2022-01-26 14:18:44.415 | DEBUG    | __main__:trials:24 - Trial = 28363/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.417 | DEBUG    | __main__:trials:29 - Trial = 28363/30000 | Total reward = 46.20
2022-01-26 14:18:44.421 | DEBUG    | __main__:trials:24 - Trial = 28364/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.422 | DEBUG    | __main__:trials:29 - Trial = 28364/30000 | Total reward = 39.12
2022-01-26 14:18:44.426 | DEBUG    | __main__:trials:24 - Trial = 28365/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.428 | DEBUG    | __main__:trials:29 - Trial = 28365/30000 | Total reward = 39.26
2022-01-26 14:18:44.432 | DEBUG    | __main__:trials:24 - Trial = 28366/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.433 | DEBUG    | __main__:trials:29 - Trial = 28366/30000 | Total reward = 46.27
2022-01-26 14:18:44.436 | DEBUG    | __main__:trials:24 - Trial = 28367/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.438 | DEBUG    | __main__:trials:29 - Trial = 28367/30000 | Total reward = 39.51
2022-01-26 14:18:44.441 | DEBUG    | __main__:trials:24 - Trial = 28368/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.443 | DEBUG    | __main__:trials:29 - Trial = 28368/30000 | Total reward = 52.06
2022-01-26 14:18:44.447 | DEBUG    | __main__:trials:24 - Trial = 28369/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.448 | DEBUG    | __main__:trials:29 - Trial = 28369/30000 | Total reward = 43.24
2022-01-26 14:18:44.452 | DEBUG    | __main__:trials:24 - Trial = 28370/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.453 | DEBUG    | __main__:trials:29 - Trial = 28370/30000 | Total reward = 37.02
2022-01-26 14:18:44.457 | DEBUG    | __main__:trials:24 - Trial = 28371/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.458 | DEBUG    | __main__:trials:29 - Trial = 28371/30000 | Total reward = 47.13
2022-01-26 14:18:44.462 | DEBUG    | __main__:trials:24 - Trial = 28372/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.463 | DEBUG    | __main__:trials:29 - Trial = 28372/30000 | Total reward = 46.45
2022-01-26 14:18:44.467 | DEBUG    | __main__:trials:24 - Trial = 28373/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.469 | DEBUG    | __main__:trials:29 - Trial = 28373/30000 | Total reward = 46.07
2022-01-26 14:18:44.471 | DEBUG    | __main__:trials:24 - Trial = 28374/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.473 | DEBUG    | __main__:trials:29 - Trial = 28374/30000 | Total reward = 40.64
2022-01-26 14:18:44.477 | DEBUG    | __main__:trials:24 - Trial = 28375/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.478 | DEBUG    | __main__:trials:29 - Trial = 28375/30000 | Total reward = 44.49
2022-01-26 14:18:44.482 | DEBUG    | __main__:trials:24 - Trial = 28376/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.483 | DEBUG    | __main__:trials:29 - Trial = 28376/30000 | Total reward = 32.27
2022-01-26 14:18:44.487 | DEBUG    | __main__:trials:24 - Trial = 28377/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.488 | DEBUG    | __main__:trials:29 - Trial = 28377/30000 | Total reward = 45.53
2022-01-26 14:18:44.492 | DEBUG    | __main__:trials:26 - Trial = 28378/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.492 | DEBUG    | __main__:trials:29 - Trial = 28378/30000 | Total reward = 16.31
2022-01-26 14:18:44.496 | DEBUG    | __main__:trials:24 - Trial = 28379/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.497 | DEBUG    | __main__:trials:29 - Trial = 28379/30000 | Total reward = 39.54
2022-01-26 14:18:44.500 | DEBUG    | __main__:trials:24 - Trial = 28380/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.502 | DEBUG    | __main__:trials:29 - Trial = 28380/30000 | Total reward = 49.16
2022-01-26 14:18:44.506 | DEBUG    | __main__:trials:24 - Trial = 28381/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.507 | DEBUG    | __main__:trials:29 - Trial = 28381/30000 | Total reward = 39.00
2022-01-26 14:18:44.511 | DEBUG    | __main__:trials:24 - Trial = 28382/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.513 | DEBUG    | __main__:trials:29 - Trial = 28382/30000 | Total reward = 43.60
2022-01-26 14:18:44.516 | DEBUG    | __main__:trials:24 - Trial = 28383/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.518 | DEBUG    | __main__:trials:29 - Trial = 28383/30000 | Total reward = 43.36
2022-01-26 14:18:44.522 | DEBUG    | __main__:trials:24 - Trial = 28384/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.523 | DEBUG    | __main__:trials:29 - Trial = 28384/30000 | Total reward = 37.07
2022-01-26 14:18:44.527 | DEBUG    | __main__:trials:26 - Trial = 28385/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.529 | DEBUG    | __main__:trials:29 - Trial = 28385/30000 | Total reward = 27.45
2022-01-26 14:18:44.532 | DEBUG    | __main__:trials:24 - Trial = 28386/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.533 | DEBUG    | __main__:trials:29 - Trial = 28386/30000 | Total reward = 42.22
2022-01-26 14:18:44.536 | DEBUG    | __main__:trials:26 - Trial = 28387/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.537 | DEBUG    | __main__:trials:29 - Trial = 28387/30000 | Total reward = 22.27
2022-01-26 14:18:44.541 | DEBUG    | __main__:trials:24 - Trial = 28388/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.543 | DEBUG    | __main__:trials:29 - Trial = 28388/30000 | Total reward = 43.37
2022-01-26 14:18:44.546 | DEBUG    | __main__:trials:24 - Trial = 28389/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.548 | DEBUG    | __main__:trials:29 - Trial = 28389/30000 | Total reward = 53.35
2022-01-26 14:18:44.552 | DEBUG    | __main__:trials:24 - Trial = 28390/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.553 | DEBUG    | __main__:trials:29 - Trial = 28390/30000 | Total reward = 41.07
2022-01-26 14:18:44.556 | DEBUG    | __main__:trials:24 - Trial = 28391/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.558 | DEBUG    | __main__:trials:29 - Trial = 28391/30000 | Total reward = 45.45
2022-01-26 14:18:44.561 | DEBUG    | __main__:trials:24 - Trial = 28392/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.563 | DEBUG    | __main__:trials:29 - Trial = 28392/30000 | Total reward = 32.77
2022-01-26 14:18:44.567 | DEBUG    | __main__:trials:24 - Trial = 28393/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.568 | DEBUG    | __main__:trials:29 - Trial = 28393/30000 | Total reward = 50.84
2022-01-26 14:18:44.572 | DEBUG    | __main__:trials:24 - Trial = 28394/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.573 | DEBUG    | __main__:trials:29 - Trial = 28394/30000 | Total reward = 26.47
2022-01-26 14:18:44.577 | DEBUG    | __main__:trials:24 - Trial = 28395/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.579 | DEBUG    | __main__:trials:29 - Trial = 28395/30000 | Total reward = 45.25
2022-01-26 14:18:44.582 | DEBUG    | __main__:trials:24 - Trial = 28396/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.584 | DEBUG    | __main__:trials:29 - Trial = 28396/30000 | Total reward = 43.82
2022-01-26 14:18:44.587 | DEBUG    | __main__:trials:24 - Trial = 28397/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.589 | DEBUG    | __main__:trials:29 - Trial = 28397/30000 | Total reward = 30.28
2022-01-26 14:18:44.592 | DEBUG    | __main__:trials:24 - Trial = 28398/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.594 | DEBUG    | __main__:trials:29 - Trial = 28398/30000 | Total reward = 36.62
2022-01-26 14:18:44.598 | DEBUG    | __main__:trials:24 - Trial = 28399/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.598 | DEBUG    | __main__:trials:29 - Trial = 28399/30000 | Total reward = 31.66
2022-01-26 14:18:44.602 | DEBUG    | __main__:trials:24 - Trial = 28400/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.604 | DEBUG    | __main__:trials:29 - Trial = 28400/30000 | Total reward = 37.50
2022-01-26 14:18:44.607 | DEBUG    | __main__:trials:24 - Trial = 28401/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.609 | DEBUG    | __main__:trials:29 - Trial = 28401/30000 | Total reward = 49.76
2022-01-26 14:18:44.612 | DEBUG    | __main__:trials:26 - Trial = 28402/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.613 | DEBUG    | __main__:trials:29 - Trial = 28402/30000 | Total reward = 17.20
2022-01-26 14:18:44.616 | DEBUG    | __main__:trials:24 - Trial = 28403/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.617 | DEBUG    | __main__:trials:29 - Trial = 28403/30000 | Total reward = 39.85
2022-01-26 14:18:44.621 | DEBUG    | __main__:trials:24 - Trial = 28404/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.622 | DEBUG    | __main__:trials:29 - Trial = 28404/30000 | Total reward = 44.83
2022-01-26 14:18:44.625 | DEBUG    | __main__:trials:26 - Trial = 28405/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.626 | DEBUG    | __main__:trials:29 - Trial = 28405/30000 | Total reward = 20.34
2022-01-26 14:18:44.630 | DEBUG    | __main__:trials:24 - Trial = 28406/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.631 | DEBUG    | __main__:trials:29 - Trial = 28406/30000 | Total reward = 36.18
2022-01-26 14:18:44.634 | DEBUG    | __main__:trials:24 - Trial = 28407/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.636 | DEBUG    | __main__:trials:29 - Trial = 28407/30000 | Total reward = 38.03
2022-01-26 14:18:44.640 | DEBUG    | __main__:trials:24 - Trial = 28408/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.642 | DEBUG    | __main__:trials:29 - Trial = 28408/30000 | Total reward = 44.56
2022-01-26 14:18:44.645 | DEBUG    | __main__:trials:24 - Trial = 28409/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.647 | DEBUG    | __main__:trials:29 - Trial = 28409/30000 | Total reward = 46.64
2022-01-26 14:18:44.651 | DEBUG    | __main__:trials:24 - Trial = 28410/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.652 | DEBUG    | __main__:trials:29 - Trial = 28410/30000 | Total reward = 43.40
2022-01-26 14:18:44.656 | DEBUG    | __main__:trials:24 - Trial = 28411/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.658 | DEBUG    | __main__:trials:29 - Trial = 28411/30000 | Total reward = 45.16
2022-01-26 14:18:44.661 | DEBUG    | __main__:trials:24 - Trial = 28412/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.663 | DEBUG    | __main__:trials:29 - Trial = 28412/30000 | Total reward = 35.96
2022-01-26 14:18:44.667 | DEBUG    | __main__:trials:24 - Trial = 28413/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.668 | DEBUG    | __main__:trials:29 - Trial = 28413/30000 | Total reward = 44.01
2022-01-26 14:18:44.671 | DEBUG    | __main__:trials:24 - Trial = 28414/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.673 | DEBUG    | __main__:trials:29 - Trial = 28414/30000 | Total reward = 50.33
2022-01-26 14:18:44.677 | DEBUG    | __main__:trials:24 - Trial = 28415/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.678 | DEBUG    | __main__:trials:29 - Trial = 28415/30000 | Total reward = 41.60
2022-01-26 14:18:44.682 | DEBUG    | __main__:trials:26 - Trial = 28416/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.682 | DEBUG    | __main__:trials:29 - Trial = 28416/30000 | Total reward = 24.13
2022-01-26 14:18:44.687 | DEBUG    | __main__:trials:24 - Trial = 28417/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.687 | DEBUG    | __main__:trials:29 - Trial = 28417/30000 | Total reward = 39.62
2022-01-26 14:18:44.691 | DEBUG    | __main__:trials:26 - Trial = 28418/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.692 | DEBUG    | __main__:trials:29 - Trial = 28418/30000 | Total reward = 22.54
2022-01-26 14:18:44.696 | DEBUG    | __main__:trials:24 - Trial = 28419/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.698 | DEBUG    | __main__:trials:29 - Trial = 28419/30000 | Total reward = 44.52
2022-01-26 14:18:44.701 | DEBUG    | __main__:trials:24 - Trial = 28420/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.703 | DEBUG    | __main__:trials:29 - Trial = 28420/30000 | Total reward = 42.47
2022-01-26 14:18:44.706 | DEBUG    | __main__:trials:24 - Trial = 28421/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.707 | DEBUG    | __main__:trials:29 - Trial = 28421/30000 | Total reward = 35.89
2022-01-26 14:18:44.711 | DEBUG    | __main__:trials:24 - Trial = 28422/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.713 | DEBUG    | __main__:trials:29 - Trial = 28422/30000 | Total reward = 45.99
2022-01-26 14:18:44.716 | DEBUG    | __main__:trials:24 - Trial = 28423/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.718 | DEBUG    | __main__:trials:29 - Trial = 28423/30000 | Total reward = 37.03
2022-01-26 14:18:44.721 | DEBUG    | __main__:trials:24 - Trial = 28424/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.723 | DEBUG    | __main__:trials:29 - Trial = 28424/30000 | Total reward = 42.99
2022-01-26 14:18:44.727 | DEBUG    | __main__:trials:24 - Trial = 28425/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.727 | DEBUG    | __main__:trials:29 - Trial = 28425/30000 | Total reward = 37.05
2022-01-26 14:18:44.732 | DEBUG    | __main__:trials:24 - Trial = 28426/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.733 | DEBUG    | __main__:trials:29 - Trial = 28426/30000 | Total reward = 49.17
2022-01-26 14:18:44.737 | DEBUG    | __main__:trials:24 - Trial = 28427/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.739 | DEBUG    | __main__:trials:29 - Trial = 28427/30000 | Total reward = 37.38
2022-01-26 14:18:44.741 | DEBUG    | __main__:trials:24 - Trial = 28428/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.743 | DEBUG    | __main__:trials:29 - Trial = 28428/30000 | Total reward = 45.35
2022-01-26 14:18:44.746 | DEBUG    | __main__:trials:24 - Trial = 28429/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.748 | DEBUG    | __main__:trials:29 - Trial = 28429/30000 | Total reward = 23.08
2022-01-26 14:18:44.752 | DEBUG    | __main__:trials:24 - Trial = 28430/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.753 | DEBUG    | __main__:trials:29 - Trial = 28430/30000 | Total reward = 41.62
2022-01-26 14:18:44.757 | DEBUG    | __main__:trials:24 - Trial = 28431/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.759 | DEBUG    | __main__:trials:29 - Trial = 28431/30000 | Total reward = 45.16
2022-01-26 14:18:44.763 | DEBUG    | __main__:trials:24 - Trial = 28432/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.764 | DEBUG    | __main__:trials:29 - Trial = 28432/30000 | Total reward = 47.12
2022-01-26 14:18:44.767 | DEBUG    | __main__:trials:24 - Trial = 28433/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.769 | DEBUG    | __main__:trials:29 - Trial = 28433/30000 | Total reward = 42.12
2022-01-26 14:18:44.772 | DEBUG    | __main__:trials:24 - Trial = 28434/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.774 | DEBUG    | __main__:trials:29 - Trial = 28434/30000 | Total reward = 43.38
2022-01-26 14:18:44.778 | DEBUG    | __main__:trials:24 - Trial = 28435/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.779 | DEBUG    | __main__:trials:29 - Trial = 28435/30000 | Total reward = 42.97
2022-01-26 14:18:44.783 | DEBUG    | __main__:trials:24 - Trial = 28436/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.784 | DEBUG    | __main__:trials:29 - Trial = 28436/30000 | Total reward = 37.28
2022-01-26 14:18:44.787 | DEBUG    | __main__:trials:24 - Trial = 28437/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.788 | DEBUG    | __main__:trials:29 - Trial = 28437/30000 | Total reward = 36.06
2022-01-26 14:18:44.791 | DEBUG    | __main__:trials:24 - Trial = 28438/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.793 | DEBUG    | __main__:trials:29 - Trial = 28438/30000 | Total reward = 45.97
2022-01-26 14:18:44.796 | DEBUG    | __main__:trials:24 - Trial = 28439/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.797 | DEBUG    | __main__:trials:29 - Trial = 28439/30000 | Total reward = 43.73
2022-01-26 14:18:44.801 | DEBUG    | __main__:trials:24 - Trial = 28440/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.801 | DEBUG    | __main__:trials:29 - Trial = 28440/30000 | Total reward = 44.30
2022-01-26 14:18:44.805 | DEBUG    | __main__:trials:24 - Trial = 28441/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.805 | DEBUG    | __main__:trials:29 - Trial = 28441/30000 | Total reward = 38.47
2022-01-26 14:18:44.809 | DEBUG    | __main__:trials:24 - Trial = 28442/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.810 | DEBUG    | __main__:trials:29 - Trial = 28442/30000 | Total reward = 43.84
2022-01-26 14:18:44.813 | DEBUG    | __main__:trials:24 - Trial = 28443/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.814 | DEBUG    | __main__:trials:29 - Trial = 28443/30000 | Total reward = 27.71
2022-01-26 14:18:44.818 | DEBUG    | __main__:trials:24 - Trial = 28444/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.820 | DEBUG    | __main__:trials:29 - Trial = 28444/30000 | Total reward = 51.82
2022-01-26 14:18:44.823 | DEBUG    | __main__:trials:24 - Trial = 28445/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.824 | DEBUG    | __main__:trials:29 - Trial = 28445/30000 | Total reward = 42.42
2022-01-26 14:18:44.827 | DEBUG    | __main__:trials:24 - Trial = 28446/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.828 | DEBUG    | __main__:trials:29 - Trial = 28446/30000 | Total reward = 41.84
2022-01-26 14:18:44.831 | DEBUG    | __main__:trials:24 - Trial = 28447/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.833 | DEBUG    | __main__:trials:29 - Trial = 28447/30000 | Total reward = 49.70
2022-01-26 14:18:44.836 | DEBUG    | __main__:trials:24 - Trial = 28448/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.838 | DEBUG    | __main__:trials:29 - Trial = 28448/30000 | Total reward = 39.60
2022-01-26 14:18:44.842 | DEBUG    | __main__:trials:24 - Trial = 28449/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.843 | DEBUG    | __main__:trials:29 - Trial = 28449/30000 | Total reward = 38.73
2022-01-26 14:18:44.846 | DEBUG    | __main__:trials:24 - Trial = 28450/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.847 | DEBUG    | __main__:trials:29 - Trial = 28450/30000 | Total reward = 41.31
2022-01-26 14:18:44.851 | DEBUG    | __main__:trials:24 - Trial = 28451/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.851 | DEBUG    | __main__:trials:29 - Trial = 28451/30000 | Total reward = 35.73
2022-01-26 14:18:44.854 | DEBUG    | __main__:trials:26 - Trial = 28452/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.856 | DEBUG    | __main__:trials:29 - Trial = 28452/30000 | Total reward = 16.09
2022-01-26 14:18:44.859 | DEBUG    | __main__:trials:24 - Trial = 28453/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.860 | DEBUG    | __main__:trials:29 - Trial = 28453/30000 | Total reward = 42.61
2022-01-26 14:18:44.863 | DEBUG    | __main__:trials:24 - Trial = 28454/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.865 | DEBUG    | __main__:trials:29 - Trial = 28454/30000 | Total reward = 39.47
2022-01-26 14:18:44.868 | DEBUG    | __main__:trials:24 - Trial = 28455/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.870 | DEBUG    | __main__:trials:29 - Trial = 28455/30000 | Total reward = 41.69
2022-01-26 14:18:44.874 | DEBUG    | __main__:trials:24 - Trial = 28456/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.875 | DEBUG    | __main__:trials:29 - Trial = 28456/30000 | Total reward = 46.45
2022-01-26 14:18:44.878 | DEBUG    | __main__:trials:24 - Trial = 28457/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.879 | DEBUG    | __main__:trials:29 - Trial = 28457/30000 | Total reward = 32.41
2022-01-26 14:18:44.882 | DEBUG    | __main__:trials:26 - Trial = 28458/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.883 | DEBUG    | __main__:trials:29 - Trial = 28458/30000 | Total reward = 24.60
2022-01-26 14:18:44.887 | DEBUG    | __main__:trials:24 - Trial = 28459/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.888 | DEBUG    | __main__:trials:29 - Trial = 28459/30000 | Total reward = 45.59
2022-01-26 14:18:44.891 | DEBUG    | __main__:trials:26 - Trial = 28460/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.893 | DEBUG    | __main__:trials:29 - Trial = 28460/30000 | Total reward = 34.46
2022-01-26 14:18:44.896 | DEBUG    | __main__:trials:24 - Trial = 28461/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.898 | DEBUG    | __main__:trials:29 - Trial = 28461/30000 | Total reward = 37.78
2022-01-26 14:18:44.901 | DEBUG    | __main__:trials:24 - Trial = 28462/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.903 | DEBUG    | __main__:trials:29 - Trial = 28462/30000 | Total reward = 40.11
2022-01-26 14:18:44.905 | DEBUG    | __main__:trials:24 - Trial = 28463/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.907 | DEBUG    | __main__:trials:29 - Trial = 28463/30000 | Total reward = 33.36
2022-01-26 14:18:44.910 | DEBUG    | __main__:trials:26 - Trial = 28464/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.911 | DEBUG    | __main__:trials:29 - Trial = 28464/30000 | Total reward = 32.70
2022-01-26 14:18:44.914 | DEBUG    | __main__:trials:24 - Trial = 28465/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.916 | DEBUG    | __main__:trials:29 - Trial = 28465/30000 | Total reward = 25.38
2022-01-26 14:18:44.920 | DEBUG    | __main__:trials:24 - Trial = 28466/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.921 | DEBUG    | __main__:trials:29 - Trial = 28466/30000 | Total reward = 48.29
2022-01-26 14:18:44.924 | DEBUG    | __main__:trials:24 - Trial = 28467/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.926 | DEBUG    | __main__:trials:29 - Trial = 28467/30000 | Total reward = 46.45
2022-01-26 14:18:44.929 | DEBUG    | __main__:trials:24 - Trial = 28468/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.930 | DEBUG    | __main__:trials:29 - Trial = 28468/30000 | Total reward = 50.56
2022-01-26 14:18:44.933 | DEBUG    | __main__:trials:24 - Trial = 28469/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.935 | DEBUG    | __main__:trials:29 - Trial = 28469/30000 | Total reward = 50.91
2022-01-26 14:18:44.938 | DEBUG    | __main__:trials:24 - Trial = 28470/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.939 | DEBUG    | __main__:trials:29 - Trial = 28470/30000 | Total reward = 42.51
2022-01-26 14:18:44.943 | DEBUG    | __main__:trials:24 - Trial = 28471/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.945 | DEBUG    | __main__:trials:29 - Trial = 28471/30000 | Total reward = 32.65
2022-01-26 14:18:44.947 | DEBUG    | __main__:trials:24 - Trial = 28472/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.949 | DEBUG    | __main__:trials:29 - Trial = 28472/30000 | Total reward = 40.97
2022-01-26 14:18:44.953 | DEBUG    | __main__:trials:24 - Trial = 28473/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.955 | DEBUG    | __main__:trials:29 - Trial = 28473/30000 | Total reward = 46.45
2022-01-26 14:18:44.958 | DEBUG    | __main__:trials:24 - Trial = 28474/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.960 | DEBUG    | __main__:trials:29 - Trial = 28474/30000 | Total reward = 40.44
2022-01-26 14:18:44.963 | DEBUG    | __main__:trials:24 - Trial = 28475/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.964 | DEBUG    | __main__:trials:29 - Trial = 28475/30000 | Total reward = 41.84
2022-01-26 14:18:44.966 | DEBUG    | __main__:trials:26 - Trial = 28476/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:44.967 | DEBUG    | __main__:trials:29 - Trial = 28476/30000 | Total reward = 10.38
2022-01-26 14:18:44.971 | DEBUG    | __main__:trials:24 - Trial = 28477/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.972 | DEBUG    | __main__:trials:29 - Trial = 28477/30000 | Total reward = 36.11
2022-01-26 14:18:44.975 | DEBUG    | __main__:trials:24 - Trial = 28478/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.977 | DEBUG    | __main__:trials:29 - Trial = 28478/30000 | Total reward = 29.05
2022-01-26 14:18:44.980 | DEBUG    | __main__:trials:24 - Trial = 28479/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.981 | DEBUG    | __main__:trials:29 - Trial = 28479/30000 | Total reward = 44.33
2022-01-26 14:18:44.985 | DEBUG    | __main__:trials:24 - Trial = 28480/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.985 | DEBUG    | __main__:trials:29 - Trial = 28480/30000 | Total reward = 44.84
2022-01-26 14:18:44.989 | DEBUG    | __main__:trials:24 - Trial = 28481/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.991 | DEBUG    | __main__:trials:29 - Trial = 28481/30000 | Total reward = 44.56
2022-01-26 14:18:44.994 | DEBUG    | __main__:trials:24 - Trial = 28482/30000 | Max number of steps (20) reached
2022-01-26 14:18:44.994 | DEBUG    | __main__:trials:29 - Trial = 28482/30000 | Total reward = 41.17
2022-01-26 14:18:44.998 | DEBUG    | __main__:trials:24 - Trial = 28483/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.000 | DEBUG    | __main__:trials:29 - Trial = 28483/30000 | Total reward = 54.22
2022-01-26 14:18:45.003 | DEBUG    | __main__:trials:24 - Trial = 28484/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.003 | DEBUG    | __main__:trials:29 - Trial = 28484/30000 | Total reward = 32.55
2022-01-26 14:18:45.007 | DEBUG    | __main__:trials:24 - Trial = 28485/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.007 | DEBUG    | __main__:trials:29 - Trial = 28485/30000 | Total reward = 37.61
2022-01-26 14:18:45.011 | DEBUG    | __main__:trials:24 - Trial = 28486/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.012 | DEBUG    | __main__:trials:29 - Trial = 28486/30000 | Total reward = 37.26
2022-01-26 14:18:45.016 | DEBUG    | __main__:trials:24 - Trial = 28487/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.017 | DEBUG    | __main__:trials:29 - Trial = 28487/30000 | Total reward = 45.28
2022-01-26 14:18:45.021 | DEBUG    | __main__:trials:24 - Trial = 28488/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.022 | DEBUG    | __main__:trials:29 - Trial = 28488/30000 | Total reward = 41.84
2022-01-26 14:18:45.026 | DEBUG    | __main__:trials:24 - Trial = 28489/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.028 | DEBUG    | __main__:trials:29 - Trial = 28489/30000 | Total reward = 41.22
2022-01-26 14:18:45.031 | DEBUG    | __main__:trials:24 - Trial = 28490/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.033 | DEBUG    | __main__:trials:29 - Trial = 28490/30000 | Total reward = 39.07
2022-01-26 14:18:45.035 | DEBUG    | __main__:trials:24 - Trial = 28491/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.037 | DEBUG    | __main__:trials:29 - Trial = 28491/30000 | Total reward = 43.00
2022-01-26 14:18:45.041 | DEBUG    | __main__:trials:24 - Trial = 28492/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.042 | DEBUG    | __main__:trials:29 - Trial = 28492/30000 | Total reward = 48.37
2022-01-26 14:18:45.046 | DEBUG    | __main__:trials:24 - Trial = 28493/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.047 | DEBUG    | __main__:trials:29 - Trial = 28493/30000 | Total reward = 48.29
2022-01-26 14:18:45.051 | DEBUG    | __main__:trials:24 - Trial = 28494/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.053 | DEBUG    | __main__:trials:29 - Trial = 28494/30000 | Total reward = 48.76
2022-01-26 14:18:45.056 | DEBUG    | __main__:trials:24 - Trial = 28495/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.058 | DEBUG    | __main__:trials:29 - Trial = 28495/30000 | Total reward = 43.23
2022-01-26 14:18:45.061 | DEBUG    | __main__:trials:24 - Trial = 28496/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.062 | DEBUG    | __main__:trials:29 - Trial = 28496/30000 | Total reward = 46.61
2022-01-26 14:18:45.066 | DEBUG    | __main__:trials:24 - Trial = 28497/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.068 | DEBUG    | __main__:trials:29 - Trial = 28497/30000 | Total reward = 47.11
2022-01-26 14:18:45.071 | DEBUG    | __main__:trials:24 - Trial = 28498/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.073 | DEBUG    | __main__:trials:29 - Trial = 28498/30000 | Total reward = 41.49
2022-01-26 14:18:45.076 | DEBUG    | __main__:trials:24 - Trial = 28499/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.078 | DEBUG    | __main__:trials:29 - Trial = 28499/30000 | Total reward = 48.29
2022-01-26 14:18:45.082 | DEBUG    | __main__:trials:24 - Trial = 28500/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.083 | DEBUG    | __main__:trials:29 - Trial = 28500/30000 | Total reward = 41.25
2022-01-26 14:18:45.087 | DEBUG    | __main__:trials:24 - Trial = 28501/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.089 | DEBUG    | __main__:trials:29 - Trial = 28501/30000 | Total reward = 40.85
2022-01-26 14:18:45.092 | DEBUG    | __main__:trials:24 - Trial = 28502/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.094 | DEBUG    | __main__:trials:29 - Trial = 28502/30000 | Total reward = 33.62
2022-01-26 14:18:45.097 | DEBUG    | __main__:trials:24 - Trial = 28503/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.099 | DEBUG    | __main__:trials:29 - Trial = 28503/30000 | Total reward = 39.02
2022-01-26 14:18:45.104 | DEBUG    | __main__:trials:24 - Trial = 28504/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.104 | DEBUG    | __main__:trials:29 - Trial = 28504/30000 | Total reward = 25.33
2022-01-26 14:18:45.109 | DEBUG    | __main__:trials:24 - Trial = 28505/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.110 | DEBUG    | __main__:trials:29 - Trial = 28505/30000 | Total reward = 41.84
2022-01-26 14:18:45.113 | DEBUG    | __main__:trials:24 - Trial = 28506/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.115 | DEBUG    | __main__:trials:29 - Trial = 28506/30000 | Total reward = 46.08
2022-01-26 14:18:45.118 | DEBUG    | __main__:trials:24 - Trial = 28507/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.120 | DEBUG    | __main__:trials:29 - Trial = 28507/30000 | Total reward = 32.89
2022-01-26 14:18:45.123 | DEBUG    | __main__:trials:24 - Trial = 28508/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.124 | DEBUG    | __main__:trials:29 - Trial = 28508/30000 | Total reward = 42.34
2022-01-26 14:18:45.127 | DEBUG    | __main__:trials:24 - Trial = 28509/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.129 | DEBUG    | __main__:trials:29 - Trial = 28509/30000 | Total reward = 39.90
2022-01-26 14:18:45.132 | DEBUG    | __main__:trials:24 - Trial = 28510/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.133 | DEBUG    | __main__:trials:29 - Trial = 28510/30000 | Total reward = 44.26
2022-01-26 14:18:45.137 | DEBUG    | __main__:trials:24 - Trial = 28511/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.138 | DEBUG    | __main__:trials:29 - Trial = 28511/30000 | Total reward = 31.55
2022-01-26 14:18:45.143 | DEBUG    | __main__:trials:24 - Trial = 28512/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.143 | DEBUG    | __main__:trials:29 - Trial = 28512/30000 | Total reward = 44.65
2022-01-26 14:18:45.147 | DEBUG    | __main__:trials:24 - Trial = 28513/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.149 | DEBUG    | __main__:trials:29 - Trial = 28513/30000 | Total reward = 39.92
2022-01-26 14:18:45.152 | DEBUG    | __main__:trials:24 - Trial = 28514/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.154 | DEBUG    | __main__:trials:29 - Trial = 28514/30000 | Total reward = 39.47
2022-01-26 14:18:45.157 | DEBUG    | __main__:trials:24 - Trial = 28515/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.158 | DEBUG    | __main__:trials:29 - Trial = 28515/30000 | Total reward = 38.16
2022-01-26 14:18:45.163 | DEBUG    | __main__:trials:24 - Trial = 28516/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.163 | DEBUG    | __main__:trials:29 - Trial = 28516/30000 | Total reward = 46.17
2022-01-26 14:18:45.168 | DEBUG    | __main__:trials:24 - Trial = 28517/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.170 | DEBUG    | __main__:trials:29 - Trial = 28517/30000 | Total reward = 42.18
2022-01-26 14:18:45.173 | DEBUG    | __main__:trials:24 - Trial = 28518/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.174 | DEBUG    | __main__:trials:29 - Trial = 28518/30000 | Total reward = 38.09
2022-01-26 14:18:45.178 | DEBUG    | __main__:trials:26 - Trial = 28519/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.178 | DEBUG    | __main__:trials:29 - Trial = 28519/30000 | Total reward = 14.15
2022-01-26 14:18:45.182 | DEBUG    | __main__:trials:24 - Trial = 28520/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.184 | DEBUG    | __main__:trials:29 - Trial = 28520/30000 | Total reward = 48.51
2022-01-26 14:18:45.187 | DEBUG    | __main__:trials:24 - Trial = 28521/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.188 | DEBUG    | __main__:trials:29 - Trial = 28521/30000 | Total reward = 45.94
2022-01-26 14:18:45.191 | DEBUG    | __main__:trials:26 - Trial = 28522/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.193 | DEBUG    | __main__:trials:29 - Trial = 28522/30000 | Total reward = 23.86
2022-01-26 14:18:45.196 | DEBUG    | __main__:trials:24 - Trial = 28523/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.198 | DEBUG    | __main__:trials:29 - Trial = 28523/30000 | Total reward = 35.35
2022-01-26 14:18:45.201 | DEBUG    | __main__:trials:24 - Trial = 28524/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.202 | DEBUG    | __main__:trials:29 - Trial = 28524/30000 | Total reward = 38.40
2022-01-26 14:18:45.205 | DEBUG    | __main__:trials:24 - Trial = 28525/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.207 | DEBUG    | __main__:trials:29 - Trial = 28525/30000 | Total reward = 37.63
2022-01-26 14:18:45.210 | DEBUG    | __main__:trials:26 - Trial = 28526/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.211 | DEBUG    | __main__:trials:29 - Trial = 28526/30000 | Total reward = 20.11
2022-01-26 14:18:45.215 | DEBUG    | __main__:trials:24 - Trial = 28527/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.215 | DEBUG    | __main__:trials:29 - Trial = 28527/30000 | Total reward = 35.35
2022-01-26 14:18:45.220 | DEBUG    | __main__:trials:24 - Trial = 28528/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.221 | DEBUG    | __main__:trials:29 - Trial = 28528/30000 | Total reward = 35.69
2022-01-26 14:18:45.225 | DEBUG    | __main__:trials:24 - Trial = 28529/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.226 | DEBUG    | __main__:trials:29 - Trial = 28529/30000 | Total reward = 47.62
2022-01-26 14:18:45.230 | DEBUG    | __main__:trials:24 - Trial = 28530/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.232 | DEBUG    | __main__:trials:29 - Trial = 28530/30000 | Total reward = 43.33
2022-01-26 14:18:45.234 | DEBUG    | __main__:trials:26 - Trial = 28531/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.236 | DEBUG    | __main__:trials:29 - Trial = 28531/30000 | Total reward = 28.76
2022-01-26 14:18:45.239 | DEBUG    | __main__:trials:24 - Trial = 28532/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.241 | DEBUG    | __main__:trials:29 - Trial = 28532/30000 | Total reward = 47.22
2022-01-26 14:18:45.244 | DEBUG    | __main__:trials:24 - Trial = 28533/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.246 | DEBUG    | __main__:trials:29 - Trial = 28533/30000 | Total reward = 46.16
2022-01-26 14:18:45.249 | DEBUG    | __main__:trials:24 - Trial = 28534/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.250 | DEBUG    | __main__:trials:29 - Trial = 28534/30000 | Total reward = 35.85
2022-01-26 14:18:45.255 | DEBUG    | __main__:trials:24 - Trial = 28535/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.255 | DEBUG    | __main__:trials:29 - Trial = 28535/30000 | Total reward = 45.51
2022-01-26 14:18:45.260 | DEBUG    | __main__:trials:24 - Trial = 28536/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.262 | DEBUG    | __main__:trials:29 - Trial = 28536/30000 | Total reward = 41.71
2022-01-26 14:18:45.265 | DEBUG    | __main__:trials:24 - Trial = 28537/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.267 | DEBUG    | __main__:trials:29 - Trial = 28537/30000 | Total reward = 42.64
2022-01-26 14:18:45.271 | DEBUG    | __main__:trials:24 - Trial = 28538/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.272 | DEBUG    | __main__:trials:29 - Trial = 28538/30000 | Total reward = 59.64
2022-01-26 14:18:45.275 | DEBUG    | __main__:trials:24 - Trial = 28539/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.277 | DEBUG    | __main__:trials:29 - Trial = 28539/30000 | Total reward = 36.63
2022-01-26 14:18:45.281 | DEBUG    | __main__:trials:24 - Trial = 28540/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.282 | DEBUG    | __main__:trials:29 - Trial = 28540/30000 | Total reward = 54.42
2022-01-26 14:18:45.285 | DEBUG    | __main__:trials:24 - Trial = 28541/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.288 | DEBUG    | __main__:trials:29 - Trial = 28541/30000 | Total reward = 41.63
2022-01-26 14:18:45.291 | DEBUG    | __main__:trials:24 - Trial = 28542/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.293 | DEBUG    | __main__:trials:29 - Trial = 28542/30000 | Total reward = 50.48
2022-01-26 14:18:45.296 | DEBUG    | __main__:trials:24 - Trial = 28543/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.298 | DEBUG    | __main__:trials:29 - Trial = 28543/30000 | Total reward = 39.96
2022-01-26 14:18:45.301 | DEBUG    | __main__:trials:24 - Trial = 28544/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.302 | DEBUG    | __main__:trials:29 - Trial = 28544/30000 | Total reward = 44.49
2022-01-26 14:18:45.305 | DEBUG    | __main__:trials:26 - Trial = 28545/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.307 | DEBUG    | __main__:trials:29 - Trial = 28545/30000 | Total reward = 25.35
2022-01-26 14:18:45.311 | DEBUG    | __main__:trials:24 - Trial = 28546/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.313 | DEBUG    | __main__:trials:29 - Trial = 28546/30000 | Total reward = 51.88
2022-01-26 14:18:45.316 | DEBUG    | __main__:trials:24 - Trial = 28547/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.317 | DEBUG    | __main__:trials:29 - Trial = 28547/30000 | Total reward = 35.76
2022-01-26 14:18:45.320 | DEBUG    | __main__:trials:24 - Trial = 28548/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.322 | DEBUG    | __main__:trials:29 - Trial = 28548/30000 | Total reward = 36.89
2022-01-26 14:18:45.325 | DEBUG    | __main__:trials:24 - Trial = 28549/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.326 | DEBUG    | __main__:trials:29 - Trial = 28549/30000 | Total reward = 45.87
2022-01-26 14:18:45.329 | DEBUG    | __main__:trials:26 - Trial = 28550/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.331 | DEBUG    | __main__:trials:29 - Trial = 28550/30000 | Total reward = 15.02
2022-01-26 14:18:45.335 | DEBUG    | __main__:trials:24 - Trial = 28551/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.336 | DEBUG    | __main__:trials:29 - Trial = 28551/30000 | Total reward = 46.67
2022-01-26 14:18:45.340 | DEBUG    | __main__:trials:24 - Trial = 28552/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.340 | DEBUG    | __main__:trials:29 - Trial = 28552/30000 | Total reward = 38.84
2022-01-26 14:18:45.344 | DEBUG    | __main__:trials:24 - Trial = 28553/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.346 | DEBUG    | __main__:trials:29 - Trial = 28553/30000 | Total reward = 36.50
2022-01-26 14:18:45.349 | DEBUG    | __main__:trials:24 - Trial = 28554/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.350 | DEBUG    | __main__:trials:29 - Trial = 28554/30000 | Total reward = 32.75
2022-01-26 14:18:45.355 | DEBUG    | __main__:trials:24 - Trial = 28555/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.356 | DEBUG    | __main__:trials:29 - Trial = 28555/30000 | Total reward = 46.97
2022-01-26 14:18:45.360 | DEBUG    | __main__:trials:24 - Trial = 28556/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.361 | DEBUG    | __main__:trials:29 - Trial = 28556/30000 | Total reward = 31.90
2022-01-26 14:18:45.365 | DEBUG    | __main__:trials:24 - Trial = 28557/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.367 | DEBUG    | __main__:trials:29 - Trial = 28557/30000 | Total reward = 43.98
2022-01-26 14:18:45.369 | DEBUG    | __main__:trials:26 - Trial = 28558/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.370 | DEBUG    | __main__:trials:29 - Trial = 28558/30000 | Total reward = 15.00
2022-01-26 14:18:45.373 | DEBUG    | __main__:trials:24 - Trial = 28559/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.374 | DEBUG    | __main__:trials:29 - Trial = 28559/30000 | Total reward = 41.84
2022-01-26 14:18:45.377 | DEBUG    | __main__:trials:24 - Trial = 28560/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.379 | DEBUG    | __main__:trials:29 - Trial = 28560/30000 | Total reward = 43.80
2022-01-26 14:18:45.382 | DEBUG    | __main__:trials:24 - Trial = 28561/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.383 | DEBUG    | __main__:trials:29 - Trial = 28561/30000 | Total reward = 35.05
2022-01-26 14:18:45.386 | DEBUG    | __main__:trials:24 - Trial = 28562/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.388 | DEBUG    | __main__:trials:29 - Trial = 28562/30000 | Total reward = 47.54
2022-01-26 14:18:45.392 | DEBUG    | __main__:trials:24 - Trial = 28563/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.393 | DEBUG    | __main__:trials:29 - Trial = 28563/30000 | Total reward = 31.12
2022-01-26 14:18:45.396 | DEBUG    | __main__:trials:24 - Trial = 28564/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.398 | DEBUG    | __main__:trials:29 - Trial = 28564/30000 | Total reward = 42.51
2022-01-26 14:18:45.402 | DEBUG    | __main__:trials:24 - Trial = 28565/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.402 | DEBUG    | __main__:trials:29 - Trial = 28565/30000 | Total reward = 39.84
2022-01-26 14:18:45.406 | DEBUG    | __main__:trials:24 - Trial = 28566/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.408 | DEBUG    | __main__:trials:29 - Trial = 28566/30000 | Total reward = 43.17
2022-01-26 14:18:45.412 | DEBUG    | __main__:trials:24 - Trial = 28567/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.413 | DEBUG    | __main__:trials:29 - Trial = 28567/30000 | Total reward = 28.53
2022-01-26 14:18:45.416 | DEBUG    | __main__:trials:26 - Trial = 28568/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.417 | DEBUG    | __main__:trials:29 - Trial = 28568/30000 | Total reward = 22.26
2022-01-26 14:18:45.421 | DEBUG    | __main__:trials:24 - Trial = 28569/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.422 | DEBUG    | __main__:trials:29 - Trial = 28569/30000 | Total reward = 43.20
2022-01-26 14:18:45.426 | DEBUG    | __main__:trials:24 - Trial = 28570/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.427 | DEBUG    | __main__:trials:29 - Trial = 28570/30000 | Total reward = 35.94
2022-01-26 14:18:45.431 | DEBUG    | __main__:trials:26 - Trial = 28571/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.432 | DEBUG    | __main__:trials:29 - Trial = 28571/30000 | Total reward = 20.20
2022-01-26 14:18:45.436 | DEBUG    | __main__:trials:24 - Trial = 28572/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.437 | DEBUG    | __main__:trials:29 - Trial = 28572/30000 | Total reward = 46.59
2022-01-26 14:18:45.441 | DEBUG    | __main__:trials:24 - Trial = 28573/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.442 | DEBUG    | __main__:trials:29 - Trial = 28573/30000 | Total reward = 50.87
2022-01-26 14:18:45.446 | DEBUG    | __main__:trials:24 - Trial = 28574/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.448 | DEBUG    | __main__:trials:29 - Trial = 28574/30000 | Total reward = 44.31
2022-01-26 14:18:45.452 | DEBUG    | __main__:trials:24 - Trial = 28575/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.453 | DEBUG    | __main__:trials:29 - Trial = 28575/30000 | Total reward = 35.12
2022-01-26 14:18:45.457 | DEBUG    | __main__:trials:24 - Trial = 28576/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.458 | DEBUG    | __main__:trials:29 - Trial = 28576/30000 | Total reward = 41.19
2022-01-26 14:18:45.462 | DEBUG    | __main__:trials:24 - Trial = 28577/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.463 | DEBUG    | __main__:trials:29 - Trial = 28577/30000 | Total reward = 37.57
2022-01-26 14:18:45.467 | DEBUG    | __main__:trials:24 - Trial = 28578/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.468 | DEBUG    | __main__:trials:29 - Trial = 28578/30000 | Total reward = 36.21
2022-01-26 14:18:45.472 | DEBUG    | __main__:trials:26 - Trial = 28579/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.474 | DEBUG    | __main__:trials:29 - Trial = 28579/30000 | Total reward = 23.14
2022-01-26 14:18:45.477 | DEBUG    | __main__:trials:24 - Trial = 28580/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.478 | DEBUG    | __main__:trials:29 - Trial = 28580/30000 | Total reward = 41.44
2022-01-26 14:18:45.482 | DEBUG    | __main__:trials:24 - Trial = 28581/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.483 | DEBUG    | __main__:trials:29 - Trial = 28581/30000 | Total reward = 33.20
2022-01-26 14:18:45.487 | DEBUG    | __main__:trials:24 - Trial = 28582/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.488 | DEBUG    | __main__:trials:29 - Trial = 28582/30000 | Total reward = 51.51
2022-01-26 14:18:45.492 | DEBUG    | __main__:trials:24 - Trial = 28583/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.493 | DEBUG    | __main__:trials:29 - Trial = 28583/30000 | Total reward = 35.64
2022-01-26 14:18:45.497 | DEBUG    | __main__:trials:24 - Trial = 28584/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.498 | DEBUG    | __main__:trials:29 - Trial = 28584/30000 | Total reward = 41.98
2022-01-26 14:18:45.502 | DEBUG    | __main__:trials:24 - Trial = 28585/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.503 | DEBUG    | __main__:trials:29 - Trial = 28585/30000 | Total reward = 39.79
2022-01-26 14:18:45.507 | DEBUG    | __main__:trials:24 - Trial = 28586/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.507 | DEBUG    | __main__:trials:29 - Trial = 28586/30000 | Total reward = 34.90
2022-01-26 14:18:45.512 | DEBUG    | __main__:trials:24 - Trial = 28587/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.513 | DEBUG    | __main__:trials:29 - Trial = 28587/30000 | Total reward = 37.51
2022-01-26 14:18:45.517 | DEBUG    | __main__:trials:26 - Trial = 28588/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.517 | DEBUG    | __main__:trials:29 - Trial = 28588/30000 | Total reward = 24.32
2022-01-26 14:18:45.521 | DEBUG    | __main__:trials:24 - Trial = 28589/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.522 | DEBUG    | __main__:trials:29 - Trial = 28589/30000 | Total reward = 25.48
2022-01-26 14:18:45.527 | DEBUG    | __main__:trials:24 - Trial = 28590/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.527 | DEBUG    | __main__:trials:29 - Trial = 28590/30000 | Total reward = 48.03
2022-01-26 14:18:45.531 | DEBUG    | __main__:trials:24 - Trial = 28591/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.533 | DEBUG    | __main__:trials:29 - Trial = 28591/30000 | Total reward = 21.54
2022-01-26 14:18:45.536 | DEBUG    | __main__:trials:24 - Trial = 28592/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.538 | DEBUG    | __main__:trials:29 - Trial = 28592/30000 | Total reward = 47.78
2022-01-26 14:18:45.541 | DEBUG    | __main__:trials:24 - Trial = 28593/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.541 | DEBUG    | __main__:trials:29 - Trial = 28593/30000 | Total reward = 47.47
2022-01-26 14:18:45.546 | DEBUG    | __main__:trials:24 - Trial = 28594/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.547 | DEBUG    | __main__:trials:29 - Trial = 28594/30000 | Total reward = 46.71
2022-01-26 14:18:45.550 | DEBUG    | __main__:trials:24 - Trial = 28595/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.552 | DEBUG    | __main__:trials:29 - Trial = 28595/30000 | Total reward = 50.62
2022-01-26 14:18:45.555 | DEBUG    | __main__:trials:24 - Trial = 28596/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.556 | DEBUG    | __main__:trials:29 - Trial = 28596/30000 | Total reward = 40.24
2022-01-26 14:18:45.560 | DEBUG    | __main__:trials:24 - Trial = 28597/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.561 | DEBUG    | __main__:trials:29 - Trial = 28597/30000 | Total reward = 30.63
2022-01-26 14:18:45.564 | DEBUG    | __main__:trials:24 - Trial = 28598/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.566 | DEBUG    | __main__:trials:29 - Trial = 28598/30000 | Total reward = 25.99
2022-01-26 14:18:45.569 | DEBUG    | __main__:trials:24 - Trial = 28599/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.569 | DEBUG    | __main__:trials:29 - Trial = 28599/30000 | Total reward = 42.78
2022-01-26 14:18:45.574 | DEBUG    | __main__:trials:24 - Trial = 28600/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.575 | DEBUG    | __main__:trials:29 - Trial = 28600/30000 | Total reward = 30.63
2022-01-26 14:18:45.579 | DEBUG    | __main__:trials:24 - Trial = 28601/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.581 | DEBUG    | __main__:trials:29 - Trial = 28601/30000 | Total reward = 61.31
2022-01-26 14:18:45.584 | DEBUG    | __main__:trials:24 - Trial = 28602/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.586 | DEBUG    | __main__:trials:29 - Trial = 28602/30000 | Total reward = 34.40
2022-01-26 14:18:45.589 | DEBUG    | __main__:trials:24 - Trial = 28603/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.590 | DEBUG    | __main__:trials:29 - Trial = 28603/30000 | Total reward = 41.89
2022-01-26 14:18:45.594 | DEBUG    | __main__:trials:24 - Trial = 28604/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.595 | DEBUG    | __main__:trials:29 - Trial = 28604/30000 | Total reward = 45.79
2022-01-26 14:18:45.599 | DEBUG    | __main__:trials:24 - Trial = 28605/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.599 | DEBUG    | __main__:trials:29 - Trial = 28605/30000 | Total reward = 48.29
2022-01-26 14:18:45.604 | DEBUG    | __main__:trials:24 - Trial = 28606/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.605 | DEBUG    | __main__:trials:29 - Trial = 28606/30000 | Total reward = 41.03
2022-01-26 14:18:45.609 | DEBUG    | __main__:trials:24 - Trial = 28607/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.611 | DEBUG    | __main__:trials:29 - Trial = 28607/30000 | Total reward = 35.77
2022-01-26 14:18:45.614 | DEBUG    | __main__:trials:24 - Trial = 28608/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.615 | DEBUG    | __main__:trials:29 - Trial = 28608/30000 | Total reward = 48.85
2022-01-26 14:18:45.618 | DEBUG    | __main__:trials:24 - Trial = 28609/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.620 | DEBUG    | __main__:trials:29 - Trial = 28609/30000 | Total reward = 36.98
2022-01-26 14:18:45.623 | DEBUG    | __main__:trials:24 - Trial = 28610/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.624 | DEBUG    | __main__:trials:29 - Trial = 28610/30000 | Total reward = 41.39
2022-01-26 14:18:45.628 | DEBUG    | __main__:trials:24 - Trial = 28611/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.629 | DEBUG    | __main__:trials:29 - Trial = 28611/30000 | Total reward = 42.82
2022-01-26 14:18:45.633 | DEBUG    | __main__:trials:24 - Trial = 28612/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.634 | DEBUG    | __main__:trials:29 - Trial = 28612/30000 | Total reward = 41.14
2022-01-26 14:18:45.638 | DEBUG    | __main__:trials:24 - Trial = 28613/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.639 | DEBUG    | __main__:trials:29 - Trial = 28613/30000 | Total reward = 43.88
2022-01-26 14:18:45.643 | DEBUG    | __main__:trials:24 - Trial = 28614/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.644 | DEBUG    | __main__:trials:29 - Trial = 28614/30000 | Total reward = 43.09
2022-01-26 14:18:45.647 | DEBUG    | __main__:trials:26 - Trial = 28615/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.649 | DEBUG    | __main__:trials:29 - Trial = 28615/30000 | Total reward = 20.33
2022-01-26 14:18:45.652 | DEBUG    | __main__:trials:24 - Trial = 28616/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.654 | DEBUG    | __main__:trials:29 - Trial = 28616/30000 | Total reward = 48.57
2022-01-26 14:18:45.657 | DEBUG    | __main__:trials:24 - Trial = 28617/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.659 | DEBUG    | __main__:trials:29 - Trial = 28617/30000 | Total reward = 55.61
2022-01-26 14:18:45.663 | DEBUG    | __main__:trials:24 - Trial = 28618/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.663 | DEBUG    | __main__:trials:29 - Trial = 28618/30000 | Total reward = 52.52
2022-01-26 14:18:45.668 | DEBUG    | __main__:trials:24 - Trial = 28619/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.669 | DEBUG    | __main__:trials:29 - Trial = 28619/30000 | Total reward = 38.29
2022-01-26 14:18:45.673 | DEBUG    | __main__:trials:24 - Trial = 28620/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.674 | DEBUG    | __main__:trials:29 - Trial = 28620/30000 | Total reward = 45.68
2022-01-26 14:18:45.677 | DEBUG    | __main__:trials:24 - Trial = 28621/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.679 | DEBUG    | __main__:trials:29 - Trial = 28621/30000 | Total reward = 32.74
2022-01-26 14:18:45.683 | DEBUG    | __main__:trials:24 - Trial = 28622/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.684 | DEBUG    | __main__:trials:29 - Trial = 28622/30000 | Total reward = 38.20
2022-01-26 14:18:45.688 | DEBUG    | __main__:trials:24 - Trial = 28623/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.690 | DEBUG    | __main__:trials:29 - Trial = 28623/30000 | Total reward = 36.01
2022-01-26 14:18:45.693 | DEBUG    | __main__:trials:26 - Trial = 28624/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.694 | DEBUG    | __main__:trials:29 - Trial = 28624/30000 | Total reward = 27.05
2022-01-26 14:18:45.698 | DEBUG    | __main__:trials:24 - Trial = 28625/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.698 | DEBUG    | __main__:trials:29 - Trial = 28625/30000 | Total reward = 41.98
2022-01-26 14:18:45.703 | DEBUG    | __main__:trials:24 - Trial = 28626/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.704 | DEBUG    | __main__:trials:29 - Trial = 28626/30000 | Total reward = 38.12
2022-01-26 14:18:45.707 | DEBUG    | __main__:trials:24 - Trial = 28627/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.709 | DEBUG    | __main__:trials:29 - Trial = 28627/30000 | Total reward = 34.49
2022-01-26 14:18:45.712 | DEBUG    | __main__:trials:24 - Trial = 28628/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.714 | DEBUG    | __main__:trials:29 - Trial = 28628/30000 | Total reward = 28.16
2022-01-26 14:18:45.717 | DEBUG    | __main__:trials:24 - Trial = 28629/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.719 | DEBUG    | __main__:trials:29 - Trial = 28629/30000 | Total reward = 41.00
2022-01-26 14:18:45.722 | DEBUG    | __main__:trials:24 - Trial = 28630/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.723 | DEBUG    | __main__:trials:29 - Trial = 28630/30000 | Total reward = 36.01
2022-01-26 14:18:45.727 | DEBUG    | __main__:trials:24 - Trial = 28631/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.729 | DEBUG    | __main__:trials:29 - Trial = 28631/30000 | Total reward = 52.33
2022-01-26 14:18:45.732 | DEBUG    | __main__:trials:24 - Trial = 28632/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.733 | DEBUG    | __main__:trials:29 - Trial = 28632/30000 | Total reward = 51.17
2022-01-26 14:18:45.737 | DEBUG    | __main__:trials:24 - Trial = 28633/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.738 | DEBUG    | __main__:trials:29 - Trial = 28633/30000 | Total reward = 61.31
2022-01-26 14:18:45.743 | DEBUG    | __main__:trials:24 - Trial = 28634/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.744 | DEBUG    | __main__:trials:29 - Trial = 28634/30000 | Total reward = 40.00
2022-01-26 14:18:45.748 | DEBUG    | __main__:trials:24 - Trial = 28635/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.749 | DEBUG    | __main__:trials:29 - Trial = 28635/30000 | Total reward = 41.98
2022-01-26 14:18:45.753 | DEBUG    | __main__:trials:24 - Trial = 28636/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.754 | DEBUG    | __main__:trials:29 - Trial = 28636/30000 | Total reward = 40.26
2022-01-26 14:18:45.757 | DEBUG    | __main__:trials:24 - Trial = 28637/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.759 | DEBUG    | __main__:trials:29 - Trial = 28637/30000 | Total reward = 54.90
2022-01-26 14:18:45.762 | DEBUG    | __main__:trials:24 - Trial = 28638/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.764 | DEBUG    | __main__:trials:29 - Trial = 28638/30000 | Total reward = 38.14
2022-01-26 14:18:45.766 | DEBUG    | __main__:trials:24 - Trial = 28639/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.768 | DEBUG    | __main__:trials:29 - Trial = 28639/30000 | Total reward = 38.82
2022-01-26 14:18:45.772 | DEBUG    | __main__:trials:24 - Trial = 28640/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.773 | DEBUG    | __main__:trials:29 - Trial = 28640/30000 | Total reward = 46.07
2022-01-26 14:18:45.776 | DEBUG    | __main__:trials:26 - Trial = 28641/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.776 | DEBUG    | __main__:trials:29 - Trial = 28641/30000 | Total reward = 23.61
2022-01-26 14:18:45.781 | DEBUG    | __main__:trials:24 - Trial = 28642/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.781 | DEBUG    | __main__:trials:29 - Trial = 28642/30000 | Total reward = 37.01
2022-01-26 14:18:45.785 | DEBUG    | __main__:trials:24 - Trial = 28643/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.786 | DEBUG    | __main__:trials:29 - Trial = 28643/30000 | Total reward = 46.22
2022-01-26 14:18:45.789 | DEBUG    | __main__:trials:24 - Trial = 28644/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.791 | DEBUG    | __main__:trials:29 - Trial = 28644/30000 | Total reward = 40.91
2022-01-26 14:18:45.794 | DEBUG    | __main__:trials:24 - Trial = 28645/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.796 | DEBUG    | __main__:trials:29 - Trial = 28645/30000 | Total reward = 28.96
2022-01-26 14:18:45.799 | DEBUG    | __main__:trials:24 - Trial = 28646/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.801 | DEBUG    | __main__:trials:29 - Trial = 28646/30000 | Total reward = 32.88
2022-01-26 14:18:45.805 | DEBUG    | __main__:trials:24 - Trial = 28647/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.806 | DEBUG    | __main__:trials:29 - Trial = 28647/30000 | Total reward = 39.96
2022-01-26 14:18:45.810 | DEBUG    | __main__:trials:24 - Trial = 28648/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.811 | DEBUG    | __main__:trials:29 - Trial = 28648/30000 | Total reward = 44.54
2022-01-26 14:18:45.815 | DEBUG    | __main__:trials:24 - Trial = 28649/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.816 | DEBUG    | __main__:trials:29 - Trial = 28649/30000 | Total reward = 47.01
2022-01-26 14:18:45.819 | DEBUG    | __main__:trials:24 - Trial = 28650/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.821 | DEBUG    | __main__:trials:29 - Trial = 28650/30000 | Total reward = 39.78
2022-01-26 14:18:45.824 | DEBUG    | __main__:trials:24 - Trial = 28651/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.825 | DEBUG    | __main__:trials:29 - Trial = 28651/30000 | Total reward = 40.93
2022-01-26 14:18:45.829 | DEBUG    | __main__:trials:24 - Trial = 28652/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.829 | DEBUG    | __main__:trials:29 - Trial = 28652/30000 | Total reward = 35.39
2022-01-26 14:18:45.833 | DEBUG    | __main__:trials:24 - Trial = 28653/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.834 | DEBUG    | __main__:trials:29 - Trial = 28653/30000 | Total reward = 52.37
2022-01-26 14:18:45.837 | DEBUG    | __main__:trials:24 - Trial = 28654/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.838 | DEBUG    | __main__:trials:29 - Trial = 28654/30000 | Total reward = 22.51
2022-01-26 14:18:45.841 | DEBUG    | __main__:trials:24 - Trial = 28655/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.842 | DEBUG    | __main__:trials:29 - Trial = 28655/30000 | Total reward = 56.29
2022-01-26 14:18:45.845 | DEBUG    | __main__:trials:24 - Trial = 28656/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.846 | DEBUG    | __main__:trials:29 - Trial = 28656/30000 | Total reward = 40.14
2022-01-26 14:18:45.849 | DEBUG    | __main__:trials:24 - Trial = 28657/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.850 | DEBUG    | __main__:trials:29 - Trial = 28657/30000 | Total reward = 50.36
2022-01-26 14:18:45.853 | DEBUG    | __main__:trials:24 - Trial = 28658/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.854 | DEBUG    | __main__:trials:29 - Trial = 28658/30000 | Total reward = 38.97
2022-01-26 14:18:45.858 | DEBUG    | __main__:trials:24 - Trial = 28659/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.858 | DEBUG    | __main__:trials:29 - Trial = 28659/30000 | Total reward = 34.05
2022-01-26 14:18:45.862 | DEBUG    | __main__:trials:24 - Trial = 28660/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.863 | DEBUG    | __main__:trials:29 - Trial = 28660/30000 | Total reward = 63.26
2022-01-26 14:18:45.867 | DEBUG    | __main__:trials:24 - Trial = 28661/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.868 | DEBUG    | __main__:trials:29 - Trial = 28661/30000 | Total reward = 47.48
2022-01-26 14:18:45.871 | DEBUG    | __main__:trials:24 - Trial = 28662/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.872 | DEBUG    | __main__:trials:29 - Trial = 28662/30000 | Total reward = 31.83
2022-01-26 14:18:45.875 | DEBUG    | __main__:trials:24 - Trial = 28663/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.876 | DEBUG    | __main__:trials:29 - Trial = 28663/30000 | Total reward = 30.96
2022-01-26 14:18:45.879 | DEBUG    | __main__:trials:24 - Trial = 28664/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.881 | DEBUG    | __main__:trials:29 - Trial = 28664/30000 | Total reward = 30.57
2022-01-26 14:18:45.884 | DEBUG    | __main__:trials:24 - Trial = 28665/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.886 | DEBUG    | __main__:trials:29 - Trial = 28665/30000 | Total reward = 36.28
2022-01-26 14:18:45.889 | DEBUG    | __main__:trials:26 - Trial = 28666/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.889 | DEBUG    | __main__:trials:29 - Trial = 28666/30000 | Total reward = 13.34
2022-01-26 14:18:45.892 | DEBUG    | __main__:trials:24 - Trial = 28667/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.894 | DEBUG    | __main__:trials:29 - Trial = 28667/30000 | Total reward = 40.94
2022-01-26 14:18:45.897 | DEBUG    | __main__:trials:24 - Trial = 28668/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.898 | DEBUG    | __main__:trials:29 - Trial = 28668/30000 | Total reward = 39.66
2022-01-26 14:18:45.901 | DEBUG    | __main__:trials:26 - Trial = 28669/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.903 | DEBUG    | __main__:trials:29 - Trial = 28669/30000 | Total reward = 24.42
2022-01-26 14:18:45.906 | DEBUG    | __main__:trials:24 - Trial = 28670/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.907 | DEBUG    | __main__:trials:29 - Trial = 28670/30000 | Total reward = 38.22
2022-01-26 14:18:45.910 | DEBUG    | __main__:trials:24 - Trial = 28671/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.911 | DEBUG    | __main__:trials:29 - Trial = 28671/30000 | Total reward = 43.80
2022-01-26 14:18:45.913 | DEBUG    | __main__:trials:26 - Trial = 28672/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.914 | DEBUG    | __main__:trials:29 - Trial = 28672/30000 | Total reward = 15.74
2022-01-26 14:18:45.917 | DEBUG    | __main__:trials:24 - Trial = 28673/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.918 | DEBUG    | __main__:trials:29 - Trial = 28673/30000 | Total reward = 37.72
2022-01-26 14:18:45.922 | DEBUG    | __main__:trials:24 - Trial = 28674/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.923 | DEBUG    | __main__:trials:29 - Trial = 28674/30000 | Total reward = 38.15
2022-01-26 14:18:45.926 | DEBUG    | __main__:trials:24 - Trial = 28675/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.928 | DEBUG    | __main__:trials:29 - Trial = 28675/30000 | Total reward = 37.78
2022-01-26 14:18:45.930 | DEBUG    | __main__:trials:26 - Trial = 28676/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.932 | DEBUG    | __main__:trials:29 - Trial = 28676/30000 | Total reward = 21.76
2022-01-26 14:18:45.934 | DEBUG    | __main__:trials:26 - Trial = 28677/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.935 | DEBUG    | __main__:trials:29 - Trial = 28677/30000 | Total reward = 15.49
2022-01-26 14:18:45.938 | DEBUG    | __main__:trials:24 - Trial = 28678/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.939 | DEBUG    | __main__:trials:29 - Trial = 28678/30000 | Total reward = 43.74
2022-01-26 14:18:45.942 | DEBUG    | __main__:trials:24 - Trial = 28679/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.943 | DEBUG    | __main__:trials:29 - Trial = 28679/30000 | Total reward = 35.57
2022-01-26 14:18:45.947 | DEBUG    | __main__:trials:24 - Trial = 28680/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.948 | DEBUG    | __main__:trials:29 - Trial = 28680/30000 | Total reward = 55.38
2022-01-26 14:18:45.951 | DEBUG    | __main__:trials:26 - Trial = 28681/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.952 | DEBUG    | __main__:trials:29 - Trial = 28681/30000 | Total reward = 30.02
2022-01-26 14:18:45.956 | DEBUG    | __main__:trials:24 - Trial = 28682/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.958 | DEBUG    | __main__:trials:29 - Trial = 28682/30000 | Total reward = 49.44
2022-01-26 14:18:45.961 | DEBUG    | __main__:trials:24 - Trial = 28683/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.962 | DEBUG    | __main__:trials:29 - Trial = 28683/30000 | Total reward = 38.62
2022-01-26 14:18:45.965 | DEBUG    | __main__:trials:24 - Trial = 28684/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.966 | DEBUG    | __main__:trials:29 - Trial = 28684/30000 | Total reward = 50.09
2022-01-26 14:18:45.969 | DEBUG    | __main__:trials:24 - Trial = 28685/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.970 | DEBUG    | __main__:trials:29 - Trial = 28685/30000 | Total reward = 46.05
2022-01-26 14:18:45.972 | DEBUG    | __main__:trials:26 - Trial = 28686/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:45.973 | DEBUG    | __main__:trials:29 - Trial = 28686/30000 | Total reward = 10.11
2022-01-26 14:18:45.977 | DEBUG    | __main__:trials:24 - Trial = 28687/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.978 | DEBUG    | __main__:trials:29 - Trial = 28687/30000 | Total reward = 43.92
2022-01-26 14:18:45.981 | DEBUG    | __main__:trials:24 - Trial = 28688/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.982 | DEBUG    | __main__:trials:29 - Trial = 28688/30000 | Total reward = 38.03
2022-01-26 14:18:45.985 | DEBUG    | __main__:trials:24 - Trial = 28689/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.985 | DEBUG    | __main__:trials:29 - Trial = 28689/30000 | Total reward = 35.04
2022-01-26 14:18:45.989 | DEBUG    | __main__:trials:24 - Trial = 28690/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.989 | DEBUG    | __main__:trials:29 - Trial = 28690/30000 | Total reward = 44.94
2022-01-26 14:18:45.993 | DEBUG    | __main__:trials:24 - Trial = 28691/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.994 | DEBUG    | __main__:trials:29 - Trial = 28691/30000 | Total reward = 47.25
2022-01-26 14:18:45.997 | DEBUG    | __main__:trials:24 - Trial = 28692/30000 | Max number of steps (20) reached
2022-01-26 14:18:45.999 | DEBUG    | __main__:trials:29 - Trial = 28692/30000 | Total reward = 48.94
2022-01-26 14:18:46.002 | DEBUG    | __main__:trials:24 - Trial = 28693/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.003 | DEBUG    | __main__:trials:29 - Trial = 28693/30000 | Total reward = 39.47
2022-01-26 14:18:46.006 | DEBUG    | __main__:trials:24 - Trial = 28694/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.007 | DEBUG    | __main__:trials:29 - Trial = 28694/30000 | Total reward = 55.78
2022-01-26 14:18:46.010 | DEBUG    | __main__:trials:24 - Trial = 28695/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.011 | DEBUG    | __main__:trials:29 - Trial = 28695/30000 | Total reward = 45.41
2022-01-26 14:18:46.015 | DEBUG    | __main__:trials:24 - Trial = 28696/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.017 | DEBUG    | __main__:trials:29 - Trial = 28696/30000 | Total reward = 42.97
2022-01-26 14:18:46.020 | DEBUG    | __main__:trials:24 - Trial = 28697/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.021 | DEBUG    | __main__:trials:29 - Trial = 28697/30000 | Total reward = 32.51
2022-01-26 14:18:46.025 | DEBUG    | __main__:trials:24 - Trial = 28698/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.026 | DEBUG    | __main__:trials:29 - Trial = 28698/30000 | Total reward = 45.49
2022-01-26 14:18:46.028 | DEBUG    | __main__:trials:26 - Trial = 28699/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.028 | DEBUG    | __main__:trials:29 - Trial = 28699/30000 | Total reward = 8.43
2022-01-26 14:18:46.032 | DEBUG    | __main__:trials:24 - Trial = 28700/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.033 | DEBUG    | __main__:trials:29 - Trial = 28700/30000 | Total reward = 28.07
2022-01-26 14:18:46.036 | DEBUG    | __main__:trials:24 - Trial = 28701/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.037 | DEBUG    | __main__:trials:29 - Trial = 28701/30000 | Total reward = 31.13
2022-01-26 14:18:46.040 | DEBUG    | __main__:trials:24 - Trial = 28702/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.041 | DEBUG    | __main__:trials:29 - Trial = 28702/30000 | Total reward = 37.71
2022-01-26 14:18:46.044 | DEBUG    | __main__:trials:24 - Trial = 28703/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.046 | DEBUG    | __main__:trials:29 - Trial = 28703/30000 | Total reward = 56.07
2022-01-26 14:18:46.049 | DEBUG    | __main__:trials:24 - Trial = 28704/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.050 | DEBUG    | __main__:trials:29 - Trial = 28704/30000 | Total reward = 44.80
2022-01-26 14:18:46.053 | DEBUG    | __main__:trials:24 - Trial = 28705/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.054 | DEBUG    | __main__:trials:29 - Trial = 28705/30000 | Total reward = 43.08
2022-01-26 14:18:46.057 | DEBUG    | __main__:trials:24 - Trial = 28706/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.058 | DEBUG    | __main__:trials:29 - Trial = 28706/30000 | Total reward = 32.51
2022-01-26 14:18:46.061 | DEBUG    | __main__:trials:26 - Trial = 28707/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.062 | DEBUG    | __main__:trials:29 - Trial = 28707/30000 | Total reward = 28.34
2022-01-26 14:18:46.065 | DEBUG    | __main__:trials:24 - Trial = 28708/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.066 | DEBUG    | __main__:trials:29 - Trial = 28708/30000 | Total reward = 44.21
2022-01-26 14:18:46.069 | DEBUG    | __main__:trials:24 - Trial = 28709/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.070 | DEBUG    | __main__:trials:29 - Trial = 28709/30000 | Total reward = 26.29
2022-01-26 14:18:46.073 | DEBUG    | __main__:trials:26 - Trial = 28710/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.074 | DEBUG    | __main__:trials:29 - Trial = 28710/30000 | Total reward = 22.95
2022-01-26 14:18:46.077 | DEBUG    | __main__:trials:26 - Trial = 28711/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.078 | DEBUG    | __main__:trials:29 - Trial = 28711/30000 | Total reward = 23.43
2022-01-26 14:18:46.081 | DEBUG    | __main__:trials:24 - Trial = 28712/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.081 | DEBUG    | __main__:trials:29 - Trial = 28712/30000 | Total reward = 48.90
2022-01-26 14:18:46.085 | DEBUG    | __main__:trials:24 - Trial = 28713/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.086 | DEBUG    | __main__:trials:29 - Trial = 28713/30000 | Total reward = 34.02
2022-01-26 14:18:46.089 | DEBUG    | __main__:trials:24 - Trial = 28714/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.090 | DEBUG    | __main__:trials:29 - Trial = 28714/30000 | Total reward = 37.83
2022-01-26 14:18:46.093 | DEBUG    | __main__:trials:24 - Trial = 28715/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.094 | DEBUG    | __main__:trials:29 - Trial = 28715/30000 | Total reward = 34.17
2022-01-26 14:18:46.098 | DEBUG    | __main__:trials:24 - Trial = 28716/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.099 | DEBUG    | __main__:trials:29 - Trial = 28716/30000 | Total reward = 51.70
2022-01-26 14:18:46.102 | DEBUG    | __main__:trials:24 - Trial = 28717/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.103 | DEBUG    | __main__:trials:29 - Trial = 28717/30000 | Total reward = 32.89
2022-01-26 14:18:46.106 | DEBUG    | __main__:trials:26 - Trial = 28718/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.107 | DEBUG    | __main__:trials:29 - Trial = 28718/30000 | Total reward = 17.21
2022-01-26 14:18:46.110 | DEBUG    | __main__:trials:26 - Trial = 28719/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.111 | DEBUG    | __main__:trials:29 - Trial = 28719/30000 | Total reward = 9.11
2022-01-26 14:18:46.115 | DEBUG    | __main__:trials:24 - Trial = 28720/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.117 | DEBUG    | __main__:trials:29 - Trial = 28720/30000 | Total reward = 37.86
2022-01-26 14:18:46.120 | DEBUG    | __main__:trials:24 - Trial = 28721/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.120 | DEBUG    | __main__:trials:29 - Trial = 28721/30000 | Total reward = 47.40
2022-01-26 14:18:46.124 | DEBUG    | __main__:trials:24 - Trial = 28722/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.125 | DEBUG    | __main__:trials:29 - Trial = 28722/30000 | Total reward = 35.81
2022-01-26 14:18:46.128 | DEBUG    | __main__:trials:24 - Trial = 28723/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.129 | DEBUG    | __main__:trials:29 - Trial = 28723/30000 | Total reward = 41.40
2022-01-26 14:18:46.133 | DEBUG    | __main__:trials:24 - Trial = 28724/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.133 | DEBUG    | __main__:trials:29 - Trial = 28724/30000 | Total reward = 32.10
2022-01-26 14:18:46.137 | DEBUG    | __main__:trials:24 - Trial = 28725/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.138 | DEBUG    | __main__:trials:29 - Trial = 28725/30000 | Total reward = 34.17
2022-01-26 14:18:46.141 | DEBUG    | __main__:trials:24 - Trial = 28726/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.142 | DEBUG    | __main__:trials:29 - Trial = 28726/30000 | Total reward = 27.29
2022-01-26 14:18:46.146 | DEBUG    | __main__:trials:24 - Trial = 28727/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.147 | DEBUG    | __main__:trials:29 - Trial = 28727/30000 | Total reward = 35.78
2022-01-26 14:18:46.150 | DEBUG    | __main__:trials:26 - Trial = 28728/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.151 | DEBUG    | __main__:trials:29 - Trial = 28728/30000 | Total reward = 27.11
2022-01-26 14:18:46.154 | DEBUG    | __main__:trials:24 - Trial = 28729/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.155 | DEBUG    | __main__:trials:29 - Trial = 28729/30000 | Total reward = 51.11
2022-01-26 14:18:46.158 | DEBUG    | __main__:trials:24 - Trial = 28730/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.159 | DEBUG    | __main__:trials:29 - Trial = 28730/30000 | Total reward = 28.96
2022-01-26 14:18:46.163 | DEBUG    | __main__:trials:24 - Trial = 28731/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.165 | DEBUG    | __main__:trials:29 - Trial = 28731/30000 | Total reward = 35.72
2022-01-26 14:18:46.168 | DEBUG    | __main__:trials:24 - Trial = 28732/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.168 | DEBUG    | __main__:trials:29 - Trial = 28732/30000 | Total reward = 34.37
2022-01-26 14:18:46.172 | DEBUG    | __main__:trials:24 - Trial = 28733/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.172 | DEBUG    | __main__:trials:29 - Trial = 28733/30000 | Total reward = 37.99
2022-01-26 14:18:46.175 | DEBUG    | __main__:trials:26 - Trial = 28734/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.176 | DEBUG    | __main__:trials:29 - Trial = 28734/30000 | Total reward = 10.11
2022-01-26 14:18:46.180 | DEBUG    | __main__:trials:24 - Trial = 28735/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.180 | DEBUG    | __main__:trials:29 - Trial = 28735/30000 | Total reward = 32.93
2022-01-26 14:18:46.183 | DEBUG    | __main__:trials:26 - Trial = 28736/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.184 | DEBUG    | __main__:trials:29 - Trial = 28736/30000 | Total reward = 22.74
2022-01-26 14:18:46.187 | DEBUG    | __main__:trials:26 - Trial = 28737/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.188 | DEBUG    | __main__:trials:29 - Trial = 28737/30000 | Total reward = 17.66
2022-01-26 14:18:46.191 | DEBUG    | __main__:trials:26 - Trial = 28738/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.191 | DEBUG    | __main__:trials:29 - Trial = 28738/30000 | Total reward = 8.02
2022-01-26 14:18:46.193 | DEBUG    | __main__:trials:26 - Trial = 28739/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.195 | DEBUG    | __main__:trials:29 - Trial = 28739/30000 | Total reward = 13.51
2022-01-26 14:18:46.198 | DEBUG    | __main__:trials:24 - Trial = 28740/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.199 | DEBUG    | __main__:trials:29 - Trial = 28740/30000 | Total reward = 37.93
2022-01-26 14:18:46.203 | DEBUG    | __main__:trials:24 - Trial = 28741/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.204 | DEBUG    | __main__:trials:29 - Trial = 28741/30000 | Total reward = 55.69
2022-01-26 14:18:46.207 | DEBUG    | __main__:trials:26 - Trial = 28742/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.208 | DEBUG    | __main__:trials:29 - Trial = 28742/30000 | Total reward = 20.66
2022-01-26 14:18:46.211 | DEBUG    | __main__:trials:24 - Trial = 28743/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.212 | DEBUG    | __main__:trials:29 - Trial = 28743/30000 | Total reward = 25.04
2022-01-26 14:18:46.215 | DEBUG    | __main__:trials:26 - Trial = 28744/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.216 | DEBUG    | __main__:trials:29 - Trial = 28744/30000 | Total reward = 17.75
2022-01-26 14:18:46.219 | DEBUG    | __main__:trials:24 - Trial = 28745/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.220 | DEBUG    | __main__:trials:29 - Trial = 28745/30000 | Total reward = 51.11
2022-01-26 14:18:46.223 | DEBUG    | __main__:trials:24 - Trial = 28746/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.224 | DEBUG    | __main__:trials:29 - Trial = 28746/30000 | Total reward = 36.07
2022-01-26 14:18:46.227 | DEBUG    | __main__:trials:24 - Trial = 28747/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.228 | DEBUG    | __main__:trials:29 - Trial = 28747/30000 | Total reward = 37.77
2022-01-26 14:18:46.232 | DEBUG    | __main__:trials:24 - Trial = 28748/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.233 | DEBUG    | __main__:trials:29 - Trial = 28748/30000 | Total reward = 46.03
2022-01-26 14:18:46.237 | DEBUG    | __main__:trials:24 - Trial = 28749/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.238 | DEBUG    | __main__:trials:29 - Trial = 28749/30000 | Total reward = 42.01
2022-01-26 14:18:46.241 | DEBUG    | __main__:trials:26 - Trial = 28750/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.242 | DEBUG    | __main__:trials:29 - Trial = 28750/30000 | Total reward = 16.28
2022-01-26 14:18:46.246 | DEBUG    | __main__:trials:24 - Trial = 28751/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.246 | DEBUG    | __main__:trials:29 - Trial = 28751/30000 | Total reward = 41.49
2022-01-26 14:18:46.250 | DEBUG    | __main__:trials:26 - Trial = 28752/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.251 | DEBUG    | __main__:trials:29 - Trial = 28752/30000 | Total reward = 12.12
2022-01-26 14:18:46.254 | DEBUG    | __main__:trials:26 - Trial = 28753/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.255 | DEBUG    | __main__:trials:29 - Trial = 28753/30000 | Total reward = 18.11
2022-01-26 14:18:46.258 | DEBUG    | __main__:trials:26 - Trial = 28754/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.259 | DEBUG    | __main__:trials:29 - Trial = 28754/30000 | Total reward = 14.74
2022-01-26 14:18:46.262 | DEBUG    | __main__:trials:24 - Trial = 28755/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.264 | DEBUG    | __main__:trials:29 - Trial = 28755/30000 | Total reward = 29.81
2022-01-26 14:18:46.267 | DEBUG    | __main__:trials:26 - Trial = 28756/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.268 | DEBUG    | __main__:trials:29 - Trial = 28756/30000 | Total reward = 23.77
2022-01-26 14:18:46.272 | DEBUG    | __main__:trials:24 - Trial = 28757/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.273 | DEBUG    | __main__:trials:29 - Trial = 28757/30000 | Total reward = 29.03
2022-01-26 14:18:46.276 | DEBUG    | __main__:trials:26 - Trial = 28758/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.278 | DEBUG    | __main__:trials:29 - Trial = 28758/30000 | Total reward = 12.17
2022-01-26 14:18:46.281 | DEBUG    | __main__:trials:26 - Trial = 28759/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.282 | DEBUG    | __main__:trials:29 - Trial = 28759/30000 | Total reward = 16.32
2022-01-26 14:18:46.285 | DEBUG    | __main__:trials:26 - Trial = 28760/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.286 | DEBUG    | __main__:trials:29 - Trial = 28760/30000 | Total reward = 16.54
2022-01-26 14:18:46.289 | DEBUG    | __main__:trials:24 - Trial = 28761/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.290 | DEBUG    | __main__:trials:29 - Trial = 28761/30000 | Total reward = 47.24
2022-01-26 14:18:46.294 | DEBUG    | __main__:trials:24 - Trial = 28762/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.296 | DEBUG    | __main__:trials:29 - Trial = 28762/30000 | Total reward = 31.27
2022-01-26 14:18:46.298 | DEBUG    | __main__:trials:26 - Trial = 28763/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.300 | DEBUG    | __main__:trials:29 - Trial = 28763/30000 | Total reward = 20.84
2022-01-26 14:18:46.303 | DEBUG    | __main__:trials:26 - Trial = 28764/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.304 | DEBUG    | __main__:trials:29 - Trial = 28764/30000 | Total reward = 22.00
2022-01-26 14:18:46.306 | DEBUG    | __main__:trials:26 - Trial = 28765/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.308 | DEBUG    | __main__:trials:29 - Trial = 28765/30000 | Total reward = 17.61
2022-01-26 14:18:46.311 | DEBUG    | __main__:trials:26 - Trial = 28766/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.313 | DEBUG    | __main__:trials:29 - Trial = 28766/30000 | Total reward = 22.62
2022-01-26 14:18:46.315 | DEBUG    | __main__:trials:26 - Trial = 28767/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.316 | DEBUG    | __main__:trials:29 - Trial = 28767/30000 | Total reward = 13.65
2022-01-26 14:18:46.320 | DEBUG    | __main__:trials:24 - Trial = 28768/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.321 | DEBUG    | __main__:trials:29 - Trial = 28768/30000 | Total reward = 50.75
2022-01-26 14:18:46.324 | DEBUG    | __main__:trials:26 - Trial = 28769/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.325 | DEBUG    | __main__:trials:29 - Trial = 28769/30000 | Total reward = 20.66
2022-01-26 14:18:46.328 | DEBUG    | __main__:trials:24 - Trial = 28770/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.329 | DEBUG    | __main__:trials:29 - Trial = 28770/30000 | Total reward = 32.24
2022-01-26 14:18:46.332 | DEBUG    | __main__:trials:24 - Trial = 28771/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.334 | DEBUG    | __main__:trials:29 - Trial = 28771/30000 | Total reward = 38.44
2022-01-26 14:18:46.337 | DEBUG    | __main__:trials:24 - Trial = 28772/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.339 | DEBUG    | __main__:trials:29 - Trial = 28772/30000 | Total reward = 37.35
2022-01-26 14:18:46.342 | DEBUG    | __main__:trials:24 - Trial = 28773/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.344 | DEBUG    | __main__:trials:29 - Trial = 28773/30000 | Total reward = 47.70
2022-01-26 14:18:46.348 | DEBUG    | __main__:trials:24 - Trial = 28774/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.349 | DEBUG    | __main__:trials:29 - Trial = 28774/30000 | Total reward = 38.10
2022-01-26 14:18:46.353 | DEBUG    | __main__:trials:24 - Trial = 28775/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.354 | DEBUG    | __main__:trials:29 - Trial = 28775/30000 | Total reward = 45.18
2022-01-26 14:18:46.358 | DEBUG    | __main__:trials:24 - Trial = 28776/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.359 | DEBUG    | __main__:trials:29 - Trial = 28776/30000 | Total reward = 36.24
2022-01-26 14:18:46.363 | DEBUG    | __main__:trials:24 - Trial = 28777/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.364 | DEBUG    | __main__:trials:29 - Trial = 28777/30000 | Total reward = 37.38
2022-01-26 14:18:46.368 | DEBUG    | __main__:trials:24 - Trial = 28778/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.369 | DEBUG    | __main__:trials:29 - Trial = 28778/30000 | Total reward = 45.91
2022-01-26 14:18:46.373 | DEBUG    | __main__:trials:26 - Trial = 28779/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.374 | DEBUG    | __main__:trials:29 - Trial = 28779/30000 | Total reward = 21.34
2022-01-26 14:18:46.378 | DEBUG    | __main__:trials:24 - Trial = 28780/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.379 | DEBUG    | __main__:trials:29 - Trial = 28780/30000 | Total reward = 36.63
2022-01-26 14:18:46.383 | DEBUG    | __main__:trials:24 - Trial = 28781/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.384 | DEBUG    | __main__:trials:29 - Trial = 28781/30000 | Total reward = 32.80
2022-01-26 14:18:46.387 | DEBUG    | __main__:trials:24 - Trial = 28782/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.389 | DEBUG    | __main__:trials:29 - Trial = 28782/30000 | Total reward = 35.79
2022-01-26 14:18:46.392 | DEBUG    | __main__:trials:24 - Trial = 28783/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.394 | DEBUG    | __main__:trials:29 - Trial = 28783/30000 | Total reward = 39.58
2022-01-26 14:18:46.397 | DEBUG    | __main__:trials:24 - Trial = 28784/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.399 | DEBUG    | __main__:trials:29 - Trial = 28784/30000 | Total reward = 36.66
2022-01-26 14:18:46.402 | DEBUG    | __main__:trials:24 - Trial = 28785/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.404 | DEBUG    | __main__:trials:29 - Trial = 28785/30000 | Total reward = 45.75
2022-01-26 14:18:46.406 | DEBUG    | __main__:trials:26 - Trial = 28786/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.407 | DEBUG    | __main__:trials:29 - Trial = 28786/30000 | Total reward = 12.14
2022-01-26 14:18:46.410 | DEBUG    | __main__:trials:26 - Trial = 28787/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.412 | DEBUG    | __main__:trials:29 - Trial = 28787/30000 | Total reward = 17.61
2022-01-26 14:18:46.416 | DEBUG    | __main__:trials:24 - Trial = 28788/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.417 | DEBUG    | __main__:trials:29 - Trial = 28788/30000 | Total reward = 36.49
2022-01-26 14:18:46.421 | DEBUG    | __main__:trials:24 - Trial = 28789/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.422 | DEBUG    | __main__:trials:29 - Trial = 28789/30000 | Total reward = 36.15
2022-01-26 14:18:46.426 | DEBUG    | __main__:trials:24 - Trial = 28790/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.427 | DEBUG    | __main__:trials:29 - Trial = 28790/30000 | Total reward = 52.44
2022-01-26 14:18:46.431 | DEBUG    | __main__:trials:24 - Trial = 28791/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.432 | DEBUG    | __main__:trials:29 - Trial = 28791/30000 | Total reward = 38.28
2022-01-26 14:18:46.436 | DEBUG    | __main__:trials:24 - Trial = 28792/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.437 | DEBUG    | __main__:trials:29 - Trial = 28792/30000 | Total reward = 34.70
2022-01-26 14:18:46.440 | DEBUG    | __main__:trials:24 - Trial = 28793/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.442 | DEBUG    | __main__:trials:29 - Trial = 28793/30000 | Total reward = 34.74
2022-01-26 14:18:46.446 | DEBUG    | __main__:trials:24 - Trial = 28794/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.446 | DEBUG    | __main__:trials:29 - Trial = 28794/30000 | Total reward = 37.88
2022-01-26 14:18:46.451 | DEBUG    | __main__:trials:24 - Trial = 28795/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.452 | DEBUG    | __main__:trials:29 - Trial = 28795/30000 | Total reward = 35.06
2022-01-26 14:18:46.456 | DEBUG    | __main__:trials:24 - Trial = 28796/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.457 | DEBUG    | __main__:trials:29 - Trial = 28796/30000 | Total reward = 45.91
2022-01-26 14:18:46.461 | DEBUG    | __main__:trials:24 - Trial = 28797/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.462 | DEBUG    | __main__:trials:29 - Trial = 28797/30000 | Total reward = 55.34
2022-01-26 14:18:46.466 | DEBUG    | __main__:trials:24 - Trial = 28798/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.467 | DEBUG    | __main__:trials:29 - Trial = 28798/30000 | Total reward = 44.76
2022-01-26 14:18:46.471 | DEBUG    | __main__:trials:24 - Trial = 28799/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.472 | DEBUG    | __main__:trials:29 - Trial = 28799/30000 | Total reward = 49.08
2022-01-26 14:18:46.476 | DEBUG    | __main__:trials:24 - Trial = 28800/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.478 | DEBUG    | __main__:trials:29 - Trial = 28800/30000 | Total reward = 34.17
2022-01-26 14:18:46.480 | DEBUG    | __main__:trials:26 - Trial = 28801/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.481 | DEBUG    | __main__:trials:29 - Trial = 28801/30000 | Total reward = 14.18
2022-01-26 14:18:46.484 | DEBUG    | __main__:trials:26 - Trial = 28802/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.486 | DEBUG    | __main__:trials:29 - Trial = 28802/30000 | Total reward = 12.14
2022-01-26 14:18:46.488 | DEBUG    | __main__:trials:26 - Trial = 28803/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.489 | DEBUG    | __main__:trials:29 - Trial = 28803/30000 | Total reward = 7.77
2022-01-26 14:18:46.492 | DEBUG    | __main__:trials:26 - Trial = 28804/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.494 | DEBUG    | __main__:trials:29 - Trial = 28804/30000 | Total reward = 26.62
2022-01-26 14:18:46.497 | DEBUG    | __main__:trials:26 - Trial = 28805/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.499 | DEBUG    | __main__:trials:29 - Trial = 28805/30000 | Total reward = 22.72
2022-01-26 14:18:46.502 | DEBUG    | __main__:trials:26 - Trial = 28806/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.503 | DEBUG    | __main__:trials:29 - Trial = 28806/30000 | Total reward = 16.41
2022-01-26 14:18:46.507 | DEBUG    | __main__:trials:24 - Trial = 28807/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.507 | DEBUG    | __main__:trials:29 - Trial = 28807/30000 | Total reward = 48.80
2022-01-26 14:18:46.511 | DEBUG    | __main__:trials:26 - Trial = 28808/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.512 | DEBUG    | __main__:trials:29 - Trial = 28808/30000 | Total reward = 17.61
2022-01-26 14:18:46.516 | DEBUG    | __main__:trials:24 - Trial = 28809/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.517 | DEBUG    | __main__:trials:29 - Trial = 28809/30000 | Total reward = 56.94
2022-01-26 14:18:46.520 | DEBUG    | __main__:trials:26 - Trial = 28810/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.521 | DEBUG    | __main__:trials:29 - Trial = 28810/30000 | Total reward = 21.32
2022-01-26 14:18:46.524 | DEBUG    | __main__:trials:24 - Trial = 28811/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.525 | DEBUG    | __main__:trials:29 - Trial = 28811/30000 | Total reward = 35.88
2022-01-26 14:18:46.528 | DEBUG    | __main__:trials:24 - Trial = 28812/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.530 | DEBUG    | __main__:trials:29 - Trial = 28812/30000 | Total reward = 24.71
2022-01-26 14:18:46.533 | DEBUG    | __main__:trials:26 - Trial = 28813/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.534 | DEBUG    | __main__:trials:29 - Trial = 28813/30000 | Total reward = 18.09
2022-01-26 14:18:46.537 | DEBUG    | __main__:trials:26 - Trial = 28814/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.538 | DEBUG    | __main__:trials:29 - Trial = 28814/30000 | Total reward = 22.14
2022-01-26 14:18:46.541 | DEBUG    | __main__:trials:26 - Trial = 28815/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.543 | DEBUG    | __main__:trials:29 - Trial = 28815/30000 | Total reward = 9.47
2022-01-26 14:18:46.547 | DEBUG    | __main__:trials:24 - Trial = 28816/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.547 | DEBUG    | __main__:trials:29 - Trial = 28816/30000 | Total reward = 25.48
2022-01-26 14:18:46.552 | DEBUG    | __main__:trials:24 - Trial = 28817/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.554 | DEBUG    | __main__:trials:29 - Trial = 28817/30000 | Total reward = 22.17
2022-01-26 14:18:46.557 | DEBUG    | __main__:trials:24 - Trial = 28818/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.558 | DEBUG    | __main__:trials:29 - Trial = 28818/30000 | Total reward = 31.27
2022-01-26 14:18:46.562 | DEBUG    | __main__:trials:26 - Trial = 28819/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.564 | DEBUG    | __main__:trials:29 - Trial = 28819/30000 | Total reward = 25.32
2022-01-26 14:18:46.566 | DEBUG    | __main__:trials:24 - Trial = 28820/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.568 | DEBUG    | __main__:trials:29 - Trial = 28820/30000 | Total reward = 37.54
2022-01-26 14:18:46.571 | DEBUG    | __main__:trials:24 - Trial = 28821/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.573 | DEBUG    | __main__:trials:29 - Trial = 28821/30000 | Total reward = 38.57
2022-01-26 14:18:46.576 | DEBUG    | __main__:trials:24 - Trial = 28822/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.577 | DEBUG    | __main__:trials:29 - Trial = 28822/30000 | Total reward = 39.01
2022-01-26 14:18:46.580 | DEBUG    | __main__:trials:24 - Trial = 28823/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.582 | DEBUG    | __main__:trials:29 - Trial = 28823/30000 | Total reward = 51.54
2022-01-26 14:18:46.586 | DEBUG    | __main__:trials:24 - Trial = 28824/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.587 | DEBUG    | __main__:trials:29 - Trial = 28824/30000 | Total reward = 33.71
2022-01-26 14:18:46.590 | DEBUG    | __main__:trials:26 - Trial = 28825/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.591 | DEBUG    | __main__:trials:29 - Trial = 28825/30000 | Total reward = 28.54
2022-01-26 14:18:46.595 | DEBUG    | __main__:trials:26 - Trial = 28826/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.596 | DEBUG    | __main__:trials:29 - Trial = 28826/30000 | Total reward = 31.57
2022-01-26 14:18:46.599 | DEBUG    | __main__:trials:24 - Trial = 28827/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.601 | DEBUG    | __main__:trials:29 - Trial = 28827/30000 | Total reward = 42.17
2022-01-26 14:18:46.604 | DEBUG    | __main__:trials:26 - Trial = 28828/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.605 | DEBUG    | __main__:trials:29 - Trial = 28828/30000 | Total reward = 31.59
2022-01-26 14:18:46.609 | DEBUG    | __main__:trials:24 - Trial = 28829/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.610 | DEBUG    | __main__:trials:29 - Trial = 28829/30000 | Total reward = 50.08
2022-01-26 14:18:46.614 | DEBUG    | __main__:trials:24 - Trial = 28830/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.616 | DEBUG    | __main__:trials:29 - Trial = 28830/30000 | Total reward = 46.00
2022-01-26 14:18:46.619 | DEBUG    | __main__:trials:26 - Trial = 28831/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.621 | DEBUG    | __main__:trials:29 - Trial = 28831/30000 | Total reward = 22.29
2022-01-26 14:18:46.624 | DEBUG    | __main__:trials:24 - Trial = 28832/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.626 | DEBUG    | __main__:trials:29 - Trial = 28832/30000 | Total reward = 40.16
2022-01-26 14:18:46.630 | DEBUG    | __main__:trials:24 - Trial = 28833/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.631 | DEBUG    | __main__:trials:29 - Trial = 28833/30000 | Total reward = 38.49
2022-01-26 14:18:46.635 | DEBUG    | __main__:trials:24 - Trial = 28834/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.636 | DEBUG    | __main__:trials:29 - Trial = 28834/30000 | Total reward = 52.81
2022-01-26 14:18:46.639 | DEBUG    | __main__:trials:24 - Trial = 28835/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.641 | DEBUG    | __main__:trials:29 - Trial = 28835/30000 | Total reward = 46.36
2022-01-26 14:18:46.644 | DEBUG    | __main__:trials:24 - Trial = 28836/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.646 | DEBUG    | __main__:trials:29 - Trial = 28836/30000 | Total reward = 33.99
2022-01-26 14:18:46.649 | DEBUG    | __main__:trials:24 - Trial = 28837/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.650 | DEBUG    | __main__:trials:29 - Trial = 28837/30000 | Total reward = 38.55
2022-01-26 14:18:46.653 | DEBUG    | __main__:trials:24 - Trial = 28838/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.654 | DEBUG    | __main__:trials:29 - Trial = 28838/30000 | Total reward = 50.53
2022-01-26 14:18:46.658 | DEBUG    | __main__:trials:24 - Trial = 28839/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.660 | DEBUG    | __main__:trials:29 - Trial = 28839/30000 | Total reward = 40.25
2022-01-26 14:18:46.663 | DEBUG    | __main__:trials:24 - Trial = 28840/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.664 | DEBUG    | __main__:trials:29 - Trial = 28840/30000 | Total reward = 43.33
2022-01-26 14:18:46.668 | DEBUG    | __main__:trials:24 - Trial = 28841/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.670 | DEBUG    | __main__:trials:29 - Trial = 28841/30000 | Total reward = 57.73
2022-01-26 14:18:46.673 | DEBUG    | __main__:trials:24 - Trial = 28842/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.675 | DEBUG    | __main__:trials:29 - Trial = 28842/30000 | Total reward = 45.55
2022-01-26 14:18:46.678 | DEBUG    | __main__:trials:24 - Trial = 28843/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.680 | DEBUG    | __main__:trials:29 - Trial = 28843/30000 | Total reward = 38.01
2022-01-26 14:18:46.683 | DEBUG    | __main__:trials:24 - Trial = 28844/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.684 | DEBUG    | __main__:trials:29 - Trial = 28844/30000 | Total reward = 37.48
2022-01-26 14:18:46.688 | DEBUG    | __main__:trials:26 - Trial = 28845/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.690 | DEBUG    | __main__:trials:29 - Trial = 28845/30000 | Total reward = 29.52
2022-01-26 14:18:46.693 | DEBUG    | __main__:trials:24 - Trial = 28846/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.694 | DEBUG    | __main__:trials:29 - Trial = 28846/30000 | Total reward = 40.94
2022-01-26 14:18:46.698 | DEBUG    | __main__:trials:24 - Trial = 28847/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.699 | DEBUG    | __main__:trials:29 - Trial = 28847/30000 | Total reward = 46.12
2022-01-26 14:18:46.704 | DEBUG    | __main__:trials:24 - Trial = 28848/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.704 | DEBUG    | __main__:trials:29 - Trial = 28848/30000 | Total reward = 50.04
2022-01-26 14:18:46.708 | DEBUG    | __main__:trials:26 - Trial = 28849/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.709 | DEBUG    | __main__:trials:29 - Trial = 28849/30000 | Total reward = 18.58
2022-01-26 14:18:46.713 | DEBUG    | __main__:trials:24 - Trial = 28850/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.714 | DEBUG    | __main__:trials:29 - Trial = 28850/30000 | Total reward = 47.01
2022-01-26 14:18:46.718 | DEBUG    | __main__:trials:24 - Trial = 28851/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.720 | DEBUG    | __main__:trials:29 - Trial = 28851/30000 | Total reward = 40.03
2022-01-26 14:18:46.723 | DEBUG    | __main__:trials:24 - Trial = 28852/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.724 | DEBUG    | __main__:trials:29 - Trial = 28852/30000 | Total reward = 30.82
2022-01-26 14:18:46.728 | DEBUG    | __main__:trials:24 - Trial = 28853/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.730 | DEBUG    | __main__:trials:29 - Trial = 28853/30000 | Total reward = 34.06
2022-01-26 14:18:46.733 | DEBUG    | __main__:trials:24 - Trial = 28854/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.734 | DEBUG    | __main__:trials:29 - Trial = 28854/30000 | Total reward = 47.11
2022-01-26 14:18:46.738 | DEBUG    | __main__:trials:26 - Trial = 28855/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.739 | DEBUG    | __main__:trials:29 - Trial = 28855/30000 | Total reward = 28.17
2022-01-26 14:18:46.743 | DEBUG    | __main__:trials:26 - Trial = 28856/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.744 | DEBUG    | __main__:trials:29 - Trial = 28856/30000 | Total reward = 15.25
2022-01-26 14:18:46.748 | DEBUG    | __main__:trials:24 - Trial = 28857/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.749 | DEBUG    | __main__:trials:29 - Trial = 28857/30000 | Total reward = 34.73
2022-01-26 14:18:46.752 | DEBUG    | __main__:trials:26 - Trial = 28858/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.753 | DEBUG    | __main__:trials:29 - Trial = 28858/30000 | Total reward = 23.37
2022-01-26 14:18:46.757 | DEBUG    | __main__:trials:24 - Trial = 28859/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.759 | DEBUG    | __main__:trials:29 - Trial = 28859/30000 | Total reward = 63.10
2022-01-26 14:18:46.762 | DEBUG    | __main__:trials:24 - Trial = 28860/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.763 | DEBUG    | __main__:trials:29 - Trial = 28860/30000 | Total reward = 33.64
2022-01-26 14:18:46.768 | DEBUG    | __main__:trials:24 - Trial = 28861/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.769 | DEBUG    | __main__:trials:29 - Trial = 28861/30000 | Total reward = 32.18
2022-01-26 14:18:46.772 | DEBUG    | __main__:trials:24 - Trial = 28862/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.774 | DEBUG    | __main__:trials:29 - Trial = 28862/30000 | Total reward = 45.79
2022-01-26 14:18:46.778 | DEBUG    | __main__:trials:24 - Trial = 28863/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.779 | DEBUG    | __main__:trials:29 - Trial = 28863/30000 | Total reward = 33.39
2022-01-26 14:18:46.782 | DEBUG    | __main__:trials:24 - Trial = 28864/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.783 | DEBUG    | __main__:trials:29 - Trial = 28864/30000 | Total reward = 45.97
2022-01-26 14:18:46.785 | DEBUG    | __main__:trials:26 - Trial = 28865/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.786 | DEBUG    | __main__:trials:29 - Trial = 28865/30000 | Total reward = 11.26
2022-01-26 14:18:46.790 | DEBUG    | __main__:trials:24 - Trial = 28866/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.792 | DEBUG    | __main__:trials:29 - Trial = 28866/30000 | Total reward = 32.24
2022-01-26 14:18:46.795 | DEBUG    | __main__:trials:24 - Trial = 28867/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.796 | DEBUG    | __main__:trials:29 - Trial = 28867/30000 | Total reward = 29.89
2022-01-26 14:18:46.800 | DEBUG    | __main__:trials:26 - Trial = 28868/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.801 | DEBUG    | __main__:trials:29 - Trial = 28868/30000 | Total reward = 13.91
2022-01-26 14:18:46.804 | DEBUG    | __main__:trials:26 - Trial = 28869/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.805 | DEBUG    | __main__:trials:29 - Trial = 28869/30000 | Total reward = 9.69
2022-01-26 14:18:46.808 | DEBUG    | __main__:trials:24 - Trial = 28870/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.810 | DEBUG    | __main__:trials:29 - Trial = 28870/30000 | Total reward = 30.99
2022-01-26 14:18:46.813 | DEBUG    | __main__:trials:26 - Trial = 28871/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.814 | DEBUG    | __main__:trials:29 - Trial = 28871/30000 | Total reward = 13.00
2022-01-26 14:18:46.817 | DEBUG    | __main__:trials:26 - Trial = 28872/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.818 | DEBUG    | __main__:trials:29 - Trial = 28872/30000 | Total reward = 11.06
2022-01-26 14:18:46.821 | DEBUG    | __main__:trials:24 - Trial = 28873/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.822 | DEBUG    | __main__:trials:29 - Trial = 28873/30000 | Total reward = 29.74
2022-01-26 14:18:46.825 | DEBUG    | __main__:trials:24 - Trial = 28874/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.827 | DEBUG    | __main__:trials:29 - Trial = 28874/30000 | Total reward = 36.18
2022-01-26 14:18:46.829 | DEBUG    | __main__:trials:24 - Trial = 28875/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.831 | DEBUG    | __main__:trials:29 - Trial = 28875/30000 | Total reward = 16.14
2022-01-26 14:18:46.833 | DEBUG    | __main__:trials:26 - Trial = 28876/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.835 | DEBUG    | __main__:trials:29 - Trial = 28876/30000 | Total reward = 12.72
2022-01-26 14:18:46.838 | DEBUG    | __main__:trials:26 - Trial = 28877/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.839 | DEBUG    | __main__:trials:29 - Trial = 28877/30000 | Total reward = 15.59
2022-01-26 14:18:46.842 | DEBUG    | __main__:trials:26 - Trial = 28878/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.843 | DEBUG    | __main__:trials:29 - Trial = 28878/30000 | Total reward = 15.96
2022-01-26 14:18:46.847 | DEBUG    | __main__:trials:24 - Trial = 28879/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.848 | DEBUG    | __main__:trials:29 - Trial = 28879/30000 | Total reward = 48.72
2022-01-26 14:18:46.852 | DEBUG    | __main__:trials:26 - Trial = 28880/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.853 | DEBUG    | __main__:trials:29 - Trial = 28880/30000 | Total reward = 17.12
2022-01-26 14:18:46.856 | DEBUG    | __main__:trials:26 - Trial = 28881/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.857 | DEBUG    | __main__:trials:29 - Trial = 28881/30000 | Total reward = 16.05
2022-01-26 14:18:46.860 | DEBUG    | __main__:trials:26 - Trial = 28882/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.861 | DEBUG    | __main__:trials:29 - Trial = 28882/30000 | Total reward = 15.03
2022-01-26 14:18:46.867 | DEBUG    | __main__:trials:26 - Trial = 28883/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.868 | DEBUG    | __main__:trials:29 - Trial = 28883/30000 | Total reward = 26.67
2022-01-26 14:18:46.872 | DEBUG    | __main__:trials:24 - Trial = 28884/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.873 | DEBUG    | __main__:trials:29 - Trial = 28884/30000 | Total reward = 30.71
2022-01-26 14:18:46.877 | DEBUG    | __main__:trials:24 - Trial = 28885/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.879 | DEBUG    | __main__:trials:29 - Trial = 28885/30000 | Total reward = 33.18
2022-01-26 14:18:46.882 | DEBUG    | __main__:trials:24 - Trial = 28886/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.884 | DEBUG    | __main__:trials:29 - Trial = 28886/30000 | Total reward = 31.25
2022-01-26 14:18:46.887 | DEBUG    | __main__:trials:24 - Trial = 28887/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.889 | DEBUG    | __main__:trials:29 - Trial = 28887/30000 | Total reward = 32.85
2022-01-26 14:18:46.892 | DEBUG    | __main__:trials:24 - Trial = 28888/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.894 | DEBUG    | __main__:trials:29 - Trial = 28888/30000 | Total reward = 25.79
2022-01-26 14:18:46.897 | DEBUG    | __main__:trials:26 - Trial = 28889/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.899 | DEBUG    | __main__:trials:29 - Trial = 28889/30000 | Total reward = 19.46
2022-01-26 14:18:46.902 | DEBUG    | __main__:trials:24 - Trial = 28890/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.904 | DEBUG    | __main__:trials:29 - Trial = 28890/30000 | Total reward = 37.45
2022-01-26 14:18:46.907 | DEBUG    | __main__:trials:24 - Trial = 28891/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.909 | DEBUG    | __main__:trials:29 - Trial = 28891/30000 | Total reward = 46.80
2022-01-26 14:18:46.912 | DEBUG    | __main__:trials:24 - Trial = 28892/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.913 | DEBUG    | __main__:trials:29 - Trial = 28892/30000 | Total reward = 35.84
2022-01-26 14:18:46.917 | DEBUG    | __main__:trials:24 - Trial = 28893/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.918 | DEBUG    | __main__:trials:29 - Trial = 28893/30000 | Total reward = 29.54
2022-01-26 14:18:46.922 | DEBUG    | __main__:trials:24 - Trial = 28894/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.923 | DEBUG    | __main__:trials:29 - Trial = 28894/30000 | Total reward = 43.39
2022-01-26 14:18:46.927 | DEBUG    | __main__:trials:24 - Trial = 28895/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.929 | DEBUG    | __main__:trials:29 - Trial = 28895/30000 | Total reward = 50.58
2022-01-26 14:18:46.932 | DEBUG    | __main__:trials:24 - Trial = 28896/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.934 | DEBUG    | __main__:trials:29 - Trial = 28896/30000 | Total reward = 34.23
2022-01-26 14:18:46.937 | DEBUG    | __main__:trials:24 - Trial = 28897/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.938 | DEBUG    | __main__:trials:29 - Trial = 28897/30000 | Total reward = 33.85
2022-01-26 14:18:46.942 | DEBUG    | __main__:trials:24 - Trial = 28898/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.944 | DEBUG    | __main__:trials:29 - Trial = 28898/30000 | Total reward = 40.52
2022-01-26 14:18:46.947 | DEBUG    | __main__:trials:24 - Trial = 28899/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.948 | DEBUG    | __main__:trials:29 - Trial = 28899/30000 | Total reward = 35.70
2022-01-26 14:18:46.952 | DEBUG    | __main__:trials:24 - Trial = 28900/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.953 | DEBUG    | __main__:trials:29 - Trial = 28900/30000 | Total reward = 39.33
2022-01-26 14:18:46.957 | DEBUG    | __main__:trials:24 - Trial = 28901/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.958 | DEBUG    | __main__:trials:29 - Trial = 28901/30000 | Total reward = 34.99
2022-01-26 14:18:46.961 | DEBUG    | __main__:trials:24 - Trial = 28902/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.962 | DEBUG    | __main__:trials:29 - Trial = 28902/30000 | Total reward = 32.51
2022-01-26 14:18:46.966 | DEBUG    | __main__:trials:26 - Trial = 28903/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.967 | DEBUG    | __main__:trials:29 - Trial = 28903/30000 | Total reward = 13.08
2022-01-26 14:18:46.971 | DEBUG    | __main__:trials:26 - Trial = 28904/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.972 | DEBUG    | __main__:trials:29 - Trial = 28904/30000 | Total reward = 29.47
2022-01-26 14:18:46.975 | DEBUG    | __main__:trials:24 - Trial = 28905/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.977 | DEBUG    | __main__:trials:29 - Trial = 28905/30000 | Total reward = 39.81
2022-01-26 14:18:46.981 | DEBUG    | __main__:trials:26 - Trial = 28906/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.981 | DEBUG    | __main__:trials:29 - Trial = 28906/30000 | Total reward = 25.75
2022-01-26 14:18:46.984 | DEBUG    | __main__:trials:26 - Trial = 28907/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.986 | DEBUG    | __main__:trials:29 - Trial = 28907/30000 | Total reward = 16.03
2022-01-26 14:18:46.989 | DEBUG    | __main__:trials:26 - Trial = 28908/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:46.990 | DEBUG    | __main__:trials:29 - Trial = 28908/30000 | Total reward = 19.02
2022-01-26 14:18:46.994 | DEBUG    | __main__:trials:24 - Trial = 28909/30000 | Max number of steps (20) reached
2022-01-26 14:18:46.995 | DEBUG    | __main__:trials:29 - Trial = 28909/30000 | Total reward = 32.51
2022-01-26 14:18:46.999 | DEBUG    | __main__:trials:24 - Trial = 28910/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.000 | DEBUG    | __main__:trials:29 - Trial = 28910/30000 | Total reward = 43.85
2022-01-26 14:18:47.004 | DEBUG    | __main__:trials:24 - Trial = 28911/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.005 | DEBUG    | __main__:trials:29 - Trial = 28911/30000 | Total reward = 34.23
2022-01-26 14:18:47.009 | DEBUG    | __main__:trials:24 - Trial = 28912/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.009 | DEBUG    | __main__:trials:29 - Trial = 28912/30000 | Total reward = 34.28
2022-01-26 14:18:47.014 | DEBUG    | __main__:trials:24 - Trial = 28913/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.014 | DEBUG    | __main__:trials:29 - Trial = 28913/30000 | Total reward = 43.01
2022-01-26 14:18:47.018 | DEBUG    | __main__:trials:26 - Trial = 28914/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.018 | DEBUG    | __main__:trials:29 - Trial = 28914/30000 | Total reward = 12.23
2022-01-26 14:18:47.022 | DEBUG    | __main__:trials:26 - Trial = 28915/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.023 | DEBUG    | __main__:trials:29 - Trial = 28915/30000 | Total reward = 14.28
2022-01-26 14:18:47.026 | DEBUG    | __main__:trials:26 - Trial = 28916/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.028 | DEBUG    | __main__:trials:29 - Trial = 28916/30000 | Total reward = 10.06
2022-01-26 14:18:47.031 | DEBUG    | __main__:trials:24 - Trial = 28917/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.032 | DEBUG    | __main__:trials:29 - Trial = 28917/30000 | Total reward = 35.38
2022-01-26 14:18:47.036 | DEBUG    | __main__:trials:24 - Trial = 28918/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.038 | DEBUG    | __main__:trials:29 - Trial = 28918/30000 | Total reward = 29.44
2022-01-26 14:18:47.041 | DEBUG    | __main__:trials:24 - Trial = 28919/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.043 | DEBUG    | __main__:trials:29 - Trial = 28919/30000 | Total reward = 45.87
2022-01-26 14:18:47.046 | DEBUG    | __main__:trials:24 - Trial = 28920/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.047 | DEBUG    | __main__:trials:29 - Trial = 28920/30000 | Total reward = 32.51
2022-01-26 14:18:47.051 | DEBUG    | __main__:trials:26 - Trial = 28921/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.052 | DEBUG    | __main__:trials:29 - Trial = 28921/30000 | Total reward = 17.64
2022-01-26 14:18:47.055 | DEBUG    | __main__:trials:24 - Trial = 28922/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.057 | DEBUG    | __main__:trials:29 - Trial = 28922/30000 | Total reward = 45.76
2022-01-26 14:18:47.058 | DEBUG    | __main__:trials:26 - Trial = 28923/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.060 | DEBUG    | __main__:trials:29 - Trial = 28923/30000 | Total reward = 7.96
2022-01-26 14:18:47.064 | DEBUG    | __main__:trials:26 - Trial = 28924/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.065 | DEBUG    | __main__:trials:29 - Trial = 28924/30000 | Total reward = 21.94
2022-01-26 14:18:47.068 | DEBUG    | __main__:trials:26 - Trial = 28925/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.070 | DEBUG    | __main__:trials:29 - Trial = 28925/30000 | Total reward = 14.81
2022-01-26 14:18:47.073 | DEBUG    | __main__:trials:24 - Trial = 28926/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.075 | DEBUG    | __main__:trials:29 - Trial = 28926/30000 | Total reward = 35.56
2022-01-26 14:18:47.078 | DEBUG    | __main__:trials:24 - Trial = 28927/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.080 | DEBUG    | __main__:trials:29 - Trial = 28927/30000 | Total reward = 52.62
2022-01-26 14:18:47.083 | DEBUG    | __main__:trials:24 - Trial = 28928/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.085 | DEBUG    | __main__:trials:29 - Trial = 28928/30000 | Total reward = 32.88
2022-01-26 14:18:47.088 | DEBUG    | __main__:trials:26 - Trial = 28929/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.089 | DEBUG    | __main__:trials:29 - Trial = 28929/30000 | Total reward = 21.52
2022-01-26 14:18:47.093 | DEBUG    | __main__:trials:24 - Trial = 28930/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.094 | DEBUG    | __main__:trials:29 - Trial = 28930/30000 | Total reward = 45.07
2022-01-26 14:18:47.098 | DEBUG    | __main__:trials:24 - Trial = 28931/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.098 | DEBUG    | __main__:trials:29 - Trial = 28931/30000 | Total reward = 42.59
2022-01-26 14:18:47.103 | DEBUG    | __main__:trials:24 - Trial = 28932/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.104 | DEBUG    | __main__:trials:29 - Trial = 28932/30000 | Total reward = 47.79
2022-01-26 14:18:47.108 | DEBUG    | __main__:trials:24 - Trial = 28933/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.110 | DEBUG    | __main__:trials:29 - Trial = 28933/30000 | Total reward = 39.07
2022-01-26 14:18:47.113 | DEBUG    | __main__:trials:26 - Trial = 28934/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.114 | DEBUG    | __main__:trials:29 - Trial = 28934/30000 | Total reward = 23.89
2022-01-26 14:18:47.118 | DEBUG    | __main__:trials:24 - Trial = 28935/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.120 | DEBUG    | __main__:trials:29 - Trial = 28935/30000 | Total reward = 43.50
2022-01-26 14:18:47.123 | DEBUG    | __main__:trials:24 - Trial = 28936/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.125 | DEBUG    | __main__:trials:29 - Trial = 28936/30000 | Total reward = 34.61
2022-01-26 14:18:47.129 | DEBUG    | __main__:trials:24 - Trial = 28937/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.130 | DEBUG    | __main__:trials:29 - Trial = 28937/30000 | Total reward = 37.37
2022-01-26 14:18:47.133 | DEBUG    | __main__:trials:24 - Trial = 28938/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.134 | DEBUG    | __main__:trials:29 - Trial = 28938/30000 | Total reward = 35.14
2022-01-26 14:18:47.138 | DEBUG    | __main__:trials:24 - Trial = 28939/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.140 | DEBUG    | __main__:trials:29 - Trial = 28939/30000 | Total reward = 32.52
2022-01-26 14:18:47.142 | DEBUG    | __main__:trials:24 - Trial = 28940/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.144 | DEBUG    | __main__:trials:29 - Trial = 28940/30000 | Total reward = 31.92
2022-01-26 14:18:47.148 | DEBUG    | __main__:trials:24 - Trial = 28941/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.149 | DEBUG    | __main__:trials:29 - Trial = 28941/30000 | Total reward = 38.99
2022-01-26 14:18:47.153 | DEBUG    | __main__:trials:24 - Trial = 28942/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.153 | DEBUG    | __main__:trials:29 - Trial = 28942/30000 | Total reward = 45.79
2022-01-26 14:18:47.157 | DEBUG    | __main__:trials:26 - Trial = 28943/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.158 | DEBUG    | __main__:trials:29 - Trial = 28943/30000 | Total reward = 11.06
2022-01-26 14:18:47.161 | DEBUG    | __main__:trials:26 - Trial = 28944/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.162 | DEBUG    | __main__:trials:29 - Trial = 28944/30000 | Total reward = 24.36
2022-01-26 14:18:47.167 | DEBUG    | __main__:trials:24 - Trial = 28945/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.168 | DEBUG    | __main__:trials:29 - Trial = 28945/30000 | Total reward = 42.68
2022-01-26 14:18:47.172 | DEBUG    | __main__:trials:24 - Trial = 28946/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.173 | DEBUG    | __main__:trials:29 - Trial = 28946/30000 | Total reward = 42.88
2022-01-26 14:18:47.177 | DEBUG    | __main__:trials:24 - Trial = 28947/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.178 | DEBUG    | __main__:trials:29 - Trial = 28947/30000 | Total reward = 33.82
2022-01-26 14:18:47.182 | DEBUG    | __main__:trials:24 - Trial = 28948/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.183 | DEBUG    | __main__:trials:29 - Trial = 28948/30000 | Total reward = 42.98
2022-01-26 14:18:47.186 | DEBUG    | __main__:trials:26 - Trial = 28949/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.187 | DEBUG    | __main__:trials:29 - Trial = 28949/30000 | Total reward = 10.11
2022-01-26 14:18:47.191 | DEBUG    | __main__:trials:24 - Trial = 28950/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.192 | DEBUG    | __main__:trials:29 - Trial = 28950/30000 | Total reward = 42.35
2022-01-26 14:18:47.196 | DEBUG    | __main__:trials:24 - Trial = 28951/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.198 | DEBUG    | __main__:trials:29 - Trial = 28951/30000 | Total reward = 30.27
2022-01-26 14:18:47.201 | DEBUG    | __main__:trials:24 - Trial = 28952/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.203 | DEBUG    | __main__:trials:29 - Trial = 28952/30000 | Total reward = 32.53
2022-01-26 14:18:47.206 | DEBUG    | __main__:trials:24 - Trial = 28953/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.207 | DEBUG    | __main__:trials:29 - Trial = 28953/30000 | Total reward = 34.68
2022-01-26 14:18:47.210 | DEBUG    | __main__:trials:24 - Trial = 28954/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.212 | DEBUG    | __main__:trials:29 - Trial = 28954/30000 | Total reward = 32.51
2022-01-26 14:18:47.216 | DEBUG    | __main__:trials:24 - Trial = 28955/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.217 | DEBUG    | __main__:trials:29 - Trial = 28955/30000 | Total reward = 44.40
2022-01-26 14:18:47.220 | DEBUG    | __main__:trials:26 - Trial = 28956/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.222 | DEBUG    | __main__:trials:29 - Trial = 28956/30000 | Total reward = 28.34
2022-01-26 14:18:47.225 | DEBUG    | __main__:trials:24 - Trial = 28957/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.227 | DEBUG    | __main__:trials:29 - Trial = 28957/30000 | Total reward = 42.48
2022-01-26 14:18:47.230 | DEBUG    | __main__:trials:24 - Trial = 28958/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.231 | DEBUG    | __main__:trials:29 - Trial = 28958/30000 | Total reward = 31.07
2022-01-26 14:18:47.234 | DEBUG    | __main__:trials:24 - Trial = 28959/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.236 | DEBUG    | __main__:trials:29 - Trial = 28959/30000 | Total reward = 39.19
2022-01-26 14:18:47.239 | DEBUG    | __main__:trials:24 - Trial = 28960/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.241 | DEBUG    | __main__:trials:29 - Trial = 28960/30000 | Total reward = 51.41
2022-01-26 14:18:47.245 | DEBUG    | __main__:trials:24 - Trial = 28961/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.246 | DEBUG    | __main__:trials:29 - Trial = 28961/30000 | Total reward = 62.76
2022-01-26 14:18:47.250 | DEBUG    | __main__:trials:24 - Trial = 28962/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.252 | DEBUG    | __main__:trials:29 - Trial = 28962/30000 | Total reward = 42.20
2022-01-26 14:18:47.255 | DEBUG    | __main__:trials:24 - Trial = 28963/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.257 | DEBUG    | __main__:trials:29 - Trial = 28963/30000 | Total reward = 34.37
2022-01-26 14:18:47.260 | DEBUG    | __main__:trials:24 - Trial = 28964/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.262 | DEBUG    | __main__:trials:29 - Trial = 28964/30000 | Total reward = 38.45
2022-01-26 14:18:47.266 | DEBUG    | __main__:trials:24 - Trial = 28965/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.267 | DEBUG    | __main__:trials:29 - Trial = 28965/30000 | Total reward = 36.14
2022-01-26 14:18:47.271 | DEBUG    | __main__:trials:24 - Trial = 28966/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.272 | DEBUG    | __main__:trials:29 - Trial = 28966/30000 | Total reward = 42.67
2022-01-26 14:18:47.276 | DEBUG    | __main__:trials:24 - Trial = 28967/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.277 | DEBUG    | __main__:trials:29 - Trial = 28967/30000 | Total reward = 35.34
2022-01-26 14:18:47.280 | DEBUG    | __main__:trials:26 - Trial = 28968/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.282 | DEBUG    | __main__:trials:29 - Trial = 28968/30000 | Total reward = 23.48
2022-01-26 14:18:47.285 | DEBUG    | __main__:trials:24 - Trial = 28969/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.286 | DEBUG    | __main__:trials:29 - Trial = 28969/30000 | Total reward = 38.37
2022-01-26 14:18:47.291 | DEBUG    | __main__:trials:24 - Trial = 28970/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.291 | DEBUG    | __main__:trials:29 - Trial = 28970/30000 | Total reward = 41.19
2022-01-26 14:18:47.295 | DEBUG    | __main__:trials:24 - Trial = 28971/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.297 | DEBUG    | __main__:trials:29 - Trial = 28971/30000 | Total reward = 44.35
2022-01-26 14:18:47.300 | DEBUG    | __main__:trials:26 - Trial = 28972/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.301 | DEBUG    | __main__:trials:29 - Trial = 28972/30000 | Total reward = 25.07
2022-01-26 14:18:47.305 | DEBUG    | __main__:trials:26 - Trial = 28973/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.306 | DEBUG    | __main__:trials:29 - Trial = 28973/30000 | Total reward = 22.70
2022-01-26 14:18:47.309 | DEBUG    | __main__:trials:26 - Trial = 28974/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.311 | DEBUG    | __main__:trials:29 - Trial = 28974/30000 | Total reward = 12.12
2022-01-26 14:18:47.314 | DEBUG    | __main__:trials:26 - Trial = 28975/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.316 | DEBUG    | __main__:trials:29 - Trial = 28975/30000 | Total reward = 23.90
2022-01-26 14:18:47.320 | DEBUG    | __main__:trials:24 - Trial = 28976/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.321 | DEBUG    | __main__:trials:29 - Trial = 28976/30000 | Total reward = 51.69
2022-01-26 14:18:47.324 | DEBUG    | __main__:trials:24 - Trial = 28977/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.326 | DEBUG    | __main__:trials:29 - Trial = 28977/30000 | Total reward = 34.19
2022-01-26 14:18:47.330 | DEBUG    | __main__:trials:26 - Trial = 28978/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.330 | DEBUG    | __main__:trials:29 - Trial = 28978/30000 | Total reward = 28.71
2022-01-26 14:18:47.334 | DEBUG    | __main__:trials:24 - Trial = 28979/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.336 | DEBUG    | __main__:trials:29 - Trial = 28979/30000 | Total reward = 51.11
2022-01-26 14:18:47.339 | DEBUG    | __main__:trials:24 - Trial = 28980/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.341 | DEBUG    | __main__:trials:29 - Trial = 28980/30000 | Total reward = 40.31
2022-01-26 14:18:47.344 | DEBUG    | __main__:trials:26 - Trial = 28981/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.345 | DEBUG    | __main__:trials:29 - Trial = 28981/30000 | Total reward = 24.69
2022-01-26 14:18:47.348 | DEBUG    | __main__:trials:26 - Trial = 28982/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.349 | DEBUG    | __main__:trials:29 - Trial = 28982/30000 | Total reward = 15.71
2022-01-26 14:18:47.351 | DEBUG    | __main__:trials:26 - Trial = 28983/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.352 | DEBUG    | __main__:trials:29 - Trial = 28983/30000 | Total reward = 11.06
2022-01-26 14:18:47.356 | DEBUG    | __main__:trials:24 - Trial = 28984/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.356 | DEBUG    | __main__:trials:29 - Trial = 28984/30000 | Total reward = 34.34
2022-01-26 14:18:47.359 | DEBUG    | __main__:trials:26 - Trial = 28985/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.359 | DEBUG    | __main__:trials:29 - Trial = 28985/30000 | Total reward = 14.93
2022-01-26 14:18:47.363 | DEBUG    | __main__:trials:24 - Trial = 28986/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.365 | DEBUG    | __main__:trials:29 - Trial = 28986/30000 | Total reward = 40.01
2022-01-26 14:18:47.368 | DEBUG    | __main__:trials:24 - Trial = 28987/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.369 | DEBUG    | __main__:trials:29 - Trial = 28987/30000 | Total reward = 44.03
2022-01-26 14:18:47.371 | DEBUG    | __main__:trials:26 - Trial = 28988/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.373 | DEBUG    | __main__:trials:29 - Trial = 28988/30000 | Total reward = 13.14
2022-01-26 14:18:47.376 | DEBUG    | __main__:trials:24 - Trial = 28989/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.378 | DEBUG    | __main__:trials:29 - Trial = 28989/30000 | Total reward = 48.29
2022-01-26 14:18:47.380 | DEBUG    | __main__:trials:26 - Trial = 28990/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.382 | DEBUG    | __main__:trials:29 - Trial = 28990/30000 | Total reward = 23.16
2022-01-26 14:18:47.385 | DEBUG    | __main__:trials:24 - Trial = 28991/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.386 | DEBUG    | __main__:trials:29 - Trial = 28991/30000 | Total reward = 38.38
2022-01-26 14:18:47.390 | DEBUG    | __main__:trials:24 - Trial = 28992/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.390 | DEBUG    | __main__:trials:29 - Trial = 28992/30000 | Total reward = 32.89
2022-01-26 14:18:47.394 | DEBUG    | __main__:trials:24 - Trial = 28993/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.396 | DEBUG    | __main__:trials:29 - Trial = 28993/30000 | Total reward = 32.51
2022-01-26 14:18:47.399 | DEBUG    | __main__:trials:24 - Trial = 28994/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.400 | DEBUG    | __main__:trials:29 - Trial = 28994/30000 | Total reward = 35.96
2022-01-26 14:18:47.403 | DEBUG    | __main__:trials:24 - Trial = 28995/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.405 | DEBUG    | __main__:trials:29 - Trial = 28995/30000 | Total reward = 39.34
2022-01-26 14:18:47.408 | DEBUG    | __main__:trials:24 - Trial = 28996/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.410 | DEBUG    | __main__:trials:29 - Trial = 28996/30000 | Total reward = 48.25
2022-01-26 14:18:47.413 | DEBUG    | __main__:trials:26 - Trial = 28997/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.414 | DEBUG    | __main__:trials:29 - Trial = 28997/30000 | Total reward = 20.45
2022-01-26 14:18:47.417 | DEBUG    | __main__:trials:26 - Trial = 28998/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.419 | DEBUG    | __main__:trials:29 - Trial = 28998/30000 | Total reward = 15.71
2022-01-26 14:18:47.423 | DEBUG    | __main__:trials:24 - Trial = 28999/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.424 | DEBUG    | __main__:trials:29 - Trial = 28999/30000 | Total reward = 34.74
2022-01-26 14:18:47.426 | DEBUG    | __main__:trials:26 - Trial = 29000/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.428 | DEBUG    | __main__:trials:29 - Trial = 29000/30000 | Total reward = 22.05
2022-01-26 14:18:47.431 | DEBUG    | __main__:trials:26 - Trial = 29001/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.433 | DEBUG    | __main__:trials:29 - Trial = 29001/30000 | Total reward = 18.78
2022-01-26 14:18:47.436 | DEBUG    | __main__:trials:26 - Trial = 29002/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.438 | DEBUG    | __main__:trials:29 - Trial = 29002/30000 | Total reward = 16.57
2022-01-26 14:18:47.441 | DEBUG    | __main__:trials:24 - Trial = 29003/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.442 | DEBUG    | __main__:trials:29 - Trial = 29003/30000 | Total reward = 49.11
2022-01-26 14:18:47.447 | DEBUG    | __main__:trials:24 - Trial = 29004/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.447 | DEBUG    | __main__:trials:29 - Trial = 29004/30000 | Total reward = 38.72
2022-01-26 14:18:47.452 | DEBUG    | __main__:trials:24 - Trial = 29005/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.452 | DEBUG    | __main__:trials:29 - Trial = 29005/30000 | Total reward = 45.68
2022-01-26 14:18:47.456 | DEBUG    | __main__:trials:26 - Trial = 29006/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.458 | DEBUG    | __main__:trials:29 - Trial = 29006/30000 | Total reward = 12.92
2022-01-26 14:18:47.461 | DEBUG    | __main__:trials:24 - Trial = 29007/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.462 | DEBUG    | __main__:trials:29 - Trial = 29007/30000 | Total reward = 22.52
2022-01-26 14:18:47.465 | DEBUG    | __main__:trials:24 - Trial = 29008/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.467 | DEBUG    | __main__:trials:29 - Trial = 29008/30000 | Total reward = 19.42
2022-01-26 14:18:47.469 | DEBUG    | __main__:trials:24 - Trial = 29009/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.471 | DEBUG    | __main__:trials:29 - Trial = 29009/30000 | Total reward = 41.20
2022-01-26 14:18:47.475 | DEBUG    | __main__:trials:24 - Trial = 29010/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.476 | DEBUG    | __main__:trials:29 - Trial = 29010/30000 | Total reward = 36.66
2022-01-26 14:18:47.480 | DEBUG    | __main__:trials:24 - Trial = 29011/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.482 | DEBUG    | __main__:trials:29 - Trial = 29011/30000 | Total reward = 29.51
2022-01-26 14:18:47.485 | DEBUG    | __main__:trials:26 - Trial = 29012/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.486 | DEBUG    | __main__:trials:29 - Trial = 29012/30000 | Total reward = 15.97
2022-01-26 14:18:47.490 | DEBUG    | __main__:trials:24 - Trial = 29013/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.491 | DEBUG    | __main__:trials:29 - Trial = 29013/30000 | Total reward = 36.91
2022-01-26 14:18:47.495 | DEBUG    | __main__:trials:24 - Trial = 29014/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.496 | DEBUG    | __main__:trials:29 - Trial = 29014/30000 | Total reward = 34.45
2022-01-26 14:18:47.499 | DEBUG    | __main__:trials:24 - Trial = 29015/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.501 | DEBUG    | __main__:trials:29 - Trial = 29015/30000 | Total reward = 35.46
2022-01-26 14:18:47.505 | DEBUG    | __main__:trials:24 - Trial = 29016/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.505 | DEBUG    | __main__:trials:29 - Trial = 29016/30000 | Total reward = 40.60
2022-01-26 14:18:47.510 | DEBUG    | __main__:trials:24 - Trial = 29017/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.511 | DEBUG    | __main__:trials:29 - Trial = 29017/30000 | Total reward = 23.96
2022-01-26 14:18:47.515 | DEBUG    | __main__:trials:24 - Trial = 29018/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.516 | DEBUG    | __main__:trials:29 - Trial = 29018/30000 | Total reward = 28.73
2022-01-26 14:18:47.519 | DEBUG    | __main__:trials:24 - Trial = 29019/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.521 | DEBUG    | __main__:trials:29 - Trial = 29019/30000 | Total reward = 50.40
2022-01-26 14:18:47.525 | DEBUG    | __main__:trials:24 - Trial = 29020/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.527 | DEBUG    | __main__:trials:29 - Trial = 29020/30000 | Total reward = 34.83
2022-01-26 14:18:47.530 | DEBUG    | __main__:trials:26 - Trial = 29021/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.532 | DEBUG    | __main__:trials:29 - Trial = 29021/30000 | Total reward = 34.23
2022-01-26 14:18:47.536 | DEBUG    | __main__:trials:24 - Trial = 29022/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.537 | DEBUG    | __main__:trials:29 - Trial = 29022/30000 | Total reward = 34.15
2022-01-26 14:18:47.541 | DEBUG    | __main__:trials:24 - Trial = 29023/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.542 | DEBUG    | __main__:trials:29 - Trial = 29023/30000 | Total reward = 29.46
2022-01-26 14:18:47.546 | DEBUG    | __main__:trials:24 - Trial = 29024/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.547 | DEBUG    | __main__:trials:29 - Trial = 29024/30000 | Total reward = 24.50
2022-01-26 14:18:47.551 | DEBUG    | __main__:trials:24 - Trial = 29025/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.552 | DEBUG    | __main__:trials:29 - Trial = 29025/30000 | Total reward = 46.24
2022-01-26 14:18:47.556 | DEBUG    | __main__:trials:24 - Trial = 29026/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.557 | DEBUG    | __main__:trials:29 - Trial = 29026/30000 | Total reward = 33.81
2022-01-26 14:18:47.561 | DEBUG    | __main__:trials:24 - Trial = 29027/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.563 | DEBUG    | __main__:trials:29 - Trial = 29027/30000 | Total reward = 41.53
2022-01-26 14:18:47.567 | DEBUG    | __main__:trials:24 - Trial = 29028/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.567 | DEBUG    | __main__:trials:29 - Trial = 29028/30000 | Total reward = 42.10
2022-01-26 14:18:47.572 | DEBUG    | __main__:trials:24 - Trial = 29029/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.574 | DEBUG    | __main__:trials:29 - Trial = 29029/30000 | Total reward = 39.50
2022-01-26 14:18:47.578 | DEBUG    | __main__:trials:24 - Trial = 29030/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.578 | DEBUG    | __main__:trials:29 - Trial = 29030/30000 | Total reward = 31.03
2022-01-26 14:18:47.583 | DEBUG    | __main__:trials:24 - Trial = 29031/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.585 | DEBUG    | __main__:trials:29 - Trial = 29031/30000 | Total reward = 36.15
2022-01-26 14:18:47.588 | DEBUG    | __main__:trials:24 - Trial = 29032/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.590 | DEBUG    | __main__:trials:29 - Trial = 29032/30000 | Total reward = 45.26
2022-01-26 14:18:47.593 | DEBUG    | __main__:trials:26 - Trial = 29033/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.595 | DEBUG    | __main__:trials:29 - Trial = 29033/30000 | Total reward = 24.71
2022-01-26 14:18:47.598 | DEBUG    | __main__:trials:24 - Trial = 29034/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.599 | DEBUG    | __main__:trials:29 - Trial = 29034/30000 | Total reward = 31.27
2022-01-26 14:18:47.604 | DEBUG    | __main__:trials:24 - Trial = 29035/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.604 | DEBUG    | __main__:trials:29 - Trial = 29035/30000 | Total reward = 35.44
2022-01-26 14:18:47.609 | DEBUG    | __main__:trials:24 - Trial = 29036/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.610 | DEBUG    | __main__:trials:29 - Trial = 29036/30000 | Total reward = 38.53
2022-01-26 14:18:47.613 | DEBUG    | __main__:trials:26 - Trial = 29037/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.615 | DEBUG    | __main__:trials:29 - Trial = 29037/30000 | Total reward = 23.09
2022-01-26 14:18:47.618 | DEBUG    | __main__:trials:26 - Trial = 29038/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.619 | DEBUG    | __main__:trials:29 - Trial = 29038/30000 | Total reward = 16.34
2022-01-26 14:18:47.622 | DEBUG    | __main__:trials:26 - Trial = 29039/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.623 | DEBUG    | __main__:trials:29 - Trial = 29039/30000 | Total reward = 11.06
2022-01-26 14:18:47.627 | DEBUG    | __main__:trials:24 - Trial = 29040/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.628 | DEBUG    | __main__:trials:29 - Trial = 29040/30000 | Total reward = 56.81
2022-01-26 14:18:47.631 | DEBUG    | __main__:trials:26 - Trial = 29041/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.631 | DEBUG    | __main__:trials:29 - Trial = 29041/30000 | Total reward = 12.06
2022-01-26 14:18:47.634 | DEBUG    | __main__:trials:26 - Trial = 29042/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.636 | DEBUG    | __main__:trials:29 - Trial = 29042/30000 | Total reward = 9.69
2022-01-26 14:18:47.639 | DEBUG    | __main__:trials:24 - Trial = 29043/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.640 | DEBUG    | __main__:trials:29 - Trial = 29043/30000 | Total reward = 37.01
2022-01-26 14:18:47.644 | DEBUG    | __main__:trials:24 - Trial = 29044/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.645 | DEBUG    | __main__:trials:29 - Trial = 29044/30000 | Total reward = 35.12
2022-01-26 14:18:47.647 | DEBUG    | __main__:trials:26 - Trial = 29045/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.649 | DEBUG    | __main__:trials:29 - Trial = 29045/30000 | Total reward = 11.06
2022-01-26 14:18:47.652 | DEBUG    | __main__:trials:24 - Trial = 29046/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.654 | DEBUG    | __main__:trials:29 - Trial = 29046/30000 | Total reward = 38.83
2022-01-26 14:18:47.657 | DEBUG    | __main__:trials:24 - Trial = 29047/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.658 | DEBUG    | __main__:trials:29 - Trial = 29047/30000 | Total reward = 46.39
2022-01-26 14:18:47.662 | DEBUG    | __main__:trials:26 - Trial = 29048/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.662 | DEBUG    | __main__:trials:29 - Trial = 29048/30000 | Total reward = 10.80
2022-01-26 14:18:47.667 | DEBUG    | __main__:trials:24 - Trial = 29049/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.668 | DEBUG    | __main__:trials:29 - Trial = 29049/30000 | Total reward = 43.68
2022-01-26 14:18:47.672 | DEBUG    | __main__:trials:24 - Trial = 29050/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.673 | DEBUG    | __main__:trials:29 - Trial = 29050/30000 | Total reward = 44.73
2022-01-26 14:18:47.677 | DEBUG    | __main__:trials:24 - Trial = 29051/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.679 | DEBUG    | __main__:trials:29 - Trial = 29051/30000 | Total reward = 39.78
2022-01-26 14:18:47.682 | DEBUG    | __main__:trials:24 - Trial = 29052/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.683 | DEBUG    | __main__:trials:29 - Trial = 29052/30000 | Total reward = 39.08
2022-01-26 14:18:47.688 | DEBUG    | __main__:trials:24 - Trial = 29053/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.689 | DEBUG    | __main__:trials:29 - Trial = 29053/30000 | Total reward = 39.51
2022-01-26 14:18:47.692 | DEBUG    | __main__:trials:24 - Trial = 29054/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.694 | DEBUG    | __main__:trials:29 - Trial = 29054/30000 | Total reward = 39.34
2022-01-26 14:18:47.697 | DEBUG    | __main__:trials:26 - Trial = 29055/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.698 | DEBUG    | __main__:trials:29 - Trial = 29055/30000 | Total reward = 24.76
2022-01-26 14:18:47.700 | DEBUG    | __main__:trials:26 - Trial = 29056/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.701 | DEBUG    | __main__:trials:29 - Trial = 29056/30000 | Total reward = 9.69
2022-01-26 14:18:47.704 | DEBUG    | __main__:trials:26 - Trial = 29057/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.704 | DEBUG    | __main__:trials:29 - Trial = 29057/30000 | Total reward = 11.06
2022-01-26 14:18:47.708 | DEBUG    | __main__:trials:26 - Trial = 29058/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.709 | DEBUG    | __main__:trials:29 - Trial = 29058/30000 | Total reward = 17.56
2022-01-26 14:18:47.713 | DEBUG    | __main__:trials:26 - Trial = 29059/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.713 | DEBUG    | __main__:trials:29 - Trial = 29059/30000 | Total reward = 13.78
2022-01-26 14:18:47.717 | DEBUG    | __main__:trials:26 - Trial = 29060/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.717 | DEBUG    | __main__:trials:29 - Trial = 29060/30000 | Total reward = 11.06
2022-01-26 14:18:47.721 | DEBUG    | __main__:trials:26 - Trial = 29061/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.722 | DEBUG    | __main__:trials:29 - Trial = 29061/30000 | Total reward = 10.60
2022-01-26 14:18:47.724 | DEBUG    | __main__:trials:26 - Trial = 29062/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.726 | DEBUG    | __main__:trials:29 - Trial = 29062/30000 | Total reward = 11.06
2022-01-26 14:18:47.729 | DEBUG    | __main__:trials:24 - Trial = 29063/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.730 | DEBUG    | __main__:trials:29 - Trial = 29063/30000 | Total reward = 34.14
2022-01-26 14:18:47.734 | DEBUG    | __main__:trials:24 - Trial = 29064/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.735 | DEBUG    | __main__:trials:29 - Trial = 29064/30000 | Total reward = 36.32
2022-01-26 14:18:47.738 | DEBUG    | __main__:trials:26 - Trial = 29065/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.739 | DEBUG    | __main__:trials:29 - Trial = 29065/30000 | Total reward = 11.53
2022-01-26 14:18:47.741 | DEBUG    | __main__:trials:26 - Trial = 29066/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.743 | DEBUG    | __main__:trials:29 - Trial = 29066/30000 | Total reward = 12.64
2022-01-26 14:18:47.747 | DEBUG    | __main__:trials:24 - Trial = 29067/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.748 | DEBUG    | __main__:trials:29 - Trial = 29067/30000 | Total reward = 32.16
2022-01-26 14:18:47.751 | DEBUG    | __main__:trials:24 - Trial = 29068/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.754 | DEBUG    | __main__:trials:29 - Trial = 29068/30000 | Total reward = 23.58
2022-01-26 14:18:47.757 | DEBUG    | __main__:trials:26 - Trial = 29069/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.758 | DEBUG    | __main__:trials:29 - Trial = 29069/30000 | Total reward = 11.06
2022-01-26 14:18:47.762 | DEBUG    | __main__:trials:24 - Trial = 29070/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.763 | DEBUG    | __main__:trials:29 - Trial = 29070/30000 | Total reward = 40.80
2022-01-26 14:18:47.766 | DEBUG    | __main__:trials:26 - Trial = 29071/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.768 | DEBUG    | __main__:trials:29 - Trial = 29071/30000 | Total reward = 12.08
2022-01-26 14:18:47.771 | DEBUG    | __main__:trials:24 - Trial = 29072/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.772 | DEBUG    | __main__:trials:29 - Trial = 29072/30000 | Total reward = 37.06
2022-01-26 14:18:47.775 | DEBUG    | __main__:trials:26 - Trial = 29073/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.777 | DEBUG    | __main__:trials:29 - Trial = 29073/30000 | Total reward = 9.03
2022-01-26 14:18:47.780 | DEBUG    | __main__:trials:24 - Trial = 29074/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.782 | DEBUG    | __main__:trials:29 - Trial = 29074/30000 | Total reward = 43.00
2022-01-26 14:18:47.786 | DEBUG    | __main__:trials:24 - Trial = 29075/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.787 | DEBUG    | __main__:trials:29 - Trial = 29075/30000 | Total reward = 29.35
2022-01-26 14:18:47.790 | DEBUG    | __main__:trials:24 - Trial = 29076/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.792 | DEBUG    | __main__:trials:29 - Trial = 29076/30000 | Total reward = 41.20
2022-01-26 14:18:47.796 | DEBUG    | __main__:trials:24 - Trial = 29077/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.797 | DEBUG    | __main__:trials:29 - Trial = 29077/30000 | Total reward = 31.30
2022-01-26 14:18:47.801 | DEBUG    | __main__:trials:24 - Trial = 29078/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.802 | DEBUG    | __main__:trials:29 - Trial = 29078/30000 | Total reward = 36.05
2022-01-26 14:18:47.806 | DEBUG    | __main__:trials:24 - Trial = 29079/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.808 | DEBUG    | __main__:trials:29 - Trial = 29079/30000 | Total reward = 34.20
2022-01-26 14:18:47.811 | DEBUG    | __main__:trials:24 - Trial = 29080/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.812 | DEBUG    | __main__:trials:29 - Trial = 29080/30000 | Total reward = 42.92
2022-01-26 14:18:47.817 | DEBUG    | __main__:trials:24 - Trial = 29081/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.817 | DEBUG    | __main__:trials:29 - Trial = 29081/30000 | Total reward = 19.63
2022-01-26 14:18:47.820 | DEBUG    | __main__:trials:26 - Trial = 29082/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.821 | DEBUG    | __main__:trials:29 - Trial = 29082/30000 | Total reward = 9.67
2022-01-26 14:18:47.824 | DEBUG    | __main__:trials:26 - Trial = 29083/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.825 | DEBUG    | __main__:trials:29 - Trial = 29083/30000 | Total reward = 11.06
2022-01-26 14:18:47.828 | DEBUG    | __main__:trials:26 - Trial = 29084/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.830 | DEBUG    | __main__:trials:29 - Trial = 29084/30000 | Total reward = 11.58
2022-01-26 14:18:47.833 | DEBUG    | __main__:trials:26 - Trial = 29085/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.833 | DEBUG    | __main__:trials:29 - Trial = 29085/30000 | Total reward = 11.06
2022-01-26 14:18:47.837 | DEBUG    | __main__:trials:26 - Trial = 29086/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.837 | DEBUG    | __main__:trials:29 - Trial = 29086/30000 | Total reward = 9.67
2022-01-26 14:18:47.841 | DEBUG    | __main__:trials:26 - Trial = 29087/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.842 | DEBUG    | __main__:trials:29 - Trial = 29087/30000 | Total reward = 8.97
2022-01-26 14:18:47.845 | DEBUG    | __main__:trials:24 - Trial = 29088/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.847 | DEBUG    | __main__:trials:29 - Trial = 29088/30000 | Total reward = 51.42
2022-01-26 14:18:47.851 | DEBUG    | __main__:trials:24 - Trial = 29089/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.852 | DEBUG    | __main__:trials:29 - Trial = 29089/30000 | Total reward = 40.89
2022-01-26 14:18:47.854 | DEBUG    | __main__:trials:26 - Trial = 29090/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.856 | DEBUG    | __main__:trials:29 - Trial = 29090/30000 | Total reward = 19.10
2022-01-26 14:18:47.859 | DEBUG    | __main__:trials:24 - Trial = 29091/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.861 | DEBUG    | __main__:trials:29 - Trial = 29091/30000 | Total reward = 45.97
2022-01-26 14:18:47.865 | DEBUG    | __main__:trials:24 - Trial = 29092/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.865 | DEBUG    | __main__:trials:29 - Trial = 29092/30000 | Total reward = 33.47
2022-01-26 14:18:47.869 | DEBUG    | __main__:trials:24 - Trial = 29093/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.870 | DEBUG    | __main__:trials:29 - Trial = 29093/30000 | Total reward = 31.55
2022-01-26 14:18:47.873 | DEBUG    | __main__:trials:24 - Trial = 29094/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.875 | DEBUG    | __main__:trials:29 - Trial = 29094/30000 | Total reward = 37.79
2022-01-26 14:18:47.878 | DEBUG    | __main__:trials:24 - Trial = 29095/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.879 | DEBUG    | __main__:trials:29 - Trial = 29095/30000 | Total reward = 35.69
2022-01-26 14:18:47.882 | DEBUG    | __main__:trials:24 - Trial = 29096/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.884 | DEBUG    | __main__:trials:29 - Trial = 29096/30000 | Total reward = 36.16
2022-01-26 14:18:47.887 | DEBUG    | __main__:trials:24 - Trial = 29097/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.888 | DEBUG    | __main__:trials:29 - Trial = 29097/30000 | Total reward = 36.19
2022-01-26 14:18:47.891 | DEBUG    | __main__:trials:26 - Trial = 29098/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:47.892 | DEBUG    | __main__:trials:29 - Trial = 29098/30000 | Total reward = 29.25
2022-01-26 14:18:47.895 | DEBUG    | __main__:trials:24 - Trial = 29099/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.896 | DEBUG    | __main__:trials:29 - Trial = 29099/30000 | Total reward = 37.28
2022-01-26 14:18:47.899 | DEBUG    | __main__:trials:24 - Trial = 29100/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.901 | DEBUG    | __main__:trials:29 - Trial = 29100/30000 | Total reward = 45.52
2022-01-26 14:18:47.904 | DEBUG    | __main__:trials:24 - Trial = 29101/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.905 | DEBUG    | __main__:trials:29 - Trial = 29101/30000 | Total reward = 37.62
2022-01-26 14:18:47.908 | DEBUG    | __main__:trials:24 - Trial = 29102/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.910 | DEBUG    | __main__:trials:29 - Trial = 29102/30000 | Total reward = 39.57
2022-01-26 14:18:47.913 | DEBUG    | __main__:trials:24 - Trial = 29103/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.913 | DEBUG    | __main__:trials:29 - Trial = 29103/30000 | Total reward = 29.09
2022-01-26 14:18:47.918 | DEBUG    | __main__:trials:24 - Trial = 29104/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.919 | DEBUG    | __main__:trials:29 - Trial = 29104/30000 | Total reward = 37.40
2022-01-26 14:18:47.923 | DEBUG    | __main__:trials:24 - Trial = 29105/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.925 | DEBUG    | __main__:trials:29 - Trial = 29105/30000 | Total reward = 41.38
2022-01-26 14:18:47.928 | DEBUG    | __main__:trials:24 - Trial = 29106/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.930 | DEBUG    | __main__:trials:29 - Trial = 29106/30000 | Total reward = 44.04
2022-01-26 14:18:47.933 | DEBUG    | __main__:trials:24 - Trial = 29107/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.934 | DEBUG    | __main__:trials:29 - Trial = 29107/30000 | Total reward = 48.36
2022-01-26 14:18:47.938 | DEBUG    | __main__:trials:24 - Trial = 29108/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.939 | DEBUG    | __main__:trials:29 - Trial = 29108/30000 | Total reward = 45.91
2022-01-26 14:18:47.942 | DEBUG    | __main__:trials:24 - Trial = 29109/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.944 | DEBUG    | __main__:trials:29 - Trial = 29109/30000 | Total reward = 40.43
2022-01-26 14:18:47.948 | DEBUG    | __main__:trials:24 - Trial = 29110/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.949 | DEBUG    | __main__:trials:29 - Trial = 29110/30000 | Total reward = 51.61
2022-01-26 14:18:47.953 | DEBUG    | __main__:trials:24 - Trial = 29111/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.955 | DEBUG    | __main__:trials:29 - Trial = 29111/30000 | Total reward = 39.59
2022-01-26 14:18:47.959 | DEBUG    | __main__:trials:24 - Trial = 29112/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.960 | DEBUG    | __main__:trials:29 - Trial = 29112/30000 | Total reward = 39.64
2022-01-26 14:18:47.964 | DEBUG    | __main__:trials:24 - Trial = 29113/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.965 | DEBUG    | __main__:trials:29 - Trial = 29113/30000 | Total reward = 46.97
2022-01-26 14:18:47.969 | DEBUG    | __main__:trials:24 - Trial = 29114/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.971 | DEBUG    | __main__:trials:29 - Trial = 29114/30000 | Total reward = 44.73
2022-01-26 14:18:47.974 | DEBUG    | __main__:trials:24 - Trial = 29115/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.976 | DEBUG    | __main__:trials:29 - Trial = 29115/30000 | Total reward = 44.45
2022-01-26 14:18:47.980 | DEBUG    | __main__:trials:24 - Trial = 29116/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.981 | DEBUG    | __main__:trials:29 - Trial = 29116/30000 | Total reward = 32.21
2022-01-26 14:18:47.984 | DEBUG    | __main__:trials:24 - Trial = 29117/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.986 | DEBUG    | __main__:trials:29 - Trial = 29117/30000 | Total reward = 38.85
2022-01-26 14:18:47.990 | DEBUG    | __main__:trials:24 - Trial = 29118/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.990 | DEBUG    | __main__:trials:29 - Trial = 29118/30000 | Total reward = 36.39
2022-01-26 14:18:47.994 | DEBUG    | __main__:trials:24 - Trial = 29119/30000 | Max number of steps (20) reached
2022-01-26 14:18:47.995 | DEBUG    | __main__:trials:29 - Trial = 29119/30000 | Total reward = 28.20
2022-01-26 14:18:47.999 | DEBUG    | __main__:trials:24 - Trial = 29120/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.000 | DEBUG    | __main__:trials:29 - Trial = 29120/30000 | Total reward = 37.71
2022-01-26 14:18:48.004 | DEBUG    | __main__:trials:24 - Trial = 29121/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.005 | DEBUG    | __main__:trials:29 - Trial = 29121/30000 | Total reward = 41.26
2022-01-26 14:18:48.009 | DEBUG    | __main__:trials:26 - Trial = 29122/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.009 | DEBUG    | __main__:trials:29 - Trial = 29122/30000 | Total reward = 15.71
2022-01-26 14:18:48.013 | DEBUG    | __main__:trials:24 - Trial = 29123/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.014 | DEBUG    | __main__:trials:29 - Trial = 29123/30000 | Total reward = 48.04
2022-01-26 14:18:48.017 | DEBUG    | __main__:trials:24 - Trial = 29124/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.019 | DEBUG    | __main__:trials:29 - Trial = 29124/30000 | Total reward = 44.54
2022-01-26 14:18:48.023 | DEBUG    | __main__:trials:24 - Trial = 29125/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.024 | DEBUG    | __main__:trials:29 - Trial = 29125/30000 | Total reward = 46.56
2022-01-26 14:18:48.028 | DEBUG    | __main__:trials:24 - Trial = 29126/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.030 | DEBUG    | __main__:trials:29 - Trial = 29126/30000 | Total reward = 50.82
2022-01-26 14:18:48.033 | DEBUG    | __main__:trials:26 - Trial = 29127/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.034 | DEBUG    | __main__:trials:29 - Trial = 29127/30000 | Total reward = 20.03
2022-01-26 14:18:48.038 | DEBUG    | __main__:trials:24 - Trial = 29128/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.039 | DEBUG    | __main__:trials:29 - Trial = 29128/30000 | Total reward = 41.70
2022-01-26 14:18:48.042 | DEBUG    | __main__:trials:24 - Trial = 29129/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.043 | DEBUG    | __main__:trials:29 - Trial = 29129/30000 | Total reward = 47.56
2022-01-26 14:18:48.046 | DEBUG    | __main__:trials:24 - Trial = 29130/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.048 | DEBUG    | __main__:trials:29 - Trial = 29130/30000 | Total reward = 39.97
2022-01-26 14:18:48.051 | DEBUG    | __main__:trials:24 - Trial = 29131/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.052 | DEBUG    | __main__:trials:29 - Trial = 29131/30000 | Total reward = 38.65
2022-01-26 14:18:48.056 | DEBUG    | __main__:trials:26 - Trial = 29132/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.057 | DEBUG    | __main__:trials:29 - Trial = 29132/30000 | Total reward = 25.59
2022-01-26 14:18:48.061 | DEBUG    | __main__:trials:26 - Trial = 29133/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.062 | DEBUG    | __main__:trials:29 - Trial = 29133/30000 | Total reward = 28.69
2022-01-26 14:18:48.065 | DEBUG    | __main__:trials:24 - Trial = 29134/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.065 | DEBUG    | __main__:trials:29 - Trial = 29134/30000 | Total reward = 38.45
2022-01-26 14:18:48.069 | DEBUG    | __main__:trials:24 - Trial = 29135/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.070 | DEBUG    | __main__:trials:29 - Trial = 29135/30000 | Total reward = 41.83
2022-01-26 14:18:48.075 | DEBUG    | __main__:trials:24 - Trial = 29136/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.076 | DEBUG    | __main__:trials:29 - Trial = 29136/30000 | Total reward = 33.02
2022-01-26 14:18:48.079 | DEBUG    | __main__:trials:24 - Trial = 29137/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.081 | DEBUG    | __main__:trials:29 - Trial = 29137/30000 | Total reward = 36.63
2022-01-26 14:18:48.084 | DEBUG    | __main__:trials:24 - Trial = 29138/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.086 | DEBUG    | __main__:trials:29 - Trial = 29138/30000 | Total reward = 30.10
2022-01-26 14:18:48.088 | DEBUG    | __main__:trials:26 - Trial = 29139/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.090 | DEBUG    | __main__:trials:29 - Trial = 29139/30000 | Total reward = 11.06
2022-01-26 14:18:48.093 | DEBUG    | __main__:trials:24 - Trial = 29140/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.094 | DEBUG    | __main__:trials:29 - Trial = 29140/30000 | Total reward = 28.29
2022-01-26 14:18:48.098 | DEBUG    | __main__:trials:26 - Trial = 29141/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.100 | DEBUG    | __main__:trials:29 - Trial = 29141/30000 | Total reward = 15.78
2022-01-26 14:18:48.103 | DEBUG    | __main__:trials:24 - Trial = 29142/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.105 | DEBUG    | __main__:trials:29 - Trial = 29142/30000 | Total reward = 42.96
2022-01-26 14:18:48.107 | DEBUG    | __main__:trials:26 - Trial = 29143/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.108 | DEBUG    | __main__:trials:29 - Trial = 29143/30000 | Total reward = 11.06
2022-01-26 14:18:48.111 | DEBUG    | __main__:trials:26 - Trial = 29144/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.113 | DEBUG    | __main__:trials:29 - Trial = 29144/30000 | Total reward = 17.25
2022-01-26 14:18:48.115 | DEBUG    | __main__:trials:26 - Trial = 29145/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.116 | DEBUG    | __main__:trials:29 - Trial = 29145/30000 | Total reward = 11.06
2022-01-26 14:18:48.118 | DEBUG    | __main__:trials:26 - Trial = 29146/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.120 | DEBUG    | __main__:trials:29 - Trial = 29146/30000 | Total reward = 11.06
2022-01-26 14:18:48.123 | DEBUG    | __main__:trials:26 - Trial = 29147/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.123 | DEBUG    | __main__:trials:29 - Trial = 29147/30000 | Total reward = 13.08
2022-01-26 14:18:48.126 | DEBUG    | __main__:trials:26 - Trial = 29148/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.127 | DEBUG    | __main__:trials:29 - Trial = 29148/30000 | Total reward = 10.67
2022-01-26 14:18:48.131 | DEBUG    | __main__:trials:26 - Trial = 29149/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.132 | DEBUG    | __main__:trials:29 - Trial = 29149/30000 | Total reward = 11.06
2022-01-26 14:18:48.136 | DEBUG    | __main__:trials:24 - Trial = 29150/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.137 | DEBUG    | __main__:trials:29 - Trial = 29150/30000 | Total reward = 32.64
2022-01-26 14:18:48.139 | DEBUG    | __main__:trials:26 - Trial = 29151/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.141 | DEBUG    | __main__:trials:29 - Trial = 29151/30000 | Total reward = 12.72
2022-01-26 14:18:48.143 | DEBUG    | __main__:trials:26 - Trial = 29152/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.145 | DEBUG    | __main__:trials:29 - Trial = 29152/30000 | Total reward = 9.03
2022-01-26 14:18:48.147 | DEBUG    | __main__:trials:24 - Trial = 29153/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.148 | DEBUG    | __main__:trials:29 - Trial = 29153/30000 | Total reward = 38.71
2022-01-26 14:18:48.151 | DEBUG    | __main__:trials:24 - Trial = 29154/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.153 | DEBUG    | __main__:trials:29 - Trial = 29154/30000 | Total reward = 42.09
2022-01-26 14:18:48.157 | DEBUG    | __main__:trials:24 - Trial = 29155/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.159 | DEBUG    | __main__:trials:29 - Trial = 29155/30000 | Total reward = 37.23
2022-01-26 14:18:48.162 | DEBUG    | __main__:trials:24 - Trial = 29156/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.163 | DEBUG    | __main__:trials:29 - Trial = 29156/30000 | Total reward = 30.05
2022-01-26 14:18:48.168 | DEBUG    | __main__:trials:24 - Trial = 29157/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.169 | DEBUG    | __main__:trials:29 - Trial = 29157/30000 | Total reward = 39.73
2022-01-26 14:18:48.171 | DEBUG    | __main__:trials:26 - Trial = 29158/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.173 | DEBUG    | __main__:trials:29 - Trial = 29158/30000 | Total reward = 12.92
2022-01-26 14:18:48.175 | DEBUG    | __main__:trials:26 - Trial = 29159/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.176 | DEBUG    | __main__:trials:29 - Trial = 29159/30000 | Total reward = 13.52
2022-01-26 14:18:48.180 | DEBUG    | __main__:trials:24 - Trial = 29160/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.181 | DEBUG    | __main__:trials:29 - Trial = 29160/30000 | Total reward = 37.12
2022-01-26 14:18:48.184 | DEBUG    | __main__:trials:26 - Trial = 29161/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.186 | DEBUG    | __main__:trials:29 - Trial = 29161/30000 | Total reward = 8.04
2022-01-26 14:18:48.189 | DEBUG    | __main__:trials:26 - Trial = 29162/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.190 | DEBUG    | __main__:trials:29 - Trial = 29162/30000 | Total reward = 14.77
2022-01-26 14:18:48.193 | DEBUG    | __main__:trials:26 - Trial = 29163/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.194 | DEBUG    | __main__:trials:29 - Trial = 29163/30000 | Total reward = 11.06
2022-01-26 14:18:48.198 | DEBUG    | __main__:trials:24 - Trial = 29164/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.199 | DEBUG    | __main__:trials:29 - Trial = 29164/30000 | Total reward = 22.33
2022-01-26 14:18:48.203 | DEBUG    | __main__:trials:24 - Trial = 29165/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.205 | DEBUG    | __main__:trials:29 - Trial = 29165/30000 | Total reward = 37.59
2022-01-26 14:18:48.208 | DEBUG    | __main__:trials:24 - Trial = 29166/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.210 | DEBUG    | __main__:trials:29 - Trial = 29166/30000 | Total reward = 47.52
2022-01-26 14:18:48.214 | DEBUG    | __main__:trials:24 - Trial = 29167/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.215 | DEBUG    | __main__:trials:29 - Trial = 29167/30000 | Total reward = 33.91
2022-01-26 14:18:48.219 | DEBUG    | __main__:trials:24 - Trial = 29168/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.221 | DEBUG    | __main__:trials:29 - Trial = 29168/30000 | Total reward = 27.55
2022-01-26 14:18:48.224 | DEBUG    | __main__:trials:24 - Trial = 29169/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.225 | DEBUG    | __main__:trials:29 - Trial = 29169/30000 | Total reward = 9.25
2022-01-26 14:18:48.229 | DEBUG    | __main__:trials:24 - Trial = 29170/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.230 | DEBUG    | __main__:trials:29 - Trial = 29170/30000 | Total reward = 32.34
2022-01-26 14:18:48.234 | DEBUG    | __main__:trials:24 - Trial = 29171/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.236 | DEBUG    | __main__:trials:29 - Trial = 29171/30000 | Total reward = 34.63
2022-01-26 14:18:48.239 | DEBUG    | __main__:trials:24 - Trial = 29172/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.240 | DEBUG    | __main__:trials:29 - Trial = 29172/30000 | Total reward = 38.90
2022-01-26 14:18:48.244 | DEBUG    | __main__:trials:24 - Trial = 29173/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.245 | DEBUG    | __main__:trials:29 - Trial = 29173/30000 | Total reward = 39.58
2022-01-26 14:18:48.249 | DEBUG    | __main__:trials:24 - Trial = 29174/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.251 | DEBUG    | __main__:trials:29 - Trial = 29174/30000 | Total reward = 35.56
2022-01-26 14:18:48.255 | DEBUG    | __main__:trials:24 - Trial = 29175/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.256 | DEBUG    | __main__:trials:29 - Trial = 29175/30000 | Total reward = 38.60
2022-01-26 14:18:48.260 | DEBUG    | __main__:trials:24 - Trial = 29176/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.261 | DEBUG    | __main__:trials:29 - Trial = 29176/30000 | Total reward = 39.01
2022-01-26 14:18:48.265 | DEBUG    | __main__:trials:24 - Trial = 29177/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.266 | DEBUG    | __main__:trials:29 - Trial = 29177/30000 | Total reward = 41.53
2022-01-26 14:18:48.270 | DEBUG    | __main__:trials:24 - Trial = 29178/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.271 | DEBUG    | __main__:trials:29 - Trial = 29178/30000 | Total reward = 28.72
2022-01-26 14:18:48.275 | DEBUG    | __main__:trials:24 - Trial = 29179/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.276 | DEBUG    | __main__:trials:29 - Trial = 29179/30000 | Total reward = 32.92
2022-01-26 14:18:48.280 | DEBUG    | __main__:trials:24 - Trial = 29180/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.281 | DEBUG    | __main__:trials:29 - Trial = 29180/30000 | Total reward = 60.99
2022-01-26 14:18:48.285 | DEBUG    | __main__:trials:24 - Trial = 29181/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.287 | DEBUG    | __main__:trials:29 - Trial = 29181/30000 | Total reward = 54.35
2022-01-26 14:18:48.291 | DEBUG    | __main__:trials:24 - Trial = 29182/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.292 | DEBUG    | __main__:trials:29 - Trial = 29182/30000 | Total reward = 33.86
2022-01-26 14:18:48.296 | DEBUG    | __main__:trials:24 - Trial = 29183/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.298 | DEBUG    | __main__:trials:29 - Trial = 29183/30000 | Total reward = 59.10
2022-01-26 14:18:48.301 | DEBUG    | __main__:trials:24 - Trial = 29184/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.302 | DEBUG    | __main__:trials:29 - Trial = 29184/30000 | Total reward = 26.37
2022-01-26 14:18:48.306 | DEBUG    | __main__:trials:24 - Trial = 29185/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.307 | DEBUG    | __main__:trials:29 - Trial = 29185/30000 | Total reward = 39.24
2022-01-26 14:18:48.310 | DEBUG    | __main__:trials:24 - Trial = 29186/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.312 | DEBUG    | __main__:trials:29 - Trial = 29186/30000 | Total reward = 51.42
2022-01-26 14:18:48.316 | DEBUG    | __main__:trials:24 - Trial = 29187/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.316 | DEBUG    | __main__:trials:29 - Trial = 29187/30000 | Total reward = 38.51
2022-01-26 14:18:48.321 | DEBUG    | __main__:trials:26 - Trial = 29188/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.322 | DEBUG    | __main__:trials:29 - Trial = 29188/30000 | Total reward = 31.98
2022-01-26 14:18:48.325 | DEBUG    | __main__:trials:24 - Trial = 29189/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.326 | DEBUG    | __main__:trials:29 - Trial = 29189/30000 | Total reward = 30.05
2022-01-26 14:18:48.330 | DEBUG    | __main__:trials:26 - Trial = 29190/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.330 | DEBUG    | __main__:trials:29 - Trial = 29190/30000 | Total reward = 17.66
2022-01-26 14:18:48.335 | DEBUG    | __main__:trials:24 - Trial = 29191/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.335 | DEBUG    | __main__:trials:29 - Trial = 29191/30000 | Total reward = 46.33
2022-01-26 14:18:48.340 | DEBUG    | __main__:trials:24 - Trial = 29192/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.340 | DEBUG    | __main__:trials:29 - Trial = 29192/30000 | Total reward = 54.01
2022-01-26 14:18:48.345 | DEBUG    | __main__:trials:24 - Trial = 29193/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.346 | DEBUG    | __main__:trials:29 - Trial = 29193/30000 | Total reward = 58.74
2022-01-26 14:18:48.349 | DEBUG    | __main__:trials:24 - Trial = 29194/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.350 | DEBUG    | __main__:trials:29 - Trial = 29194/30000 | Total reward = 38.15
2022-01-26 14:18:48.354 | DEBUG    | __main__:trials:24 - Trial = 29195/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.355 | DEBUG    | __main__:trials:29 - Trial = 29195/30000 | Total reward = 54.27
2022-01-26 14:18:48.359 | DEBUG    | __main__:trials:24 - Trial = 29196/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.360 | DEBUG    | __main__:trials:29 - Trial = 29196/30000 | Total reward = 40.15
2022-01-26 14:18:48.364 | DEBUG    | __main__:trials:24 - Trial = 29197/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.366 | DEBUG    | __main__:trials:29 - Trial = 29197/30000 | Total reward = 38.92
2022-01-26 14:18:48.369 | DEBUG    | __main__:trials:24 - Trial = 29198/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.370 | DEBUG    | __main__:trials:29 - Trial = 29198/30000 | Total reward = 37.30
2022-01-26 14:18:48.374 | DEBUG    | __main__:trials:24 - Trial = 29199/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.376 | DEBUG    | __main__:trials:29 - Trial = 29199/30000 | Total reward = 38.31
2022-01-26 14:18:48.380 | DEBUG    | __main__:trials:24 - Trial = 29200/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.381 | DEBUG    | __main__:trials:29 - Trial = 29200/30000 | Total reward = 49.65
2022-01-26 14:18:48.385 | DEBUG    | __main__:trials:24 - Trial = 29201/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.385 | DEBUG    | __main__:trials:29 - Trial = 29201/30000 | Total reward = 41.78
2022-01-26 14:18:48.389 | DEBUG    | __main__:trials:24 - Trial = 29202/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.391 | DEBUG    | __main__:trials:29 - Trial = 29202/30000 | Total reward = 34.70
2022-01-26 14:18:48.393 | DEBUG    | __main__:trials:26 - Trial = 29203/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.394 | DEBUG    | __main__:trials:29 - Trial = 29203/30000 | Total reward = 12.28
2022-01-26 14:18:48.398 | DEBUG    | __main__:trials:24 - Trial = 29204/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.398 | DEBUG    | __main__:trials:29 - Trial = 29204/30000 | Total reward = 26.97
2022-01-26 14:18:48.403 | DEBUG    | __main__:trials:24 - Trial = 29205/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.404 | DEBUG    | __main__:trials:29 - Trial = 29205/30000 | Total reward = 38.57
2022-01-26 14:18:48.408 | DEBUG    | __main__:trials:24 - Trial = 29206/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.410 | DEBUG    | __main__:trials:29 - Trial = 29206/30000 | Total reward = 26.96
2022-01-26 14:18:48.413 | DEBUG    | __main__:trials:26 - Trial = 29207/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.414 | DEBUG    | __main__:trials:29 - Trial = 29207/30000 | Total reward = 15.78
2022-01-26 14:18:48.418 | DEBUG    | __main__:trials:24 - Trial = 29208/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.419 | DEBUG    | __main__:trials:29 - Trial = 29208/30000 | Total reward = 40.86
2022-01-26 14:18:48.423 | DEBUG    | __main__:trials:24 - Trial = 29209/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.424 | DEBUG    | __main__:trials:29 - Trial = 29209/30000 | Total reward = 28.78
2022-01-26 14:18:48.428 | DEBUG    | __main__:trials:24 - Trial = 29210/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.429 | DEBUG    | __main__:trials:29 - Trial = 29210/30000 | Total reward = 39.60
2022-01-26 14:18:48.432 | DEBUG    | __main__:trials:24 - Trial = 29211/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.433 | DEBUG    | __main__:trials:29 - Trial = 29211/30000 | Total reward = 50.84
2022-01-26 14:18:48.437 | DEBUG    | __main__:trials:24 - Trial = 29212/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.438 | DEBUG    | __main__:trials:29 - Trial = 29212/30000 | Total reward = 38.65
2022-01-26 14:18:48.441 | DEBUG    | __main__:trials:26 - Trial = 29213/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.443 | DEBUG    | __main__:trials:29 - Trial = 29213/30000 | Total reward = 13.19
2022-01-26 14:18:48.446 | DEBUG    | __main__:trials:24 - Trial = 29214/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.447 | DEBUG    | __main__:trials:29 - Trial = 29214/30000 | Total reward = 45.59
2022-01-26 14:18:48.451 | DEBUG    | __main__:trials:24 - Trial = 29215/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.453 | DEBUG    | __main__:trials:29 - Trial = 29215/30000 | Total reward = 52.89
2022-01-26 14:18:48.456 | DEBUG    | __main__:trials:24 - Trial = 29216/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.458 | DEBUG    | __main__:trials:29 - Trial = 29216/30000 | Total reward = 38.02
2022-01-26 14:18:48.462 | DEBUG    | __main__:trials:24 - Trial = 29217/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.462 | DEBUG    | __main__:trials:29 - Trial = 29217/30000 | Total reward = 41.70
2022-01-26 14:18:48.467 | DEBUG    | __main__:trials:24 - Trial = 29218/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.468 | DEBUG    | __main__:trials:29 - Trial = 29218/30000 | Total reward = 33.31
2022-01-26 14:18:48.472 | DEBUG    | __main__:trials:24 - Trial = 29219/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.473 | DEBUG    | __main__:trials:29 - Trial = 29219/30000 | Total reward = 30.89
2022-01-26 14:18:48.477 | DEBUG    | __main__:trials:24 - Trial = 29220/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.478 | DEBUG    | __main__:trials:29 - Trial = 29220/30000 | Total reward = 37.44
2022-01-26 14:18:48.482 | DEBUG    | __main__:trials:24 - Trial = 29221/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.484 | DEBUG    | __main__:trials:29 - Trial = 29221/30000 | Total reward = 38.90
2022-01-26 14:18:48.486 | DEBUG    | __main__:trials:26 - Trial = 29222/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.487 | DEBUG    | __main__:trials:29 - Trial = 29222/30000 | Total reward = 11.06
2022-01-26 14:18:48.490 | DEBUG    | __main__:trials:26 - Trial = 29223/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.491 | DEBUG    | __main__:trials:29 - Trial = 29223/30000 | Total reward = 14.77
2022-01-26 14:18:48.495 | DEBUG    | __main__:trials:24 - Trial = 29224/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.497 | DEBUG    | __main__:trials:29 - Trial = 29224/30000 | Total reward = 46.32
2022-01-26 14:18:48.500 | DEBUG    | __main__:trials:24 - Trial = 29225/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.501 | DEBUG    | __main__:trials:29 - Trial = 29225/30000 | Total reward = 11.75
2022-01-26 14:18:48.503 | DEBUG    | __main__:trials:26 - Trial = 29226/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.505 | DEBUG    | __main__:trials:29 - Trial = 29226/30000 | Total reward = 11.06
2022-01-26 14:18:48.509 | DEBUG    | __main__:trials:24 - Trial = 29227/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.509 | DEBUG    | __main__:trials:29 - Trial = 29227/30000 | Total reward = 43.31
2022-01-26 14:18:48.512 | DEBUG    | __main__:trials:26 - Trial = 29228/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.512 | DEBUG    | __main__:trials:29 - Trial = 29228/30000 | Total reward = 15.45
2022-01-26 14:18:48.516 | DEBUG    | __main__:trials:24 - Trial = 29229/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.516 | DEBUG    | __main__:trials:29 - Trial = 29229/30000 | Total reward = 40.07
2022-01-26 14:18:48.520 | DEBUG    | __main__:trials:24 - Trial = 29230/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.520 | DEBUG    | __main__:trials:29 - Trial = 29230/30000 | Total reward = 36.58
2022-01-26 14:18:48.524 | DEBUG    | __main__:trials:24 - Trial = 29231/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.525 | DEBUG    | __main__:trials:29 - Trial = 29231/30000 | Total reward = 39.39
2022-01-26 14:18:48.530 | DEBUG    | __main__:trials:24 - Trial = 29232/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.531 | DEBUG    | __main__:trials:29 - Trial = 29232/30000 | Total reward = 48.68
2022-01-26 14:18:48.535 | DEBUG    | __main__:trials:24 - Trial = 29233/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.535 | DEBUG    | __main__:trials:29 - Trial = 29233/30000 | Total reward = 39.15
2022-01-26 14:18:48.540 | DEBUG    | __main__:trials:24 - Trial = 29234/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.541 | DEBUG    | __main__:trials:29 - Trial = 29234/30000 | Total reward = 38.52
2022-01-26 14:18:48.544 | DEBUG    | __main__:trials:26 - Trial = 29235/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.545 | DEBUG    | __main__:trials:29 - Trial = 29235/30000 | Total reward = 23.14
2022-01-26 14:18:48.550 | DEBUG    | __main__:trials:24 - Trial = 29236/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.551 | DEBUG    | __main__:trials:29 - Trial = 29236/30000 | Total reward = 36.74
2022-01-26 14:18:48.556 | DEBUG    | __main__:trials:24 - Trial = 29237/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.557 | DEBUG    | __main__:trials:29 - Trial = 29237/30000 | Total reward = 38.08
2022-01-26 14:18:48.561 | DEBUG    | __main__:trials:24 - Trial = 29238/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.562 | DEBUG    | __main__:trials:29 - Trial = 29238/30000 | Total reward = 35.90
2022-01-26 14:18:48.566 | DEBUG    | __main__:trials:26 - Trial = 29239/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.567 | DEBUG    | __main__:trials:29 - Trial = 29239/30000 | Total reward = 14.76
2022-01-26 14:18:48.571 | DEBUG    | __main__:trials:26 - Trial = 29240/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.573 | DEBUG    | __main__:trials:29 - Trial = 29240/30000 | Total reward = 31.85
2022-01-26 14:18:48.576 | DEBUG    | __main__:trials:24 - Trial = 29241/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.578 | DEBUG    | __main__:trials:29 - Trial = 29241/30000 | Total reward = 50.35
2022-01-26 14:18:48.582 | DEBUG    | __main__:trials:24 - Trial = 29242/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.583 | DEBUG    | __main__:trials:29 - Trial = 29242/30000 | Total reward = 39.18
2022-01-26 14:18:48.586 | DEBUG    | __main__:trials:24 - Trial = 29243/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.588 | DEBUG    | __main__:trials:29 - Trial = 29243/30000 | Total reward = 37.99
2022-01-26 14:18:48.592 | DEBUG    | __main__:trials:24 - Trial = 29244/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.593 | DEBUG    | __main__:trials:29 - Trial = 29244/30000 | Total reward = 29.14
2022-01-26 14:18:48.596 | DEBUG    | __main__:trials:24 - Trial = 29245/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.598 | DEBUG    | __main__:trials:29 - Trial = 29245/30000 | Total reward = 35.05
2022-01-26 14:18:48.601 | DEBUG    | __main__:trials:24 - Trial = 29246/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.602 | DEBUG    | __main__:trials:29 - Trial = 29246/30000 | Total reward = 38.97
2022-01-26 14:18:48.605 | DEBUG    | __main__:trials:24 - Trial = 29247/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.607 | DEBUG    | __main__:trials:29 - Trial = 29247/30000 | Total reward = 38.96
2022-01-26 14:18:48.610 | DEBUG    | __main__:trials:24 - Trial = 29248/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.612 | DEBUG    | __main__:trials:29 - Trial = 29248/30000 | Total reward = 38.90
2022-01-26 14:18:48.615 | DEBUG    | __main__:trials:24 - Trial = 29249/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.617 | DEBUG    | __main__:trials:29 - Trial = 29249/30000 | Total reward = 40.43
2022-01-26 14:18:48.620 | DEBUG    | __main__:trials:24 - Trial = 29250/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.622 | DEBUG    | __main__:trials:29 - Trial = 29250/30000 | Total reward = 38.90
2022-01-26 14:18:48.626 | DEBUG    | __main__:trials:24 - Trial = 29251/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.627 | DEBUG    | __main__:trials:29 - Trial = 29251/30000 | Total reward = 32.09
2022-01-26 14:18:48.630 | DEBUG    | __main__:trials:26 - Trial = 29252/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.632 | DEBUG    | __main__:trials:29 - Trial = 29252/30000 | Total reward = 25.59
2022-01-26 14:18:48.636 | DEBUG    | __main__:trials:24 - Trial = 29253/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.637 | DEBUG    | __main__:trials:29 - Trial = 29253/30000 | Total reward = 31.43
2022-01-26 14:18:48.641 | DEBUG    | __main__:trials:24 - Trial = 29254/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.642 | DEBUG    | __main__:trials:29 - Trial = 29254/30000 | Total reward = 20.21
2022-01-26 14:18:48.645 | DEBUG    | __main__:trials:26 - Trial = 29255/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.647 | DEBUG    | __main__:trials:29 - Trial = 29255/30000 | Total reward = 13.28
2022-01-26 14:18:48.650 | DEBUG    | __main__:trials:24 - Trial = 29256/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.652 | DEBUG    | __main__:trials:29 - Trial = 29256/30000 | Total reward = 36.96
2022-01-26 14:18:48.656 | DEBUG    | __main__:trials:24 - Trial = 29257/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.656 | DEBUG    | __main__:trials:29 - Trial = 29257/30000 | Total reward = 38.65
2022-01-26 14:18:48.661 | DEBUG    | __main__:trials:24 - Trial = 29258/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.662 | DEBUG    | __main__:trials:29 - Trial = 29258/30000 | Total reward = 39.41
2022-01-26 14:18:48.666 | DEBUG    | __main__:trials:24 - Trial = 29259/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.668 | DEBUG    | __main__:trials:29 - Trial = 29259/30000 | Total reward = 42.45
2022-01-26 14:18:48.671 | DEBUG    | __main__:trials:24 - Trial = 29260/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.672 | DEBUG    | __main__:trials:29 - Trial = 29260/30000 | Total reward = 30.10
2022-01-26 14:18:48.676 | DEBUG    | __main__:trials:26 - Trial = 29261/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.678 | DEBUG    | __main__:trials:29 - Trial = 29261/30000 | Total reward = 31.85
2022-01-26 14:18:48.682 | DEBUG    | __main__:trials:24 - Trial = 29262/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.683 | DEBUG    | __main__:trials:29 - Trial = 29262/30000 | Total reward = 39.02
2022-01-26 14:18:48.686 | DEBUG    | __main__:trials:24 - Trial = 29263/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.688 | DEBUG    | __main__:trials:29 - Trial = 29263/30000 | Total reward = 33.28
2022-01-26 14:18:48.691 | DEBUG    | __main__:trials:24 - Trial = 29264/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.693 | DEBUG    | __main__:trials:29 - Trial = 29264/30000 | Total reward = 39.47
2022-01-26 14:18:48.696 | DEBUG    | __main__:trials:24 - Trial = 29265/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.697 | DEBUG    | __main__:trials:29 - Trial = 29265/30000 | Total reward = 37.12
2022-01-26 14:18:48.701 | DEBUG    | __main__:trials:26 - Trial = 29266/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.702 | DEBUG    | __main__:trials:29 - Trial = 29266/30000 | Total reward = 25.93
2022-01-26 14:18:48.705 | DEBUG    | __main__:trials:26 - Trial = 29267/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.707 | DEBUG    | __main__:trials:29 - Trial = 29267/30000 | Total reward = 14.11
2022-01-26 14:18:48.710 | DEBUG    | __main__:trials:24 - Trial = 29268/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.712 | DEBUG    | __main__:trials:29 - Trial = 29268/30000 | Total reward = 54.78
2022-01-26 14:18:48.715 | DEBUG    | __main__:trials:26 - Trial = 29269/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.717 | DEBUG    | __main__:trials:29 - Trial = 29269/30000 | Total reward = 20.74
2022-01-26 14:18:48.720 | DEBUG    | __main__:trials:24 - Trial = 29270/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.721 | DEBUG    | __main__:trials:29 - Trial = 29270/30000 | Total reward = 36.24
2022-01-26 14:18:48.725 | DEBUG    | __main__:trials:24 - Trial = 29271/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.727 | DEBUG    | __main__:trials:29 - Trial = 29271/30000 | Total reward = 55.42
2022-01-26 14:18:48.731 | DEBUG    | __main__:trials:24 - Trial = 29272/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.732 | DEBUG    | __main__:trials:29 - Trial = 29272/30000 | Total reward = 50.84
2022-01-26 14:18:48.736 | DEBUG    | __main__:trials:26 - Trial = 29273/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.737 | DEBUG    | __main__:trials:29 - Trial = 29273/30000 | Total reward = 30.08
2022-01-26 14:18:48.741 | DEBUG    | __main__:trials:24 - Trial = 29274/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.743 | DEBUG    | __main__:trials:29 - Trial = 29274/30000 | Total reward = 35.50
2022-01-26 14:18:48.747 | DEBUG    | __main__:trials:24 - Trial = 29275/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.748 | DEBUG    | __main__:trials:29 - Trial = 29275/30000 | Total reward = 38.27
2022-01-26 14:18:48.752 | DEBUG    | __main__:trials:24 - Trial = 29276/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.753 | DEBUG    | __main__:trials:29 - Trial = 29276/30000 | Total reward = 43.64
2022-01-26 14:18:48.757 | DEBUG    | __main__:trials:24 - Trial = 29277/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.759 | DEBUG    | __main__:trials:29 - Trial = 29277/30000 | Total reward = 38.40
2022-01-26 14:18:48.762 | DEBUG    | __main__:trials:24 - Trial = 29278/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.763 | DEBUG    | __main__:trials:29 - Trial = 29278/30000 | Total reward = 51.61
2022-01-26 14:18:48.767 | DEBUG    | __main__:trials:24 - Trial = 29279/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.769 | DEBUG    | __main__:trials:29 - Trial = 29279/30000 | Total reward = 28.77
2022-01-26 14:18:48.771 | DEBUG    | __main__:trials:26 - Trial = 29280/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.773 | DEBUG    | __main__:trials:29 - Trial = 29280/30000 | Total reward = 25.59
2022-01-26 14:18:48.777 | DEBUG    | __main__:trials:24 - Trial = 29281/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.778 | DEBUG    | __main__:trials:29 - Trial = 29281/30000 | Total reward = 39.15
2022-01-26 14:18:48.780 | DEBUG    | __main__:trials:24 - Trial = 29282/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.782 | DEBUG    | __main__:trials:29 - Trial = 29282/30000 | Total reward = 33.11
2022-01-26 14:18:48.785 | DEBUG    | __main__:trials:26 - Trial = 29283/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.787 | DEBUG    | __main__:trials:29 - Trial = 29283/30000 | Total reward = 18.04
2022-01-26 14:18:48.789 | DEBUG    | __main__:trials:26 - Trial = 29284/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.790 | DEBUG    | __main__:trials:29 - Trial = 29284/30000 | Total reward = 5.44
2022-01-26 14:18:48.793 | DEBUG    | __main__:trials:24 - Trial = 29285/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.794 | DEBUG    | __main__:trials:29 - Trial = 29285/30000 | Total reward = 34.56
2022-01-26 14:18:48.797 | DEBUG    | __main__:trials:24 - Trial = 29286/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.799 | DEBUG    | __main__:trials:29 - Trial = 29286/30000 | Total reward = 39.54
2022-01-26 14:18:48.802 | DEBUG    | __main__:trials:24 - Trial = 29287/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.803 | DEBUG    | __main__:trials:29 - Trial = 29287/30000 | Total reward = 37.91
2022-01-26 14:18:48.807 | DEBUG    | __main__:trials:24 - Trial = 29288/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.809 | DEBUG    | __main__:trials:29 - Trial = 29288/30000 | Total reward = 32.04
2022-01-26 14:18:48.812 | DEBUG    | __main__:trials:24 - Trial = 29289/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.813 | DEBUG    | __main__:trials:29 - Trial = 29289/30000 | Total reward = 57.37
2022-01-26 14:18:48.817 | DEBUG    | __main__:trials:24 - Trial = 29290/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.819 | DEBUG    | __main__:trials:29 - Trial = 29290/30000 | Total reward = 39.34
2022-01-26 14:18:48.822 | DEBUG    | __main__:trials:24 - Trial = 29291/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.823 | DEBUG    | __main__:trials:29 - Trial = 29291/30000 | Total reward = 34.04
2022-01-26 14:18:48.827 | DEBUG    | __main__:trials:24 - Trial = 29292/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.828 | DEBUG    | __main__:trials:29 - Trial = 29292/30000 | Total reward = 53.20
2022-01-26 14:18:48.832 | DEBUG    | __main__:trials:24 - Trial = 29293/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.833 | DEBUG    | __main__:trials:29 - Trial = 29293/30000 | Total reward = 38.52
2022-01-26 14:18:48.837 | DEBUG    | __main__:trials:24 - Trial = 29294/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.838 | DEBUG    | __main__:trials:29 - Trial = 29294/30000 | Total reward = 38.90
2022-01-26 14:18:48.841 | DEBUG    | __main__:trials:24 - Trial = 29295/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.842 | DEBUG    | __main__:trials:29 - Trial = 29295/30000 | Total reward = 35.72
2022-01-26 14:18:48.846 | DEBUG    | __main__:trials:26 - Trial = 29296/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.848 | DEBUG    | __main__:trials:29 - Trial = 29296/30000 | Total reward = 28.78
2022-01-26 14:18:48.852 | DEBUG    | __main__:trials:24 - Trial = 29297/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.852 | DEBUG    | __main__:trials:29 - Trial = 29297/30000 | Total reward = 31.43
2022-01-26 14:18:48.856 | DEBUG    | __main__:trials:24 - Trial = 29298/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.858 | DEBUG    | __main__:trials:29 - Trial = 29298/30000 | Total reward = 38.44
2022-01-26 14:18:48.862 | DEBUG    | __main__:trials:24 - Trial = 29299/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.862 | DEBUG    | __main__:trials:29 - Trial = 29299/30000 | Total reward = 35.92
2022-01-26 14:18:48.866 | DEBUG    | __main__:trials:24 - Trial = 29300/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.868 | DEBUG    | __main__:trials:29 - Trial = 29300/30000 | Total reward = 38.76
2022-01-26 14:18:48.871 | DEBUG    | __main__:trials:26 - Trial = 29301/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.872 | DEBUG    | __main__:trials:29 - Trial = 29301/30000 | Total reward = 18.42
2022-01-26 14:18:48.875 | DEBUG    | __main__:trials:26 - Trial = 29302/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.877 | DEBUG    | __main__:trials:29 - Trial = 29302/30000 | Total reward = 6.44
2022-01-26 14:18:48.880 | DEBUG    | __main__:trials:26 - Trial = 29303/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.881 | DEBUG    | __main__:trials:29 - Trial = 29303/30000 | Total reward = 22.99
2022-01-26 14:18:48.883 | DEBUG    | __main__:trials:26 - Trial = 29304/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.885 | DEBUG    | __main__:trials:29 - Trial = 29304/30000 | Total reward = 10.76
2022-01-26 14:18:48.888 | DEBUG    | __main__:trials:26 - Trial = 29305/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.890 | DEBUG    | __main__:trials:29 - Trial = 29305/30000 | Total reward = 16.56
2022-01-26 14:18:48.893 | DEBUG    | __main__:trials:24 - Trial = 29306/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.895 | DEBUG    | __main__:trials:29 - Trial = 29306/30000 | Total reward = 39.08
2022-01-26 14:18:48.899 | DEBUG    | __main__:trials:24 - Trial = 29307/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.900 | DEBUG    | __main__:trials:29 - Trial = 29307/30000 | Total reward = 38.90
2022-01-26 14:18:48.903 | DEBUG    | __main__:trials:24 - Trial = 29308/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.905 | DEBUG    | __main__:trials:29 - Trial = 29308/30000 | Total reward = 38.90
2022-01-26 14:18:48.908 | DEBUG    | __main__:trials:24 - Trial = 29309/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.910 | DEBUG    | __main__:trials:29 - Trial = 29309/30000 | Total reward = 38.90
2022-01-26 14:18:48.913 | DEBUG    | __main__:trials:24 - Trial = 29310/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.914 | DEBUG    | __main__:trials:29 - Trial = 29310/30000 | Total reward = 45.63
2022-01-26 14:18:48.917 | DEBUG    | __main__:trials:24 - Trial = 29311/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.919 | DEBUG    | __main__:trials:29 - Trial = 29311/30000 | Total reward = 50.15
2022-01-26 14:18:48.922 | DEBUG    | __main__:trials:24 - Trial = 29312/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.923 | DEBUG    | __main__:trials:29 - Trial = 29312/30000 | Total reward = 31.24
2022-01-26 14:18:48.926 | DEBUG    | __main__:trials:26 - Trial = 29313/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.927 | DEBUG    | __main__:trials:29 - Trial = 29313/30000 | Total reward = 9.03
2022-01-26 14:18:48.931 | DEBUG    | __main__:trials:24 - Trial = 29314/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.931 | DEBUG    | __main__:trials:29 - Trial = 29314/30000 | Total reward = 39.02
2022-01-26 14:18:48.935 | DEBUG    | __main__:trials:24 - Trial = 29315/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.936 | DEBUG    | __main__:trials:29 - Trial = 29315/30000 | Total reward = 38.74
2022-01-26 14:18:48.939 | DEBUG    | __main__:trials:24 - Trial = 29316/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.941 | DEBUG    | __main__:trials:29 - Trial = 29316/30000 | Total reward = 29.32
2022-01-26 14:18:48.944 | DEBUG    | __main__:trials:24 - Trial = 29317/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.945 | DEBUG    | __main__:trials:29 - Trial = 29317/30000 | Total reward = 30.15
2022-01-26 14:18:48.948 | DEBUG    | __main__:trials:26 - Trial = 29318/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.950 | DEBUG    | __main__:trials:29 - Trial = 29318/30000 | Total reward = 11.06
2022-01-26 14:18:48.953 | DEBUG    | __main__:trials:24 - Trial = 29319/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.955 | DEBUG    | __main__:trials:29 - Trial = 29319/30000 | Total reward = 39.67
2022-01-26 14:18:48.959 | DEBUG    | __main__:trials:24 - Trial = 29320/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.960 | DEBUG    | __main__:trials:29 - Trial = 29320/30000 | Total reward = 32.01
2022-01-26 14:18:48.963 | DEBUG    | __main__:trials:26 - Trial = 29321/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.965 | DEBUG    | __main__:trials:29 - Trial = 29321/30000 | Total reward = 11.96
2022-01-26 14:18:48.968 | DEBUG    | __main__:trials:26 - Trial = 29322/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.968 | DEBUG    | __main__:trials:29 - Trial = 29322/30000 | Total reward = 12.92
2022-01-26 14:18:48.971 | DEBUG    | __main__:trials:26 - Trial = 29323/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.972 | DEBUG    | __main__:trials:29 - Trial = 29323/30000 | Total reward = 13.28
2022-01-26 14:18:48.975 | DEBUG    | __main__:trials:26 - Trial = 29324/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.976 | DEBUG    | __main__:trials:29 - Trial = 29324/30000 | Total reward = 9.03
2022-01-26 14:18:48.980 | DEBUG    | __main__:trials:24 - Trial = 29325/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.981 | DEBUG    | __main__:trials:29 - Trial = 29325/30000 | Total reward = 27.29
2022-01-26 14:18:48.984 | DEBUG    | __main__:trials:26 - Trial = 29326/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.986 | DEBUG    | __main__:trials:29 - Trial = 29326/30000 | Total reward = 12.06
2022-01-26 14:18:48.989 | DEBUG    | __main__:trials:26 - Trial = 29327/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.991 | DEBUG    | __main__:trials:29 - Trial = 29327/30000 | Total reward = 22.68
2022-01-26 14:18:48.994 | DEBUG    | __main__:trials:24 - Trial = 29328/30000 | Max number of steps (20) reached
2022-01-26 14:18:48.996 | DEBUG    | __main__:trials:29 - Trial = 29328/30000 | Total reward = 21.85
2022-01-26 14:18:48.998 | DEBUG    | __main__:trials:26 - Trial = 29329/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:48.999 | DEBUG    | __main__:trials:29 - Trial = 29329/30000 | Total reward = 10.11
2022-01-26 14:18:49.003 | DEBUG    | __main__:trials:24 - Trial = 29330/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.004 | DEBUG    | __main__:trials:29 - Trial = 29330/30000 | Total reward = 25.15
2022-01-26 14:18:49.007 | DEBUG    | __main__:trials:26 - Trial = 29331/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.008 | DEBUG    | __main__:trials:29 - Trial = 29331/30000 | Total reward = 11.06
2022-01-26 14:18:49.012 | DEBUG    | __main__:trials:24 - Trial = 29332/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.013 | DEBUG    | __main__:trials:29 - Trial = 29332/30000 | Total reward = 51.35
2022-01-26 14:18:49.017 | DEBUG    | __main__:trials:24 - Trial = 29333/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.019 | DEBUG    | __main__:trials:29 - Trial = 29333/30000 | Total reward = 33.75
2022-01-26 14:18:49.021 | DEBUG    | __main__:trials:26 - Trial = 29334/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.022 | DEBUG    | __main__:trials:29 - Trial = 29334/30000 | Total reward = 11.06
2022-01-26 14:18:49.026 | DEBUG    | __main__:trials:26 - Trial = 29335/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.027 | DEBUG    | __main__:trials:29 - Trial = 29335/30000 | Total reward = 15.78
2022-01-26 14:18:49.031 | DEBUG    | __main__:trials:24 - Trial = 29336/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.033 | DEBUG    | __main__:trials:29 - Trial = 29336/30000 | Total reward = 33.99
2022-01-26 14:18:49.035 | DEBUG    | __main__:trials:26 - Trial = 29337/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.037 | DEBUG    | __main__:trials:29 - Trial = 29337/30000 | Total reward = 11.06
2022-01-26 14:18:49.040 | DEBUG    | __main__:trials:24 - Trial = 29338/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.041 | DEBUG    | __main__:trials:29 - Trial = 29338/30000 | Total reward = 30.09
2022-01-26 14:18:49.046 | DEBUG    | __main__:trials:24 - Trial = 29339/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.048 | DEBUG    | __main__:trials:29 - Trial = 29339/30000 | Total reward = 10.27
2022-01-26 14:18:49.050 | DEBUG    | __main__:trials:26 - Trial = 29340/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.051 | DEBUG    | __main__:trials:29 - Trial = 29340/30000 | Total reward = 6.44
2022-01-26 14:18:49.055 | DEBUG    | __main__:trials:24 - Trial = 29341/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.057 | DEBUG    | __main__:trials:29 - Trial = 29341/30000 | Total reward = 38.52
2022-01-26 14:18:49.060 | DEBUG    | __main__:trials:26 - Trial = 29342/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.061 | DEBUG    | __main__:trials:29 - Trial = 29342/30000 | Total reward = 12.38
2022-01-26 14:18:49.064 | DEBUG    | __main__:trials:26 - Trial = 29343/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.066 | DEBUG    | __main__:trials:29 - Trial = 29343/30000 | Total reward = 18.85
2022-01-26 14:18:49.069 | DEBUG    | __main__:trials:24 - Trial = 29344/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.070 | DEBUG    | __main__:trials:29 - Trial = 29344/30000 | Total reward = 39.51
2022-01-26 14:18:49.073 | DEBUG    | __main__:trials:26 - Trial = 29345/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.074 | DEBUG    | __main__:trials:29 - Trial = 29345/30000 | Total reward = 30.50
2022-01-26 14:18:49.076 | DEBUG    | __main__:trials:26 - Trial = 29346/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.077 | DEBUG    | __main__:trials:29 - Trial = 29346/30000 | Total reward = 11.11
2022-01-26 14:18:49.079 | DEBUG    | __main__:trials:26 - Trial = 29347/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.081 | DEBUG    | __main__:trials:29 - Trial = 29347/30000 | Total reward = 7.44
2022-01-26 14:18:49.084 | DEBUG    | __main__:trials:24 - Trial = 29348/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.085 | DEBUG    | __main__:trials:29 - Trial = 29348/30000 | Total reward = 29.94
2022-01-26 14:18:49.088 | DEBUG    | __main__:trials:24 - Trial = 29349/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.090 | DEBUG    | __main__:trials:29 - Trial = 29349/30000 | Total reward = 24.44
2022-01-26 14:18:49.094 | DEBUG    | __main__:trials:24 - Trial = 29350/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.095 | DEBUG    | __main__:trials:29 - Trial = 29350/30000 | Total reward = 31.65
2022-01-26 14:18:49.099 | DEBUG    | __main__:trials:24 - Trial = 29351/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.100 | DEBUG    | __main__:trials:29 - Trial = 29351/30000 | Total reward = 41.73
2022-01-26 14:18:49.103 | DEBUG    | __main__:trials:26 - Trial = 29352/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.105 | DEBUG    | __main__:trials:29 - Trial = 29352/30000 | Total reward = 12.53
2022-01-26 14:18:49.109 | DEBUG    | __main__:trials:24 - Trial = 29353/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.110 | DEBUG    | __main__:trials:29 - Trial = 29353/30000 | Total reward = 30.26
2022-01-26 14:18:49.114 | DEBUG    | __main__:trials:24 - Trial = 29354/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.116 | DEBUG    | __main__:trials:29 - Trial = 29354/30000 | Total reward = 46.68
2022-01-26 14:18:49.118 | DEBUG    | __main__:trials:26 - Trial = 29355/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.119 | DEBUG    | __main__:trials:29 - Trial = 29355/30000 | Total reward = 11.06
2022-01-26 14:18:49.122 | DEBUG    | __main__:trials:26 - Trial = 29356/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.123 | DEBUG    | __main__:trials:29 - Trial = 29356/30000 | Total reward = 11.06
2022-01-26 14:18:49.126 | DEBUG    | __main__:trials:26 - Trial = 29357/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.128 | DEBUG    | __main__:trials:29 - Trial = 29357/30000 | Total reward = 11.06
2022-01-26 14:18:49.130 | DEBUG    | __main__:trials:26 - Trial = 29358/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.132 | DEBUG    | __main__:trials:29 - Trial = 29358/30000 | Total reward = 11.06
2022-01-26 14:18:49.135 | DEBUG    | __main__:trials:24 - Trial = 29359/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.136 | DEBUG    | __main__:trials:29 - Trial = 29359/30000 | Total reward = 49.27
2022-01-26 14:18:49.139 | DEBUG    | __main__:trials:26 - Trial = 29360/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.140 | DEBUG    | __main__:trials:29 - Trial = 29360/30000 | Total reward = 13.08
2022-01-26 14:18:49.143 | DEBUG    | __main__:trials:26 - Trial = 29361/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.144 | DEBUG    | __main__:trials:29 - Trial = 29361/30000 | Total reward = 11.06
2022-01-26 14:18:49.147 | DEBUG    | __main__:trials:26 - Trial = 29362/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.148 | DEBUG    | __main__:trials:29 - Trial = 29362/30000 | Total reward = 11.06
2022-01-26 14:18:49.151 | DEBUG    | __main__:trials:26 - Trial = 29363/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.151 | DEBUG    | __main__:trials:29 - Trial = 29363/30000 | Total reward = 12.09
2022-01-26 14:18:49.156 | DEBUG    | __main__:trials:26 - Trial = 29364/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.157 | DEBUG    | __main__:trials:29 - Trial = 29364/30000 | Total reward = 19.44
2022-01-26 14:18:49.160 | DEBUG    | __main__:trials:26 - Trial = 29365/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.161 | DEBUG    | __main__:trials:29 - Trial = 29365/30000 | Total reward = 21.73
2022-01-26 14:18:49.165 | DEBUG    | __main__:trials:24 - Trial = 29366/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.167 | DEBUG    | __main__:trials:29 - Trial = 29366/30000 | Total reward = 15.04
2022-01-26 14:18:49.171 | DEBUG    | __main__:trials:24 - Trial = 29367/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.172 | DEBUG    | __main__:trials:29 - Trial = 29367/30000 | Total reward = 25.48
2022-01-26 14:18:49.176 | DEBUG    | __main__:trials:24 - Trial = 29368/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.177 | DEBUG    | __main__:trials:29 - Trial = 29368/30000 | Total reward = 36.91
2022-01-26 14:18:49.181 | DEBUG    | __main__:trials:24 - Trial = 29369/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.182 | DEBUG    | __main__:trials:29 - Trial = 29369/30000 | Total reward = 18.65
2022-01-26 14:18:49.186 | DEBUG    | __main__:trials:24 - Trial = 29370/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.187 | DEBUG    | __main__:trials:29 - Trial = 29370/30000 | Total reward = 13.55
2022-01-26 14:18:49.190 | DEBUG    | __main__:trials:26 - Trial = 29371/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.191 | DEBUG    | __main__:trials:29 - Trial = 29371/30000 | Total reward = 16.94
2022-01-26 14:18:49.195 | DEBUG    | __main__:trials:24 - Trial = 29372/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.197 | DEBUG    | __main__:trials:29 - Trial = 29372/30000 | Total reward = 29.23
2022-01-26 14:18:49.199 | DEBUG    | __main__:trials:26 - Trial = 29373/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.200 | DEBUG    | __main__:trials:29 - Trial = 29373/30000 | Total reward = 6.44
2022-01-26 14:18:49.202 | DEBUG    | __main__:trials:26 - Trial = 29374/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.204 | DEBUG    | __main__:trials:29 - Trial = 29374/30000 | Total reward = 10.15
2022-01-26 14:18:49.207 | DEBUG    | __main__:trials:24 - Trial = 29375/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.209 | DEBUG    | __main__:trials:29 - Trial = 29375/30000 | Total reward = 40.07
2022-01-26 14:18:49.212 | DEBUG    | __main__:trials:24 - Trial = 29376/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.214 | DEBUG    | __main__:trials:29 - Trial = 29376/30000 | Total reward = 29.86
2022-01-26 14:18:49.217 | DEBUG    | __main__:trials:24 - Trial = 29377/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.218 | DEBUG    | __main__:trials:29 - Trial = 29377/30000 | Total reward = 25.95
2022-01-26 14:18:49.222 | DEBUG    | __main__:trials:24 - Trial = 29378/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.223 | DEBUG    | __main__:trials:29 - Trial = 29378/30000 | Total reward = 35.67
2022-01-26 14:18:49.227 | DEBUG    | __main__:trials:24 - Trial = 29379/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.228 | DEBUG    | __main__:trials:29 - Trial = 29379/30000 | Total reward = 41.94
2022-01-26 14:18:49.232 | DEBUG    | __main__:trials:24 - Trial = 29380/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.234 | DEBUG    | __main__:trials:29 - Trial = 29380/30000 | Total reward = 38.72
2022-01-26 14:18:49.237 | DEBUG    | __main__:trials:24 - Trial = 29381/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.239 | DEBUG    | __main__:trials:29 - Trial = 29381/30000 | Total reward = 38.90
2022-01-26 14:18:49.242 | DEBUG    | __main__:trials:24 - Trial = 29382/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.244 | DEBUG    | __main__:trials:29 - Trial = 29382/30000 | Total reward = 38.90
2022-01-26 14:18:49.248 | DEBUG    | __main__:trials:24 - Trial = 29383/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.248 | DEBUG    | __main__:trials:29 - Trial = 29383/30000 | Total reward = 31.36
2022-01-26 14:18:49.253 | DEBUG    | __main__:trials:24 - Trial = 29384/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.254 | DEBUG    | __main__:trials:29 - Trial = 29384/30000 | Total reward = 19.05
2022-01-26 14:18:49.256 | DEBUG    | __main__:trials:26 - Trial = 29385/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.257 | DEBUG    | __main__:trials:29 - Trial = 29385/30000 | Total reward = 6.44
2022-01-26 14:18:49.260 | DEBUG    | __main__:trials:26 - Trial = 29386/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.262 | DEBUG    | __main__:trials:29 - Trial = 29386/30000 | Total reward = 11.87
2022-01-26 14:18:49.264 | DEBUG    | __main__:trials:26 - Trial = 29387/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.266 | DEBUG    | __main__:trials:29 - Trial = 29387/30000 | Total reward = 6.44
2022-01-26 14:18:49.269 | DEBUG    | __main__:trials:24 - Trial = 29388/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.271 | DEBUG    | __main__:trials:29 - Trial = 29388/30000 | Total reward = 29.46
2022-01-26 14:18:49.275 | DEBUG    | __main__:trials:24 - Trial = 29389/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.276 | DEBUG    | __main__:trials:29 - Trial = 29389/30000 | Total reward = 31.67
2022-01-26 14:18:49.279 | DEBUG    | __main__:trials:26 - Trial = 29390/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.281 | DEBUG    | __main__:trials:29 - Trial = 29390/30000 | Total reward = 11.06
2022-01-26 14:18:49.284 | DEBUG    | __main__:trials:24 - Trial = 29391/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.285 | DEBUG    | __main__:trials:29 - Trial = 29391/30000 | Total reward = 30.30
2022-01-26 14:18:49.289 | DEBUG    | __main__:trials:24 - Trial = 29392/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.289 | DEBUG    | __main__:trials:29 - Trial = 29392/30000 | Total reward = 30.87
2022-01-26 14:18:49.295 | DEBUG    | __main__:trials:24 - Trial = 29393/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.295 | DEBUG    | __main__:trials:29 - Trial = 29393/30000 | Total reward = 38.60
2022-01-26 14:18:49.300 | DEBUG    | __main__:trials:24 - Trial = 29394/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.302 | DEBUG    | __main__:trials:29 - Trial = 29394/30000 | Total reward = 32.94
2022-01-26 14:18:49.305 | DEBUG    | __main__:trials:24 - Trial = 29395/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.306 | DEBUG    | __main__:trials:29 - Trial = 29395/30000 | Total reward = 38.65
2022-01-26 14:18:49.310 | DEBUG    | __main__:trials:24 - Trial = 29396/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.312 | DEBUG    | __main__:trials:29 - Trial = 29396/30000 | Total reward = 30.79
2022-01-26 14:18:49.316 | DEBUG    | __main__:trials:24 - Trial = 29397/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.317 | DEBUG    | __main__:trials:29 - Trial = 29397/30000 | Total reward = 38.90
2022-01-26 14:18:49.321 | DEBUG    | __main__:trials:24 - Trial = 29398/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.323 | DEBUG    | __main__:trials:29 - Trial = 29398/30000 | Total reward = 41.29
2022-01-26 14:18:49.326 | DEBUG    | __main__:trials:24 - Trial = 29399/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.327 | DEBUG    | __main__:trials:29 - Trial = 29399/30000 | Total reward = 32.54
2022-01-26 14:18:49.332 | DEBUG    | __main__:trials:26 - Trial = 29400/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.333 | DEBUG    | __main__:trials:29 - Trial = 29400/30000 | Total reward = 28.25
2022-01-26 14:18:49.336 | DEBUG    | __main__:trials:26 - Trial = 29401/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.338 | DEBUG    | __main__:trials:29 - Trial = 29401/30000 | Total reward = 12.84
2022-01-26 14:18:49.342 | DEBUG    | __main__:trials:24 - Trial = 29402/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.342 | DEBUG    | __main__:trials:29 - Trial = 29402/30000 | Total reward = 34.58
2022-01-26 14:18:49.345 | DEBUG    | __main__:trials:26 - Trial = 29403/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.346 | DEBUG    | __main__:trials:29 - Trial = 29403/30000 | Total reward = 10.67
2022-01-26 14:18:49.349 | DEBUG    | __main__:trials:26 - Trial = 29404/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.350 | DEBUG    | __main__:trials:29 - Trial = 29404/30000 | Total reward = 10.11
2022-01-26 14:18:49.353 | DEBUG    | __main__:trials:26 - Trial = 29405/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.355 | DEBUG    | __main__:trials:29 - Trial = 29405/30000 | Total reward = 13.06
2022-01-26 14:18:49.359 | DEBUG    | __main__:trials:24 - Trial = 29406/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.359 | DEBUG    | __main__:trials:29 - Trial = 29406/30000 | Total reward = 38.98
2022-01-26 14:18:49.364 | DEBUG    | __main__:trials:24 - Trial = 29407/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.365 | DEBUG    | __main__:trials:29 - Trial = 29407/30000 | Total reward = 50.39
2022-01-26 14:18:49.369 | DEBUG    | __main__:trials:24 - Trial = 29408/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.370 | DEBUG    | __main__:trials:29 - Trial = 29408/30000 | Total reward = 35.18
2022-01-26 14:18:49.373 | DEBUG    | __main__:trials:24 - Trial = 29409/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.374 | DEBUG    | __main__:trials:29 - Trial = 29409/30000 | Total reward = 32.83
2022-01-26 14:18:49.377 | DEBUG    | __main__:trials:24 - Trial = 29410/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.379 | DEBUG    | __main__:trials:29 - Trial = 29410/30000 | Total reward = 13.89
2022-01-26 14:18:49.382 | DEBUG    | __main__:trials:26 - Trial = 29411/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.383 | DEBUG    | __main__:trials:29 - Trial = 29411/30000 | Total reward = 6.44
2022-01-26 14:18:49.387 | DEBUG    | __main__:trials:24 - Trial = 29412/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.388 | DEBUG    | __main__:trials:29 - Trial = 29412/30000 | Total reward = 17.74
2022-01-26 14:18:49.390 | DEBUG    | __main__:trials:26 - Trial = 29413/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.392 | DEBUG    | __main__:trials:29 - Trial = 29413/30000 | Total reward = 7.84
2022-01-26 14:18:49.394 | DEBUG    | __main__:trials:26 - Trial = 29414/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.396 | DEBUG    | __main__:trials:29 - Trial = 29414/30000 | Total reward = 10.76
2022-01-26 14:18:49.399 | DEBUG    | __main__:trials:24 - Trial = 29415/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.401 | DEBUG    | __main__:trials:29 - Trial = 29415/30000 | Total reward = 47.84
2022-01-26 14:18:49.404 | DEBUG    | __main__:trials:26 - Trial = 29416/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.405 | DEBUG    | __main__:trials:29 - Trial = 29416/30000 | Total reward = 27.18
2022-01-26 14:18:49.408 | DEBUG    | __main__:trials:24 - Trial = 29417/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.409 | DEBUG    | __main__:trials:29 - Trial = 29417/30000 | Total reward = 48.84
2022-01-26 14:18:49.413 | DEBUG    | __main__:trials:24 - Trial = 29418/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.414 | DEBUG    | __main__:trials:29 - Trial = 29418/30000 | Total reward = 46.08
2022-01-26 14:18:49.418 | DEBUG    | __main__:trials:26 - Trial = 29419/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.419 | DEBUG    | __main__:trials:29 - Trial = 29419/30000 | Total reward = 39.06
2022-01-26 14:18:49.422 | DEBUG    | __main__:trials:24 - Trial = 29420/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.424 | DEBUG    | __main__:trials:29 - Trial = 29420/30000 | Total reward = 31.31
2022-01-26 14:18:49.428 | DEBUG    | __main__:trials:24 - Trial = 29421/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.429 | DEBUG    | __main__:trials:29 - Trial = 29421/30000 | Total reward = 38.87
2022-01-26 14:18:49.433 | DEBUG    | __main__:trials:24 - Trial = 29422/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.434 | DEBUG    | __main__:trials:29 - Trial = 29422/30000 | Total reward = 38.90
2022-01-26 14:18:49.438 | DEBUG    | __main__:trials:24 - Trial = 29423/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.439 | DEBUG    | __main__:trials:29 - Trial = 29423/30000 | Total reward = 38.90
2022-01-26 14:18:49.443 | DEBUG    | __main__:trials:24 - Trial = 29424/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.444 | DEBUG    | __main__:trials:29 - Trial = 29424/30000 | Total reward = 41.06
2022-01-26 14:18:49.448 | DEBUG    | __main__:trials:24 - Trial = 29425/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.449 | DEBUG    | __main__:trials:29 - Trial = 29425/30000 | Total reward = 41.70
2022-01-26 14:18:49.453 | DEBUG    | __main__:trials:24 - Trial = 29426/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.454 | DEBUG    | __main__:trials:29 - Trial = 29426/30000 | Total reward = 39.10
2022-01-26 14:18:49.458 | DEBUG    | __main__:trials:24 - Trial = 29427/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.460 | DEBUG    | __main__:trials:29 - Trial = 29427/30000 | Total reward = 38.90
2022-01-26 14:18:49.464 | DEBUG    | __main__:trials:24 - Trial = 29428/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.465 | DEBUG    | __main__:trials:29 - Trial = 29428/30000 | Total reward = 38.70
2022-01-26 14:18:49.468 | DEBUG    | __main__:trials:24 - Trial = 29429/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.470 | DEBUG    | __main__:trials:29 - Trial = 29429/30000 | Total reward = 38.89
2022-01-26 14:18:49.474 | DEBUG    | __main__:trials:24 - Trial = 29430/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.474 | DEBUG    | __main__:trials:29 - Trial = 29430/30000 | Total reward = 49.98
2022-01-26 14:18:49.479 | DEBUG    | __main__:trials:24 - Trial = 29431/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.480 | DEBUG    | __main__:trials:29 - Trial = 29431/30000 | Total reward = 38.15
2022-01-26 14:18:49.484 | DEBUG    | __main__:trials:24 - Trial = 29432/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.485 | DEBUG    | __main__:trials:29 - Trial = 29432/30000 | Total reward = 40.06
2022-01-26 14:18:49.489 | DEBUG    | __main__:trials:24 - Trial = 29433/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.490 | DEBUG    | __main__:trials:29 - Trial = 29433/30000 | Total reward = 37.38
2022-01-26 14:18:49.493 | DEBUG    | __main__:trials:26 - Trial = 29434/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.494 | DEBUG    | __main__:trials:29 - Trial = 29434/30000 | Total reward = 11.11
2022-01-26 14:18:49.498 | DEBUG    | __main__:trials:26 - Trial = 29435/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.499 | DEBUG    | __main__:trials:29 - Trial = 29435/30000 | Total reward = 33.08
2022-01-26 14:18:49.503 | DEBUG    | __main__:trials:24 - Trial = 29436/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.504 | DEBUG    | __main__:trials:29 - Trial = 29436/30000 | Total reward = 34.53
2022-01-26 14:18:49.508 | DEBUG    | __main__:trials:26 - Trial = 29437/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.509 | DEBUG    | __main__:trials:29 - Trial = 29437/30000 | Total reward = 14.31
2022-01-26 14:18:49.512 | DEBUG    | __main__:trials:26 - Trial = 29438/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.513 | DEBUG    | __main__:trials:29 - Trial = 29438/30000 | Total reward = 11.54
2022-01-26 14:18:49.516 | DEBUG    | __main__:trials:26 - Trial = 29439/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.517 | DEBUG    | __main__:trials:29 - Trial = 29439/30000 | Total reward = 10.67
2022-01-26 14:18:49.521 | DEBUG    | __main__:trials:24 - Trial = 29440/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.521 | DEBUG    | __main__:trials:29 - Trial = 29440/30000 | Total reward = 31.57
2022-01-26 14:18:49.526 | DEBUG    | __main__:trials:24 - Trial = 29441/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.527 | DEBUG    | __main__:trials:29 - Trial = 29441/30000 | Total reward = 36.98
2022-01-26 14:18:49.530 | DEBUG    | __main__:trials:26 - Trial = 29442/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.530 | DEBUG    | __main__:trials:29 - Trial = 29442/30000 | Total reward = 9.29
2022-01-26 14:18:49.535 | DEBUG    | __main__:trials:24 - Trial = 29443/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.536 | DEBUG    | __main__:trials:29 - Trial = 29443/30000 | Total reward = 51.73
2022-01-26 14:18:49.540 | DEBUG    | __main__:trials:24 - Trial = 29444/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.542 | DEBUG    | __main__:trials:29 - Trial = 29444/30000 | Total reward = 39.02
2022-01-26 14:18:49.546 | DEBUG    | __main__:trials:24 - Trial = 29445/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.546 | DEBUG    | __main__:trials:29 - Trial = 29445/30000 | Total reward = 37.02
2022-01-26 14:18:49.550 | DEBUG    | __main__:trials:24 - Trial = 29446/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.552 | DEBUG    | __main__:trials:29 - Trial = 29446/30000 | Total reward = 47.93
2022-01-26 14:18:49.556 | DEBUG    | __main__:trials:24 - Trial = 29447/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.556 | DEBUG    | __main__:trials:29 - Trial = 29447/30000 | Total reward = 39.32
2022-01-26 14:18:49.560 | DEBUG    | __main__:trials:24 - Trial = 29448/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.562 | DEBUG    | __main__:trials:29 - Trial = 29448/30000 | Total reward = 44.97
2022-01-26 14:18:49.565 | DEBUG    | __main__:trials:24 - Trial = 29449/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.567 | DEBUG    | __main__:trials:29 - Trial = 29449/30000 | Total reward = 46.97
2022-01-26 14:18:49.570 | DEBUG    | __main__:trials:24 - Trial = 29450/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.572 | DEBUG    | __main__:trials:29 - Trial = 29450/30000 | Total reward = 37.67
2022-01-26 14:18:49.575 | DEBUG    | __main__:trials:24 - Trial = 29451/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.576 | DEBUG    | __main__:trials:29 - Trial = 29451/30000 | Total reward = 58.61
2022-01-26 14:18:49.579 | DEBUG    | __main__:trials:24 - Trial = 29452/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.581 | DEBUG    | __main__:trials:29 - Trial = 29452/30000 | Total reward = 51.52
2022-01-26 14:18:49.584 | DEBUG    | __main__:trials:24 - Trial = 29453/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.586 | DEBUG    | __main__:trials:29 - Trial = 29453/30000 | Total reward = 42.42
2022-01-26 14:18:49.589 | DEBUG    | __main__:trials:24 - Trial = 29454/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.591 | DEBUG    | __main__:trials:29 - Trial = 29454/30000 | Total reward = 38.38
2022-01-26 14:18:49.595 | DEBUG    | __main__:trials:24 - Trial = 29455/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.595 | DEBUG    | __main__:trials:29 - Trial = 29455/30000 | Total reward = 28.38
2022-01-26 14:18:49.600 | DEBUG    | __main__:trials:24 - Trial = 29456/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.601 | DEBUG    | __main__:trials:29 - Trial = 29456/30000 | Total reward = 31.84
2022-01-26 14:18:49.605 | DEBUG    | __main__:trials:24 - Trial = 29457/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.606 | DEBUG    | __main__:trials:29 - Trial = 29457/30000 | Total reward = 38.92
2022-01-26 14:18:49.608 | DEBUG    | __main__:trials:26 - Trial = 29458/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.609 | DEBUG    | __main__:trials:29 - Trial = 29458/30000 | Total reward = 13.73
2022-01-26 14:18:49.611 | DEBUG    | __main__:trials:26 - Trial = 29459/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.612 | DEBUG    | __main__:trials:29 - Trial = 29459/30000 | Total reward = 13.73
2022-01-26 14:18:49.615 | DEBUG    | __main__:trials:24 - Trial = 29460/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.617 | DEBUG    | __main__:trials:29 - Trial = 29460/30000 | Total reward = 33.73
2022-01-26 14:18:49.620 | DEBUG    | __main__:trials:24 - Trial = 29461/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.622 | DEBUG    | __main__:trials:29 - Trial = 29461/30000 | Total reward = 38.90
2022-01-26 14:18:49.625 | DEBUG    | __main__:trials:24 - Trial = 29462/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.628 | DEBUG    | __main__:trials:29 - Trial = 29462/30000 | Total reward = 43.09
2022-01-26 14:18:49.630 | DEBUG    | __main__:trials:24 - Trial = 29463/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.632 | DEBUG    | __main__:trials:29 - Trial = 29463/30000 | Total reward = 54.12
2022-01-26 14:18:49.635 | DEBUG    | __main__:trials:24 - Trial = 29464/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.637 | DEBUG    | __main__:trials:29 - Trial = 29464/30000 | Total reward = 29.82
2022-01-26 14:18:49.640 | DEBUG    | __main__:trials:24 - Trial = 29465/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.641 | DEBUG    | __main__:trials:29 - Trial = 29465/30000 | Total reward = 38.18
2022-01-26 14:18:49.646 | DEBUG    | __main__:trials:24 - Trial = 29466/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.647 | DEBUG    | __main__:trials:29 - Trial = 29466/30000 | Total reward = 29.22
2022-01-26 14:18:49.650 | DEBUG    | __main__:trials:24 - Trial = 29467/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.652 | DEBUG    | __main__:trials:29 - Trial = 29467/30000 | Total reward = 39.69
2022-01-26 14:18:49.655 | DEBUG    | __main__:trials:24 - Trial = 29468/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.657 | DEBUG    | __main__:trials:29 - Trial = 29468/30000 | Total reward = 38.77
2022-01-26 14:18:49.661 | DEBUG    | __main__:trials:24 - Trial = 29469/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.662 | DEBUG    | __main__:trials:29 - Trial = 29469/30000 | Total reward = 41.57
2022-01-26 14:18:49.666 | DEBUG    | __main__:trials:24 - Trial = 29470/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.667 | DEBUG    | __main__:trials:29 - Trial = 29470/30000 | Total reward = 47.10
2022-01-26 14:18:49.671 | DEBUG    | __main__:trials:24 - Trial = 29471/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.673 | DEBUG    | __main__:trials:29 - Trial = 29471/30000 | Total reward = 34.73
2022-01-26 14:18:49.676 | DEBUG    | __main__:trials:24 - Trial = 29472/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.677 | DEBUG    | __main__:trials:29 - Trial = 29472/30000 | Total reward = 41.02
2022-01-26 14:18:49.680 | DEBUG    | __main__:trials:24 - Trial = 29473/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.682 | DEBUG    | __main__:trials:29 - Trial = 29473/30000 | Total reward = 38.17
2022-01-26 14:18:49.685 | DEBUG    | __main__:trials:26 - Trial = 29474/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.686 | DEBUG    | __main__:trials:29 - Trial = 29474/30000 | Total reward = 11.06
2022-01-26 14:18:49.689 | DEBUG    | __main__:trials:26 - Trial = 29475/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.690 | DEBUG    | __main__:trials:29 - Trial = 29475/30000 | Total reward = 12.92
2022-01-26 14:18:49.693 | DEBUG    | __main__:trials:26 - Trial = 29476/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.695 | DEBUG    | __main__:trials:29 - Trial = 29476/30000 | Total reward = 9.03
2022-01-26 14:18:49.699 | DEBUG    | __main__:trials:24 - Trial = 29477/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.700 | DEBUG    | __main__:trials:29 - Trial = 29477/30000 | Total reward = 36.98
2022-01-26 14:18:49.703 | DEBUG    | __main__:trials:24 - Trial = 29478/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.705 | DEBUG    | __main__:trials:29 - Trial = 29478/30000 | Total reward = 37.05
2022-01-26 14:18:49.708 | DEBUG    | __main__:trials:26 - Trial = 29479/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.708 | DEBUG    | __main__:trials:29 - Trial = 29479/30000 | Total reward = 10.52
2022-01-26 14:18:49.712 | DEBUG    | __main__:trials:26 - Trial = 29480/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.713 | DEBUG    | __main__:trials:29 - Trial = 29480/30000 | Total reward = 31.47
2022-01-26 14:18:49.716 | DEBUG    | __main__:trials:26 - Trial = 29481/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.717 | DEBUG    | __main__:trials:29 - Trial = 29481/30000 | Total reward = 19.20
2022-01-26 14:18:49.721 | DEBUG    | __main__:trials:24 - Trial = 29482/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.723 | DEBUG    | __main__:trials:29 - Trial = 29482/30000 | Total reward = 28.25
2022-01-26 14:18:49.725 | DEBUG    | __main__:trials:26 - Trial = 29483/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.726 | DEBUG    | __main__:trials:29 - Trial = 29483/30000 | Total reward = 11.06
2022-01-26 14:18:49.729 | DEBUG    | __main__:trials:24 - Trial = 29484/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.731 | DEBUG    | __main__:trials:29 - Trial = 29484/30000 | Total reward = 23.34
2022-01-26 14:18:49.733 | DEBUG    | __main__:trials:26 - Trial = 29485/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.734 | DEBUG    | __main__:trials:29 - Trial = 29485/30000 | Total reward = 10.67
2022-01-26 14:18:49.737 | DEBUG    | __main__:trials:24 - Trial = 29486/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.738 | DEBUG    | __main__:trials:29 - Trial = 29486/30000 | Total reward = 38.51
2022-01-26 14:18:49.740 | DEBUG    | __main__:trials:26 - Trial = 29487/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.741 | DEBUG    | __main__:trials:29 - Trial = 29487/30000 | Total reward = 11.06
2022-01-26 14:18:49.745 | DEBUG    | __main__:trials:24 - Trial = 29488/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.746 | DEBUG    | __main__:trials:29 - Trial = 29488/30000 | Total reward = 22.56
2022-01-26 14:18:49.748 | DEBUG    | __main__:trials:26 - Trial = 29489/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.749 | DEBUG    | __main__:trials:29 - Trial = 29489/30000 | Total reward = 12.39
2022-01-26 14:18:49.753 | DEBUG    | __main__:trials:24 - Trial = 29490/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.754 | DEBUG    | __main__:trials:29 - Trial = 29490/30000 | Total reward = 34.85
2022-01-26 14:18:49.757 | DEBUG    | __main__:trials:26 - Trial = 29491/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.758 | DEBUG    | __main__:trials:29 - Trial = 29491/30000 | Total reward = 10.52
2022-01-26 14:18:49.762 | DEBUG    | __main__:trials:24 - Trial = 29492/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.763 | DEBUG    | __main__:trials:29 - Trial = 29492/30000 | Total reward = 28.19
2022-01-26 14:18:49.765 | DEBUG    | __main__:trials:26 - Trial = 29493/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.767 | DEBUG    | __main__:trials:29 - Trial = 29493/30000 | Total reward = 11.06
2022-01-26 14:18:49.771 | DEBUG    | __main__:trials:24 - Trial = 29494/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.772 | DEBUG    | __main__:trials:29 - Trial = 29494/30000 | Total reward = 42.33
2022-01-26 14:18:49.776 | DEBUG    | __main__:trials:24 - Trial = 29495/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.777 | DEBUG    | __main__:trials:29 - Trial = 29495/30000 | Total reward = 38.58
2022-01-26 14:18:49.780 | DEBUG    | __main__:trials:26 - Trial = 29496/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.780 | DEBUG    | __main__:trials:29 - Trial = 29496/30000 | Total reward = 10.11
2022-01-26 14:18:49.784 | DEBUG    | __main__:trials:26 - Trial = 29497/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.785 | DEBUG    | __main__:trials:29 - Trial = 29497/30000 | Total reward = 16.12
2022-01-26 14:18:49.789 | DEBUG    | __main__:trials:24 - Trial = 29498/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.791 | DEBUG    | __main__:trials:29 - Trial = 29498/30000 | Total reward = 37.89
2022-01-26 14:18:49.794 | DEBUG    | __main__:trials:24 - Trial = 29499/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.795 | DEBUG    | __main__:trials:29 - Trial = 29499/30000 | Total reward = 40.10
2022-01-26 14:18:49.799 | DEBUG    | __main__:trials:24 - Trial = 29500/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.800 | DEBUG    | __main__:trials:29 - Trial = 29500/30000 | Total reward = 34.71
2022-01-26 14:18:49.804 | DEBUG    | __main__:trials:24 - Trial = 29501/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.804 | DEBUG    | __main__:trials:29 - Trial = 29501/30000 | Total reward = 30.42
2022-01-26 14:18:49.809 | DEBUG    | __main__:trials:24 - Trial = 29502/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.810 | DEBUG    | __main__:trials:29 - Trial = 29502/30000 | Total reward = 36.04
2022-01-26 14:18:49.814 | DEBUG    | __main__:trials:24 - Trial = 29503/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.815 | DEBUG    | __main__:trials:29 - Trial = 29503/30000 | Total reward = 38.52
2022-01-26 14:18:49.819 | DEBUG    | __main__:trials:24 - Trial = 29504/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.821 | DEBUG    | __main__:trials:29 - Trial = 29504/30000 | Total reward = 39.07
2022-01-26 14:18:49.824 | DEBUG    | __main__:trials:24 - Trial = 29505/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.826 | DEBUG    | __main__:trials:29 - Trial = 29505/30000 | Total reward = 41.86
2022-01-26 14:18:49.830 | DEBUG    | __main__:trials:24 - Trial = 29506/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.830 | DEBUG    | __main__:trials:29 - Trial = 29506/30000 | Total reward = 38.65
2022-01-26 14:18:49.835 | DEBUG    | __main__:trials:24 - Trial = 29507/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.836 | DEBUG    | __main__:trials:29 - Trial = 29507/30000 | Total reward = 43.26
2022-01-26 14:18:49.840 | DEBUG    | __main__:trials:24 - Trial = 29508/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.842 | DEBUG    | __main__:trials:29 - Trial = 29508/30000 | Total reward = 39.46
2022-01-26 14:18:49.846 | DEBUG    | __main__:trials:24 - Trial = 29509/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.846 | DEBUG    | __main__:trials:29 - Trial = 29509/30000 | Total reward = 38.33
2022-01-26 14:18:49.850 | DEBUG    | __main__:trials:24 - Trial = 29510/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.852 | DEBUG    | __main__:trials:29 - Trial = 29510/30000 | Total reward = 48.65
2022-01-26 14:18:49.856 | DEBUG    | __main__:trials:24 - Trial = 29511/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.856 | DEBUG    | __main__:trials:29 - Trial = 29511/30000 | Total reward = 33.02
2022-01-26 14:18:49.861 | DEBUG    | __main__:trials:24 - Trial = 29512/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.862 | DEBUG    | __main__:trials:29 - Trial = 29512/30000 | Total reward = 39.31
2022-01-26 14:18:49.866 | DEBUG    | __main__:trials:24 - Trial = 29513/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.866 | DEBUG    | __main__:trials:29 - Trial = 29513/30000 | Total reward = 39.34
2022-01-26 14:18:49.871 | DEBUG    | __main__:trials:24 - Trial = 29514/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.871 | DEBUG    | __main__:trials:29 - Trial = 29514/30000 | Total reward = 39.39
2022-01-26 14:18:49.875 | DEBUG    | __main__:trials:24 - Trial = 29515/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.877 | DEBUG    | __main__:trials:29 - Trial = 29515/30000 | Total reward = 30.72
2022-01-26 14:18:49.880 | DEBUG    | __main__:trials:24 - Trial = 29516/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.882 | DEBUG    | __main__:trials:29 - Trial = 29516/30000 | Total reward = 40.21
2022-01-26 14:18:49.885 | DEBUG    | __main__:trials:24 - Trial = 29517/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.886 | DEBUG    | __main__:trials:29 - Trial = 29517/30000 | Total reward = 39.64
2022-01-26 14:18:49.889 | DEBUG    | __main__:trials:24 - Trial = 29518/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.890 | DEBUG    | __main__:trials:29 - Trial = 29518/30000 | Total reward = 57.81
2022-01-26 14:18:49.893 | DEBUG    | __main__:trials:24 - Trial = 29519/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.895 | DEBUG    | __main__:trials:29 - Trial = 29519/30000 | Total reward = 48.31
2022-01-26 14:18:49.898 | DEBUG    | __main__:trials:24 - Trial = 29520/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.898 | DEBUG    | __main__:trials:29 - Trial = 29520/30000 | Total reward = 48.48
2022-01-26 14:18:49.902 | DEBUG    | __main__:trials:24 - Trial = 29521/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.903 | DEBUG    | __main__:trials:29 - Trial = 29521/30000 | Total reward = 36.44
2022-01-26 14:18:49.906 | DEBUG    | __main__:trials:24 - Trial = 29522/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.907 | DEBUG    | __main__:trials:29 - Trial = 29522/30000 | Total reward = 36.80
2022-01-26 14:18:49.910 | DEBUG    | __main__:trials:24 - Trial = 29523/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.912 | DEBUG    | __main__:trials:29 - Trial = 29523/30000 | Total reward = 38.63
2022-01-26 14:18:49.916 | DEBUG    | __main__:trials:24 - Trial = 29524/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.916 | DEBUG    | __main__:trials:29 - Trial = 29524/30000 | Total reward = 32.59
2022-01-26 14:18:49.921 | DEBUG    | __main__:trials:24 - Trial = 29525/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.922 | DEBUG    | __main__:trials:29 - Trial = 29525/30000 | Total reward = 38.52
2022-01-26 14:18:49.926 | DEBUG    | __main__:trials:24 - Trial = 29526/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.927 | DEBUG    | __main__:trials:29 - Trial = 29526/30000 | Total reward = 38.96
2022-01-26 14:18:49.930 | DEBUG    | __main__:trials:24 - Trial = 29527/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.932 | DEBUG    | __main__:trials:29 - Trial = 29527/30000 | Total reward = 43.62
2022-01-26 14:18:49.936 | DEBUG    | __main__:trials:24 - Trial = 29528/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.937 | DEBUG    | __main__:trials:29 - Trial = 29528/30000 | Total reward = 37.22
2022-01-26 14:18:49.940 | DEBUG    | __main__:trials:24 - Trial = 29529/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.942 | DEBUG    | __main__:trials:29 - Trial = 29529/30000 | Total reward = 39.52
2022-01-26 14:18:49.945 | DEBUG    | __main__:trials:24 - Trial = 29530/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.947 | DEBUG    | __main__:trials:29 - Trial = 29530/30000 | Total reward = 38.43
2022-01-26 14:18:49.951 | DEBUG    | __main__:trials:24 - Trial = 29531/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.952 | DEBUG    | __main__:trials:29 - Trial = 29531/30000 | Total reward = 39.10
2022-01-26 14:18:49.956 | DEBUG    | __main__:trials:26 - Trial = 29532/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.957 | DEBUG    | __main__:trials:29 - Trial = 29532/30000 | Total reward = 31.59
2022-01-26 14:18:49.960 | DEBUG    | __main__:trials:26 - Trial = 29533/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:49.962 | DEBUG    | __main__:trials:29 - Trial = 29533/30000 | Total reward = 11.58
2022-01-26 14:18:49.965 | DEBUG    | __main__:trials:24 - Trial = 29534/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.966 | DEBUG    | __main__:trials:29 - Trial = 29534/30000 | Total reward = 34.29
2022-01-26 14:18:49.971 | DEBUG    | __main__:trials:24 - Trial = 29535/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.972 | DEBUG    | __main__:trials:29 - Trial = 29535/30000 | Total reward = 48.59
2022-01-26 14:18:49.976 | DEBUG    | __main__:trials:24 - Trial = 29536/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.977 | DEBUG    | __main__:trials:29 - Trial = 29536/30000 | Total reward = 38.31
2022-01-26 14:18:49.980 | DEBUG    | __main__:trials:24 - Trial = 29537/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.982 | DEBUG    | __main__:trials:29 - Trial = 29537/30000 | Total reward = 39.13
2022-01-26 14:18:49.985 | DEBUG    | __main__:trials:24 - Trial = 29538/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.986 | DEBUG    | __main__:trials:29 - Trial = 29538/30000 | Total reward = 39.06
2022-01-26 14:18:49.989 | DEBUG    | __main__:trials:24 - Trial = 29539/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.990 | DEBUG    | __main__:trials:29 - Trial = 29539/30000 | Total reward = 48.97
2022-01-26 14:18:49.994 | DEBUG    | __main__:trials:24 - Trial = 29540/30000 | Max number of steps (20) reached
2022-01-26 14:18:49.995 | DEBUG    | __main__:trials:29 - Trial = 29540/30000 | Total reward = 41.45
2022-01-26 14:18:49.998 | DEBUG    | __main__:trials:24 - Trial = 29541/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.000 | DEBUG    | __main__:trials:29 - Trial = 29541/30000 | Total reward = 34.91
2022-01-26 14:18:50.005 | DEBUG    | __main__:trials:24 - Trial = 29542/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.006 | DEBUG    | __main__:trials:29 - Trial = 29542/30000 | Total reward = 27.65
2022-01-26 14:18:50.010 | DEBUG    | __main__:trials:24 - Trial = 29543/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.011 | DEBUG    | __main__:trials:29 - Trial = 29543/30000 | Total reward = 29.76
2022-01-26 14:18:50.014 | DEBUG    | __main__:trials:24 - Trial = 29544/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.016 | DEBUG    | __main__:trials:29 - Trial = 29544/30000 | Total reward = 38.76
2022-01-26 14:18:50.019 | DEBUG    | __main__:trials:24 - Trial = 29545/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.021 | DEBUG    | __main__:trials:29 - Trial = 29545/30000 | Total reward = 38.90
2022-01-26 14:18:50.024 | DEBUG    | __main__:trials:26 - Trial = 29546/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.026 | DEBUG    | __main__:trials:29 - Trial = 29546/30000 | Total reward = 35.42
2022-01-26 14:18:50.029 | DEBUG    | __main__:trials:24 - Trial = 29547/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.031 | DEBUG    | __main__:trials:29 - Trial = 29547/30000 | Total reward = 22.73
2022-01-26 14:18:50.035 | DEBUG    | __main__:trials:24 - Trial = 29548/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.036 | DEBUG    | __main__:trials:29 - Trial = 29548/30000 | Total reward = 25.78
2022-01-26 14:18:50.039 | DEBUG    | __main__:trials:24 - Trial = 29549/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.041 | DEBUG    | __main__:trials:29 - Trial = 29549/30000 | Total reward = 34.20
2022-01-26 14:18:50.044 | DEBUG    | __main__:trials:24 - Trial = 29550/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.046 | DEBUG    | __main__:trials:29 - Trial = 29550/30000 | Total reward = 40.92
2022-01-26 14:18:50.049 | DEBUG    | __main__:trials:24 - Trial = 29551/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.051 | DEBUG    | __main__:trials:29 - Trial = 29551/30000 | Total reward = 38.70
2022-01-26 14:18:50.054 | DEBUG    | __main__:trials:24 - Trial = 29552/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.055 | DEBUG    | __main__:trials:29 - Trial = 29552/30000 | Total reward = 35.50
2022-01-26 14:18:50.060 | DEBUG    | __main__:trials:24 - Trial = 29553/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.060 | DEBUG    | __main__:trials:29 - Trial = 29553/30000 | Total reward = 25.06
2022-01-26 14:18:50.064 | DEBUG    | __main__:trials:24 - Trial = 29554/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.065 | DEBUG    | __main__:trials:29 - Trial = 29554/30000 | Total reward = 35.88
2022-01-26 14:18:50.070 | DEBUG    | __main__:trials:24 - Trial = 29555/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.070 | DEBUG    | __main__:trials:29 - Trial = 29555/30000 | Total reward = 24.41
2022-01-26 14:18:50.075 | DEBUG    | __main__:trials:24 - Trial = 29556/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.076 | DEBUG    | __main__:trials:29 - Trial = 29556/30000 | Total reward = 30.00
2022-01-26 14:18:50.080 | DEBUG    | __main__:trials:24 - Trial = 29557/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.082 | DEBUG    | __main__:trials:29 - Trial = 29557/30000 | Total reward = 37.55
2022-01-26 14:18:50.086 | DEBUG    | __main__:trials:24 - Trial = 29558/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.087 | DEBUG    | __main__:trials:29 - Trial = 29558/30000 | Total reward = 50.99
2022-01-26 14:18:50.090 | DEBUG    | __main__:trials:26 - Trial = 29559/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.092 | DEBUG    | __main__:trials:29 - Trial = 29559/30000 | Total reward = 19.88
2022-01-26 14:18:50.094 | DEBUG    | __main__:trials:26 - Trial = 29560/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.096 | DEBUG    | __main__:trials:29 - Trial = 29560/30000 | Total reward = 20.26
2022-01-26 14:18:50.100 | DEBUG    | __main__:trials:24 - Trial = 29561/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.101 | DEBUG    | __main__:trials:29 - Trial = 29561/30000 | Total reward = 41.64
2022-01-26 14:18:50.105 | DEBUG    | __main__:trials:24 - Trial = 29562/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.106 | DEBUG    | __main__:trials:29 - Trial = 29562/30000 | Total reward = 33.83
2022-01-26 14:18:50.109 | DEBUG    | __main__:trials:26 - Trial = 29563/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.111 | DEBUG    | __main__:trials:29 - Trial = 29563/30000 | Total reward = 19.52
2022-01-26 14:18:50.115 | DEBUG    | __main__:trials:24 - Trial = 29564/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.116 | DEBUG    | __main__:trials:29 - Trial = 29564/30000 | Total reward = 40.12
2022-01-26 14:18:50.120 | DEBUG    | __main__:trials:24 - Trial = 29565/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.121 | DEBUG    | __main__:trials:29 - Trial = 29565/30000 | Total reward = 38.13
2022-01-26 14:18:50.125 | DEBUG    | __main__:trials:24 - Trial = 29566/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.126 | DEBUG    | __main__:trials:29 - Trial = 29566/30000 | Total reward = 39.34
2022-01-26 14:18:50.130 | DEBUG    | __main__:trials:24 - Trial = 29567/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.132 | DEBUG    | __main__:trials:29 - Trial = 29567/30000 | Total reward = 33.76
2022-01-26 14:18:50.136 | DEBUG    | __main__:trials:24 - Trial = 29568/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.136 | DEBUG    | __main__:trials:29 - Trial = 29568/30000 | Total reward = 38.29
2022-01-26 14:18:50.140 | DEBUG    | __main__:trials:24 - Trial = 29569/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.141 | DEBUG    | __main__:trials:29 - Trial = 29569/30000 | Total reward = 40.19
2022-01-26 14:18:50.146 | DEBUG    | __main__:trials:24 - Trial = 29570/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.147 | DEBUG    | __main__:trials:29 - Trial = 29570/30000 | Total reward = 27.81
2022-01-26 14:18:50.150 | DEBUG    | __main__:trials:26 - Trial = 29571/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.152 | DEBUG    | __main__:trials:29 - Trial = 29571/30000 | Total reward = 15.71
2022-01-26 14:18:50.156 | DEBUG    | __main__:trials:24 - Trial = 29572/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.157 | DEBUG    | __main__:trials:29 - Trial = 29572/30000 | Total reward = 38.90
2022-01-26 14:18:50.161 | DEBUG    | __main__:trials:24 - Trial = 29573/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.163 | DEBUG    | __main__:trials:29 - Trial = 29573/30000 | Total reward = 38.60
2022-01-26 14:18:50.165 | DEBUG    | __main__:trials:26 - Trial = 29574/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.167 | DEBUG    | __main__:trials:29 - Trial = 29574/30000 | Total reward = 15.71
2022-01-26 14:18:50.170 | DEBUG    | __main__:trials:24 - Trial = 29575/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.171 | DEBUG    | __main__:trials:29 - Trial = 29575/30000 | Total reward = 37.74
2022-01-26 14:18:50.176 | DEBUG    | __main__:trials:24 - Trial = 29576/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.176 | DEBUG    | __main__:trials:29 - Trial = 29576/30000 | Total reward = 44.82
2022-01-26 14:18:50.181 | DEBUG    | __main__:trials:24 - Trial = 29577/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.183 | DEBUG    | __main__:trials:29 - Trial = 29577/30000 | Total reward = 32.24
2022-01-26 14:18:50.186 | DEBUG    | __main__:trials:24 - Trial = 29578/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.188 | DEBUG    | __main__:trials:29 - Trial = 29578/30000 | Total reward = 39.70
2022-01-26 14:18:50.191 | DEBUG    | __main__:trials:24 - Trial = 29579/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.193 | DEBUG    | __main__:trials:29 - Trial = 29579/30000 | Total reward = 36.98
2022-01-26 14:18:50.196 | DEBUG    | __main__:trials:24 - Trial = 29580/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.197 | DEBUG    | __main__:trials:29 - Trial = 29580/30000 | Total reward = 33.23
2022-01-26 14:18:50.200 | DEBUG    | __main__:trials:26 - Trial = 29581/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.202 | DEBUG    | __main__:trials:29 - Trial = 29581/30000 | Total reward = 16.40
2022-01-26 14:18:50.205 | DEBUG    | __main__:trials:24 - Trial = 29582/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.207 | DEBUG    | __main__:trials:29 - Trial = 29582/30000 | Total reward = 45.40
2022-01-26 14:18:50.210 | DEBUG    | __main__:trials:24 - Trial = 29583/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.211 | DEBUG    | __main__:trials:29 - Trial = 29583/30000 | Total reward = 38.90
2022-01-26 14:18:50.215 | DEBUG    | __main__:trials:26 - Trial = 29584/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.217 | DEBUG    | __main__:trials:29 - Trial = 29584/30000 | Total reward = 24.07
2022-01-26 14:18:50.221 | DEBUG    | __main__:trials:24 - Trial = 29585/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.221 | DEBUG    | __main__:trials:29 - Trial = 29585/30000 | Total reward = 32.24
2022-01-26 14:18:50.226 | DEBUG    | __main__:trials:24 - Trial = 29586/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.227 | DEBUG    | __main__:trials:29 - Trial = 29586/30000 | Total reward = 45.30
2022-01-26 14:18:50.230 | DEBUG    | __main__:trials:24 - Trial = 29587/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.232 | DEBUG    | __main__:trials:29 - Trial = 29587/30000 | Total reward = 39.02
2022-01-26 14:18:50.235 | DEBUG    | __main__:trials:24 - Trial = 29588/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.236 | DEBUG    | __main__:trials:29 - Trial = 29588/30000 | Total reward = 29.27
2022-01-26 14:18:50.240 | DEBUG    | __main__:trials:24 - Trial = 29589/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.241 | DEBUG    | __main__:trials:29 - Trial = 29589/30000 | Total reward = 38.89
2022-01-26 14:18:50.245 | DEBUG    | __main__:trials:24 - Trial = 29590/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.247 | DEBUG    | __main__:trials:29 - Trial = 29590/30000 | Total reward = 38.41
2022-01-26 14:18:50.251 | DEBUG    | __main__:trials:24 - Trial = 29591/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.251 | DEBUG    | __main__:trials:29 - Trial = 29591/30000 | Total reward = 46.70
2022-01-26 14:18:50.256 | DEBUG    | __main__:trials:24 - Trial = 29592/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.257 | DEBUG    | __main__:trials:29 - Trial = 29592/30000 | Total reward = 34.83
2022-01-26 14:18:50.261 | DEBUG    | __main__:trials:24 - Trial = 29593/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.262 | DEBUG    | __main__:trials:29 - Trial = 29593/30000 | Total reward = 39.26
2022-01-26 14:18:50.265 | DEBUG    | __main__:trials:26 - Trial = 29594/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.267 | DEBUG    | __main__:trials:29 - Trial = 29594/30000 | Total reward = 21.34
2022-01-26 14:18:50.271 | DEBUG    | __main__:trials:24 - Trial = 29595/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.272 | DEBUG    | __main__:trials:29 - Trial = 29595/30000 | Total reward = 38.72
2022-01-26 14:18:50.276 | DEBUG    | __main__:trials:24 - Trial = 29596/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.277 | DEBUG    | __main__:trials:29 - Trial = 29596/30000 | Total reward = 44.36
2022-01-26 14:18:50.281 | DEBUG    | __main__:trials:26 - Trial = 29597/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.282 | DEBUG    | __main__:trials:29 - Trial = 29597/30000 | Total reward = 20.07
2022-01-26 14:18:50.285 | DEBUG    | __main__:trials:24 - Trial = 29598/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.286 | DEBUG    | __main__:trials:29 - Trial = 29598/30000 | Total reward = 38.90
2022-01-26 14:18:50.290 | DEBUG    | __main__:trials:24 - Trial = 29599/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.292 | DEBUG    | __main__:trials:29 - Trial = 29599/30000 | Total reward = 49.28
2022-01-26 14:18:50.296 | DEBUG    | __main__:trials:24 - Trial = 29600/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.297 | DEBUG    | __main__:trials:29 - Trial = 29600/30000 | Total reward = 37.12
2022-01-26 14:18:50.300 | DEBUG    | __main__:trials:24 - Trial = 29601/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.303 | DEBUG    | __main__:trials:29 - Trial = 29601/30000 | Total reward = 44.01
2022-01-26 14:18:50.306 | DEBUG    | __main__:trials:24 - Trial = 29602/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.308 | DEBUG    | __main__:trials:29 - Trial = 29602/30000 | Total reward = 47.08
2022-01-26 14:18:50.312 | DEBUG    | __main__:trials:24 - Trial = 29603/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.314 | DEBUG    | __main__:trials:29 - Trial = 29603/30000 | Total reward = 49.53
2022-01-26 14:18:50.317 | DEBUG    | __main__:trials:24 - Trial = 29604/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.320 | DEBUG    | __main__:trials:29 - Trial = 29604/30000 | Total reward = 41.61
2022-01-26 14:18:50.324 | DEBUG    | __main__:trials:24 - Trial = 29605/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.325 | DEBUG    | __main__:trials:29 - Trial = 29605/30000 | Total reward = 38.90
2022-01-26 14:18:50.329 | DEBUG    | __main__:trials:24 - Trial = 29606/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.330 | DEBUG    | __main__:trials:29 - Trial = 29606/30000 | Total reward = 32.38
2022-01-26 14:18:50.333 | DEBUG    | __main__:trials:24 - Trial = 29607/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.335 | DEBUG    | __main__:trials:29 - Trial = 29607/30000 | Total reward = 49.53
2022-01-26 14:18:50.337 | DEBUG    | __main__:trials:26 - Trial = 29608/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.338 | DEBUG    | __main__:trials:29 - Trial = 29608/30000 | Total reward = 15.30
2022-01-26 14:18:50.342 | DEBUG    | __main__:trials:24 - Trial = 29609/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.343 | DEBUG    | __main__:trials:29 - Trial = 29609/30000 | Total reward = 39.44
2022-01-26 14:18:50.346 | DEBUG    | __main__:trials:24 - Trial = 29610/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.348 | DEBUG    | __main__:trials:29 - Trial = 29610/30000 | Total reward = 43.97
2022-01-26 14:18:50.352 | DEBUG    | __main__:trials:24 - Trial = 29611/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.353 | DEBUG    | __main__:trials:29 - Trial = 29611/30000 | Total reward = 38.60
2022-01-26 14:18:50.357 | DEBUG    | __main__:trials:24 - Trial = 29612/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.359 | DEBUG    | __main__:trials:29 - Trial = 29612/30000 | Total reward = 35.38
2022-01-26 14:18:50.362 | DEBUG    | __main__:trials:24 - Trial = 29613/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.364 | DEBUG    | __main__:trials:29 - Trial = 29613/30000 | Total reward = 40.82
2022-01-26 14:18:50.368 | DEBUG    | __main__:trials:24 - Trial = 29614/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.370 | DEBUG    | __main__:trials:29 - Trial = 29614/30000 | Total reward = 37.67
2022-01-26 14:18:50.373 | DEBUG    | __main__:trials:24 - Trial = 29615/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.375 | DEBUG    | __main__:trials:29 - Trial = 29615/30000 | Total reward = 25.13
2022-01-26 14:18:50.377 | DEBUG    | __main__:trials:26 - Trial = 29616/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.379 | DEBUG    | __main__:trials:29 - Trial = 29616/30000 | Total reward = 6.44
2022-01-26 14:18:50.382 | DEBUG    | __main__:trials:24 - Trial = 29617/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.384 | DEBUG    | __main__:trials:29 - Trial = 29617/30000 | Total reward = 41.03
2022-01-26 14:18:50.387 | DEBUG    | __main__:trials:24 - Trial = 29618/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.389 | DEBUG    | __main__:trials:29 - Trial = 29618/30000 | Total reward = 44.11
2022-01-26 14:18:50.392 | DEBUG    | __main__:trials:26 - Trial = 29619/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.393 | DEBUG    | __main__:trials:29 - Trial = 29619/30000 | Total reward = 11.75
2022-01-26 14:18:50.396 | DEBUG    | __main__:trials:26 - Trial = 29620/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.398 | DEBUG    | __main__:trials:29 - Trial = 29620/30000 | Total reward = 9.72
2022-01-26 14:18:50.402 | DEBUG    | __main__:trials:24 - Trial = 29621/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.403 | DEBUG    | __main__:trials:29 - Trial = 29621/30000 | Total reward = 38.71
2022-01-26 14:18:50.406 | DEBUG    | __main__:trials:24 - Trial = 29622/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.408 | DEBUG    | __main__:trials:29 - Trial = 29622/30000 | Total reward = 21.57
2022-01-26 14:18:50.411 | DEBUG    | __main__:trials:24 - Trial = 29623/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.413 | DEBUG    | __main__:trials:29 - Trial = 29623/30000 | Total reward = 34.63
2022-01-26 14:18:50.416 | DEBUG    | __main__:trials:26 - Trial = 29624/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.417 | DEBUG    | __main__:trials:29 - Trial = 29624/30000 | Total reward = 15.71
2022-01-26 14:18:50.420 | DEBUG    | __main__:trials:24 - Trial = 29625/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.421 | DEBUG    | __main__:trials:29 - Trial = 29625/30000 | Total reward = 39.61
2022-01-26 14:18:50.425 | DEBUG    | __main__:trials:24 - Trial = 29626/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.426 | DEBUG    | __main__:trials:29 - Trial = 29626/30000 | Total reward = 38.54
2022-01-26 14:18:50.430 | DEBUG    | __main__:trials:24 - Trial = 29627/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.431 | DEBUG    | __main__:trials:29 - Trial = 29627/30000 | Total reward = 38.79
2022-01-26 14:18:50.435 | DEBUG    | __main__:trials:24 - Trial = 29628/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.437 | DEBUG    | __main__:trials:29 - Trial = 29628/30000 | Total reward = 44.66
2022-01-26 14:18:50.440 | DEBUG    | __main__:trials:24 - Trial = 29629/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.442 | DEBUG    | __main__:trials:29 - Trial = 29629/30000 | Total reward = 32.99
2022-01-26 14:18:50.445 | DEBUG    | __main__:trials:26 - Trial = 29630/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.447 | DEBUG    | __main__:trials:29 - Trial = 29630/30000 | Total reward = 24.22
2022-01-26 14:18:50.450 | DEBUG    | __main__:trials:24 - Trial = 29631/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.452 | DEBUG    | __main__:trials:29 - Trial = 29631/30000 | Total reward = 36.72
2022-01-26 14:18:50.455 | DEBUG    | __main__:trials:24 - Trial = 29632/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.456 | DEBUG    | __main__:trials:29 - Trial = 29632/30000 | Total reward = 40.68
2022-01-26 14:18:50.460 | DEBUG    | __main__:trials:24 - Trial = 29633/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.462 | DEBUG    | __main__:trials:29 - Trial = 29633/30000 | Total reward = 39.01
2022-01-26 14:18:50.465 | DEBUG    | __main__:trials:24 - Trial = 29634/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.467 | DEBUG    | __main__:trials:29 - Trial = 29634/30000 | Total reward = 39.10
2022-01-26 14:18:50.471 | DEBUG    | __main__:trials:24 - Trial = 29635/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.472 | DEBUG    | __main__:trials:29 - Trial = 29635/30000 | Total reward = 39.52
2022-01-26 14:18:50.476 | DEBUG    | __main__:trials:24 - Trial = 29636/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.477 | DEBUG    | __main__:trials:29 - Trial = 29636/30000 | Total reward = 31.41
2022-01-26 14:18:50.480 | DEBUG    | __main__:trials:24 - Trial = 29637/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.482 | DEBUG    | __main__:trials:29 - Trial = 29637/30000 | Total reward = 30.45
2022-01-26 14:18:50.486 | DEBUG    | __main__:trials:24 - Trial = 29638/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.487 | DEBUG    | __main__:trials:29 - Trial = 29638/30000 | Total reward = 36.31
2022-01-26 14:18:50.491 | DEBUG    | __main__:trials:24 - Trial = 29639/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.493 | DEBUG    | __main__:trials:29 - Trial = 29639/30000 | Total reward = 41.01
2022-01-26 14:18:50.496 | DEBUG    | __main__:trials:24 - Trial = 29640/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.497 | DEBUG    | __main__:trials:29 - Trial = 29640/30000 | Total reward = 30.45
2022-01-26 14:18:50.501 | DEBUG    | __main__:trials:24 - Trial = 29641/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.503 | DEBUG    | __main__:trials:29 - Trial = 29641/30000 | Total reward = 45.96
2022-01-26 14:18:50.506 | DEBUG    | __main__:trials:24 - Trial = 29642/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.508 | DEBUG    | __main__:trials:29 - Trial = 29642/30000 | Total reward = 37.43
2022-01-26 14:18:50.512 | DEBUG    | __main__:trials:24 - Trial = 29643/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.513 | DEBUG    | __main__:trials:29 - Trial = 29643/30000 | Total reward = 38.65
2022-01-26 14:18:50.516 | DEBUG    | __main__:trials:24 - Trial = 29644/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.518 | DEBUG    | __main__:trials:29 - Trial = 29644/30000 | Total reward = 39.15
2022-01-26 14:18:50.522 | DEBUG    | __main__:trials:26 - Trial = 29645/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.523 | DEBUG    | __main__:trials:29 - Trial = 29645/30000 | Total reward = 30.32
2022-01-26 14:18:50.526 | DEBUG    | __main__:trials:24 - Trial = 29646/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.529 | DEBUG    | __main__:trials:29 - Trial = 29646/30000 | Total reward = 33.85
2022-01-26 14:18:50.533 | DEBUG    | __main__:trials:24 - Trial = 29647/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.533 | DEBUG    | __main__:trials:29 - Trial = 29647/30000 | Total reward = 27.72
2022-01-26 14:18:50.536 | DEBUG    | __main__:trials:24 - Trial = 29648/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.538 | DEBUG    | __main__:trials:29 - Trial = 29648/30000 | Total reward = 39.14
2022-01-26 14:18:50.541 | DEBUG    | __main__:trials:24 - Trial = 29649/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.542 | DEBUG    | __main__:trials:29 - Trial = 29649/30000 | Total reward = 38.52
2022-01-26 14:18:50.545 | DEBUG    | __main__:trials:24 - Trial = 29650/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.546 | DEBUG    | __main__:trials:29 - Trial = 29650/30000 | Total reward = 30.98
2022-01-26 14:18:50.549 | DEBUG    | __main__:trials:24 - Trial = 29651/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.550 | DEBUG    | __main__:trials:29 - Trial = 29651/30000 | Total reward = 39.88
2022-01-26 14:18:50.553 | DEBUG    | __main__:trials:26 - Trial = 29652/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.554 | DEBUG    | __main__:trials:29 - Trial = 29652/30000 | Total reward = 29.88
2022-01-26 14:18:50.558 | DEBUG    | __main__:trials:24 - Trial = 29653/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.559 | DEBUG    | __main__:trials:29 - Trial = 29653/30000 | Total reward = 38.90
2022-01-26 14:18:50.563 | DEBUG    | __main__:trials:24 - Trial = 29654/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.564 | DEBUG    | __main__:trials:29 - Trial = 29654/30000 | Total reward = 38.53
2022-01-26 14:18:50.568 | DEBUG    | __main__:trials:24 - Trial = 29655/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.570 | DEBUG    | __main__:trials:29 - Trial = 29655/30000 | Total reward = 39.02
2022-01-26 14:18:50.573 | DEBUG    | __main__:trials:24 - Trial = 29656/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.575 | DEBUG    | __main__:trials:29 - Trial = 29656/30000 | Total reward = 35.64
2022-01-26 14:18:50.578 | DEBUG    | __main__:trials:24 - Trial = 29657/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.580 | DEBUG    | __main__:trials:29 - Trial = 29657/30000 | Total reward = 38.21
2022-01-26 14:18:50.584 | DEBUG    | __main__:trials:24 - Trial = 29658/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.585 | DEBUG    | __main__:trials:29 - Trial = 29658/30000 | Total reward = 35.37
2022-01-26 14:18:50.589 | DEBUG    | __main__:trials:24 - Trial = 29659/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.591 | DEBUG    | __main__:trials:29 - Trial = 29659/30000 | Total reward = 56.89
2022-01-26 14:18:50.594 | DEBUG    | __main__:trials:26 - Trial = 29660/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.596 | DEBUG    | __main__:trials:29 - Trial = 29660/30000 | Total reward = 12.19
2022-01-26 14:18:50.598 | DEBUG    | __main__:trials:26 - Trial = 29661/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.600 | DEBUG    | __main__:trials:29 - Trial = 29661/30000 | Total reward = 15.71
2022-01-26 14:18:50.603 | DEBUG    | __main__:trials:24 - Trial = 29662/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.605 | DEBUG    | __main__:trials:29 - Trial = 29662/30000 | Total reward = 37.73
2022-01-26 14:18:50.608 | DEBUG    | __main__:trials:24 - Trial = 29663/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.610 | DEBUG    | __main__:trials:29 - Trial = 29663/30000 | Total reward = 45.75
2022-01-26 14:18:50.614 | DEBUG    | __main__:trials:24 - Trial = 29664/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.615 | DEBUG    | __main__:trials:29 - Trial = 29664/30000 | Total reward = 42.73
2022-01-26 14:18:50.619 | DEBUG    | __main__:trials:24 - Trial = 29665/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.621 | DEBUG    | __main__:trials:29 - Trial = 29665/30000 | Total reward = 44.25
2022-01-26 14:18:50.624 | DEBUG    | __main__:trials:24 - Trial = 29666/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.626 | DEBUG    | __main__:trials:29 - Trial = 29666/30000 | Total reward = 31.43
2022-01-26 14:18:50.630 | DEBUG    | __main__:trials:24 - Trial = 29667/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.631 | DEBUG    | __main__:trials:29 - Trial = 29667/30000 | Total reward = 39.51
2022-01-26 14:18:50.634 | DEBUG    | __main__:trials:24 - Trial = 29668/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.636 | DEBUG    | __main__:trials:29 - Trial = 29668/30000 | Total reward = 38.12
2022-01-26 14:18:50.640 | DEBUG    | __main__:trials:24 - Trial = 29669/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.641 | DEBUG    | __main__:trials:29 - Trial = 29669/30000 | Total reward = 31.98
2022-01-26 14:18:50.645 | DEBUG    | __main__:trials:24 - Trial = 29670/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.647 | DEBUG    | __main__:trials:29 - Trial = 29670/30000 | Total reward = 38.94
2022-01-26 14:18:50.650 | DEBUG    | __main__:trials:24 - Trial = 29671/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.652 | DEBUG    | __main__:trials:29 - Trial = 29671/30000 | Total reward = 20.58
2022-01-26 14:18:50.655 | DEBUG    | __main__:trials:24 - Trial = 29672/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.657 | DEBUG    | __main__:trials:29 - Trial = 29672/30000 | Total reward = 29.29
2022-01-26 14:18:50.660 | DEBUG    | __main__:trials:24 - Trial = 29673/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.662 | DEBUG    | __main__:trials:29 - Trial = 29673/30000 | Total reward = 38.73
2022-01-26 14:18:50.665 | DEBUG    | __main__:trials:24 - Trial = 29674/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.667 | DEBUG    | __main__:trials:29 - Trial = 29674/30000 | Total reward = 36.15
2022-01-26 14:18:50.670 | DEBUG    | __main__:trials:24 - Trial = 29675/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.671 | DEBUG    | __main__:trials:29 - Trial = 29675/30000 | Total reward = 39.88
2022-01-26 14:18:50.675 | DEBUG    | __main__:trials:24 - Trial = 29676/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.677 | DEBUG    | __main__:trials:29 - Trial = 29676/30000 | Total reward = 38.57
2022-01-26 14:18:50.680 | DEBUG    | __main__:trials:24 - Trial = 29677/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.682 | DEBUG    | __main__:trials:29 - Trial = 29677/30000 | Total reward = 30.79
2022-01-26 14:18:50.685 | DEBUG    | __main__:trials:24 - Trial = 29678/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.687 | DEBUG    | __main__:trials:29 - Trial = 29678/30000 | Total reward = 50.70
2022-01-26 14:18:50.691 | DEBUG    | __main__:trials:24 - Trial = 29679/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.692 | DEBUG    | __main__:trials:29 - Trial = 29679/30000 | Total reward = 41.28
2022-01-26 14:18:50.696 | DEBUG    | __main__:trials:24 - Trial = 29680/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.697 | DEBUG    | __main__:trials:29 - Trial = 29680/30000 | Total reward = 39.51
2022-01-26 14:18:50.701 | DEBUG    | __main__:trials:24 - Trial = 29681/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.702 | DEBUG    | __main__:trials:29 - Trial = 29681/30000 | Total reward = 39.61
2022-01-26 14:18:50.705 | DEBUG    | __main__:trials:26 - Trial = 29682/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.706 | DEBUG    | __main__:trials:29 - Trial = 29682/30000 | Total reward = 13.39
2022-01-26 14:18:50.709 | DEBUG    | __main__:trials:24 - Trial = 29683/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.710 | DEBUG    | __main__:trials:29 - Trial = 29683/30000 | Total reward = 36.54
2022-01-26 14:18:50.714 | DEBUG    | __main__:trials:24 - Trial = 29684/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.716 | DEBUG    | __main__:trials:29 - Trial = 29684/30000 | Total reward = 38.90
2022-01-26 14:18:50.720 | DEBUG    | __main__:trials:24 - Trial = 29685/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.722 | DEBUG    | __main__:trials:29 - Trial = 29685/30000 | Total reward = 38.48
2022-01-26 14:18:50.725 | DEBUG    | __main__:trials:24 - Trial = 29686/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.727 | DEBUG    | __main__:trials:29 - Trial = 29686/30000 | Total reward = 35.36
2022-01-26 14:18:50.731 | DEBUG    | __main__:trials:24 - Trial = 29687/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.732 | DEBUG    | __main__:trials:29 - Trial = 29687/30000 | Total reward = 41.66
2022-01-26 14:18:50.735 | DEBUG    | __main__:trials:24 - Trial = 29688/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.737 | DEBUG    | __main__:trials:29 - Trial = 29688/30000 | Total reward = 39.01
2022-01-26 14:18:50.740 | DEBUG    | __main__:trials:24 - Trial = 29689/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.742 | DEBUG    | __main__:trials:29 - Trial = 29689/30000 | Total reward = 37.66
2022-01-26 14:18:50.746 | DEBUG    | __main__:trials:24 - Trial = 29690/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.747 | DEBUG    | __main__:trials:29 - Trial = 29690/30000 | Total reward = 36.10
2022-01-26 14:18:50.751 | DEBUG    | __main__:trials:24 - Trial = 29691/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.753 | DEBUG    | __main__:trials:29 - Trial = 29691/30000 | Total reward = 39.87
2022-01-26 14:18:50.756 | DEBUG    | __main__:trials:24 - Trial = 29692/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.758 | DEBUG    | __main__:trials:29 - Trial = 29692/30000 | Total reward = 38.90
2022-01-26 14:18:50.762 | DEBUG    | __main__:trials:26 - Trial = 29693/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.763 | DEBUG    | __main__:trials:29 - Trial = 29693/30000 | Total reward = 26.56
2022-01-26 14:18:50.767 | DEBUG    | __main__:trials:24 - Trial = 29694/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.769 | DEBUG    | __main__:trials:29 - Trial = 29694/30000 | Total reward = 18.40
2022-01-26 14:18:50.772 | DEBUG    | __main__:trials:24 - Trial = 29695/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.774 | DEBUG    | __main__:trials:29 - Trial = 29695/30000 | Total reward = 36.74
2022-01-26 14:18:50.778 | DEBUG    | __main__:trials:24 - Trial = 29696/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.779 | DEBUG    | __main__:trials:29 - Trial = 29696/30000 | Total reward = 36.09
2022-01-26 14:18:50.783 | DEBUG    | __main__:trials:24 - Trial = 29697/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.785 | DEBUG    | __main__:trials:29 - Trial = 29697/30000 | Total reward = 26.04
2022-01-26 14:18:50.787 | DEBUG    | __main__:trials:26 - Trial = 29698/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.789 | DEBUG    | __main__:trials:29 - Trial = 29698/30000 | Total reward = 14.18
2022-01-26 14:18:50.790 | DEBUG    | __main__:trials:26 - Trial = 29699/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.792 | DEBUG    | __main__:trials:29 - Trial = 29699/30000 | Total reward = 11.06
2022-01-26 14:18:50.795 | DEBUG    | __main__:trials:26 - Trial = 29700/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.797 | DEBUG    | __main__:trials:29 - Trial = 29700/30000 | Total reward = 13.08
2022-01-26 14:18:50.799 | DEBUG    | __main__:trials:26 - Trial = 29701/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.801 | DEBUG    | __main__:trials:29 - Trial = 29701/30000 | Total reward = 12.92
2022-01-26 14:18:50.804 | DEBUG    | __main__:trials:24 - Trial = 29702/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.806 | DEBUG    | __main__:trials:29 - Trial = 29702/30000 | Total reward = 32.32
2022-01-26 14:18:50.809 | DEBUG    | __main__:trials:26 - Trial = 29703/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.811 | DEBUG    | __main__:trials:29 - Trial = 29703/30000 | Total reward = 12.08
2022-01-26 14:18:50.813 | DEBUG    | __main__:trials:26 - Trial = 29704/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.815 | DEBUG    | __main__:trials:29 - Trial = 29704/30000 | Total reward = 13.08
2022-01-26 14:18:50.818 | DEBUG    | __main__:trials:26 - Trial = 29705/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.820 | DEBUG    | __main__:trials:29 - Trial = 29705/30000 | Total reward = 29.50
2022-01-26 14:18:50.822 | DEBUG    | __main__:trials:26 - Trial = 29706/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.823 | DEBUG    | __main__:trials:29 - Trial = 29706/30000 | Total reward = 11.06
2022-01-26 14:18:50.828 | DEBUG    | __main__:trials:24 - Trial = 29707/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.830 | DEBUG    | __main__:trials:29 - Trial = 29707/30000 | Total reward = 52.67
2022-01-26 14:18:50.832 | DEBUG    | __main__:trials:26 - Trial = 29708/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.834 | DEBUG    | __main__:trials:29 - Trial = 29708/30000 | Total reward = 11.06
2022-01-26 14:18:50.837 | DEBUG    | __main__:trials:26 - Trial = 29709/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.839 | DEBUG    | __main__:trials:29 - Trial = 29709/30000 | Total reward = 16.54
2022-01-26 14:18:50.842 | DEBUG    | __main__:trials:24 - Trial = 29710/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.844 | DEBUG    | __main__:trials:29 - Trial = 29710/30000 | Total reward = 38.61
2022-01-26 14:18:50.848 | DEBUG    | __main__:trials:24 - Trial = 29711/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.850 | DEBUG    | __main__:trials:29 - Trial = 29711/30000 | Total reward = 58.72
2022-01-26 14:18:50.853 | DEBUG    | __main__:trials:24 - Trial = 29712/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.855 | DEBUG    | __main__:trials:29 - Trial = 29712/30000 | Total reward = 43.62
2022-01-26 14:18:50.857 | DEBUG    | __main__:trials:26 - Trial = 29713/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.859 | DEBUG    | __main__:trials:29 - Trial = 29713/30000 | Total reward = 11.06
2022-01-26 14:18:50.863 | DEBUG    | __main__:trials:24 - Trial = 29714/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.864 | DEBUG    | __main__:trials:29 - Trial = 29714/30000 | Total reward = 39.21
2022-01-26 14:18:50.867 | DEBUG    | __main__:trials:26 - Trial = 29715/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.869 | DEBUG    | __main__:trials:29 - Trial = 29715/30000 | Total reward = 12.64
2022-01-26 14:18:50.871 | DEBUG    | __main__:trials:26 - Trial = 29716/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.873 | DEBUG    | __main__:trials:29 - Trial = 29716/30000 | Total reward = 15.28
2022-01-26 14:18:50.876 | DEBUG    | __main__:trials:26 - Trial = 29717/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.877 | DEBUG    | __main__:trials:29 - Trial = 29717/30000 | Total reward = 9.03
2022-01-26 14:18:50.880 | DEBUG    | __main__:trials:26 - Trial = 29718/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.881 | DEBUG    | __main__:trials:29 - Trial = 29718/30000 | Total reward = 11.96
2022-01-26 14:18:50.883 | DEBUG    | __main__:trials:26 - Trial = 29719/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.885 | DEBUG    | __main__:trials:29 - Trial = 29719/30000 | Total reward = 14.73
2022-01-26 14:18:50.888 | DEBUG    | __main__:trials:24 - Trial = 29720/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.890 | DEBUG    | __main__:trials:29 - Trial = 29720/30000 | Total reward = 51.21
2022-01-26 14:18:50.893 | DEBUG    | __main__:trials:26 - Trial = 29721/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.894 | DEBUG    | __main__:trials:29 - Trial = 29721/30000 | Total reward = 11.06
2022-01-26 14:18:50.897 | DEBUG    | __main__:trials:24 - Trial = 29722/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.898 | DEBUG    | __main__:trials:29 - Trial = 29722/30000 | Total reward = 50.83
2022-01-26 14:18:50.901 | DEBUG    | __main__:trials:24 - Trial = 29723/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.903 | DEBUG    | __main__:trials:29 - Trial = 29723/30000 | Total reward = 31.87
2022-01-26 14:18:50.906 | DEBUG    | __main__:trials:24 - Trial = 29724/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.907 | DEBUG    | __main__:trials:29 - Trial = 29724/30000 | Total reward = 38.82
2022-01-26 14:18:50.909 | DEBUG    | __main__:trials:26 - Trial = 29725/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.911 | DEBUG    | __main__:trials:29 - Trial = 29725/30000 | Total reward = 10.04
2022-01-26 14:18:50.914 | DEBUG    | __main__:trials:24 - Trial = 29726/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.915 | DEBUG    | __main__:trials:29 - Trial = 29726/30000 | Total reward = 41.62
2022-01-26 14:18:50.918 | DEBUG    | __main__:trials:26 - Trial = 29727/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.919 | DEBUG    | __main__:trials:29 - Trial = 29727/30000 | Total reward = 11.06
2022-01-26 14:18:50.922 | DEBUG    | __main__:trials:26 - Trial = 29728/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.922 | DEBUG    | __main__:trials:29 - Trial = 29728/30000 | Total reward = 11.06
2022-01-26 14:18:50.926 | DEBUG    | __main__:trials:26 - Trial = 29729/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.927 | DEBUG    | __main__:trials:29 - Trial = 29729/30000 | Total reward = 22.94
2022-01-26 14:18:50.931 | DEBUG    | __main__:trials:24 - Trial = 29730/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.932 | DEBUG    | __main__:trials:29 - Trial = 29730/30000 | Total reward = 42.27
2022-01-26 14:18:50.936 | DEBUG    | __main__:trials:24 - Trial = 29731/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.938 | DEBUG    | __main__:trials:29 - Trial = 29731/30000 | Total reward = 32.44
2022-01-26 14:18:50.941 | DEBUG    | __main__:trials:26 - Trial = 29732/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.942 | DEBUG    | __main__:trials:29 - Trial = 29732/30000 | Total reward = 11.06
2022-01-26 14:18:50.946 | DEBUG    | __main__:trials:24 - Trial = 29733/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.947 | DEBUG    | __main__:trials:29 - Trial = 29733/30000 | Total reward = 24.78
2022-01-26 14:18:50.950 | DEBUG    | __main__:trials:26 - Trial = 29734/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.952 | DEBUG    | __main__:trials:29 - Trial = 29734/30000 | Total reward = 11.28
2022-01-26 14:18:50.954 | DEBUG    | __main__:trials:26 - Trial = 29735/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.956 | DEBUG    | __main__:trials:29 - Trial = 29735/30000 | Total reward = 11.55
2022-01-26 14:18:50.960 | DEBUG    | __main__:trials:24 - Trial = 29736/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.961 | DEBUG    | __main__:trials:29 - Trial = 29736/30000 | Total reward = 38.85
2022-01-26 14:18:50.964 | DEBUG    | __main__:trials:26 - Trial = 29737/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.966 | DEBUG    | __main__:trials:29 - Trial = 29737/30000 | Total reward = 9.92
2022-01-26 14:18:50.969 | DEBUG    | __main__:trials:26 - Trial = 29738/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.970 | DEBUG    | __main__:trials:29 - Trial = 29738/30000 | Total reward = 31.21
2022-01-26 14:18:50.974 | DEBUG    | __main__:trials:24 - Trial = 29739/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.976 | DEBUG    | __main__:trials:29 - Trial = 29739/30000 | Total reward = 40.22
2022-01-26 14:18:50.979 | DEBUG    | __main__:trials:24 - Trial = 29740/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.981 | DEBUG    | __main__:trials:29 - Trial = 29740/30000 | Total reward = 39.39
2022-01-26 14:18:50.984 | DEBUG    | __main__:trials:26 - Trial = 29741/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.985 | DEBUG    | __main__:trials:29 - Trial = 29741/30000 | Total reward = 23.10
2022-01-26 14:18:50.988 | DEBUG    | __main__:trials:26 - Trial = 29742/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.990 | DEBUG    | __main__:trials:29 - Trial = 29742/30000 | Total reward = 6.81
2022-01-26 14:18:50.993 | DEBUG    | __main__:trials:24 - Trial = 29743/30000 | Max number of steps (20) reached
2022-01-26 14:18:50.995 | DEBUG    | __main__:trials:29 - Trial = 29743/30000 | Total reward = 44.35
2022-01-26 14:18:50.997 | DEBUG    | __main__:trials:26 - Trial = 29744/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:50.999 | DEBUG    | __main__:trials:29 - Trial = 29744/30000 | Total reward = 13.22
2022-01-26 14:18:51.002 | DEBUG    | __main__:trials:26 - Trial = 29745/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.003 | DEBUG    | __main__:trials:29 - Trial = 29745/30000 | Total reward = 12.57
2022-01-26 14:18:51.006 | DEBUG    | __main__:trials:26 - Trial = 29746/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.007 | DEBUG    | __main__:trials:29 - Trial = 29746/30000 | Total reward = 10.11
2022-01-26 14:18:51.010 | DEBUG    | __main__:trials:24 - Trial = 29747/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.012 | DEBUG    | __main__:trials:29 - Trial = 29747/30000 | Total reward = 26.37
2022-01-26 14:18:51.016 | DEBUG    | __main__:trials:24 - Trial = 29748/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.018 | DEBUG    | __main__:trials:29 - Trial = 29748/30000 | Total reward = 48.99
2022-01-26 14:18:51.020 | DEBUG    | __main__:trials:26 - Trial = 29749/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.022 | DEBUG    | __main__:trials:29 - Trial = 29749/30000 | Total reward = 10.11
2022-01-26 14:18:51.024 | DEBUG    | __main__:trials:26 - Trial = 29750/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.026 | DEBUG    | __main__:trials:29 - Trial = 29750/30000 | Total reward = 11.18
2022-01-26 14:18:51.029 | DEBUG    | __main__:trials:26 - Trial = 29751/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.031 | DEBUG    | __main__:trials:29 - Trial = 29751/30000 | Total reward = 9.91
2022-01-26 14:18:51.032 | DEBUG    | __main__:trials:26 - Trial = 29752/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.034 | DEBUG    | __main__:trials:29 - Trial = 29752/30000 | Total reward = 11.50
2022-01-26 14:18:51.038 | DEBUG    | __main__:trials:24 - Trial = 29753/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.039 | DEBUG    | __main__:trials:29 - Trial = 29753/30000 | Total reward = 26.56
2022-01-26 14:18:51.041 | DEBUG    | __main__:trials:26 - Trial = 29754/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.042 | DEBUG    | __main__:trials:29 - Trial = 29754/30000 | Total reward = 10.11
2022-01-26 14:18:51.044 | DEBUG    | __main__:trials:26 - Trial = 29755/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.045 | DEBUG    | __main__:trials:29 - Trial = 29755/30000 | Total reward = 7.43
2022-01-26 14:18:51.048 | DEBUG    | __main__:trials:26 - Trial = 29756/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.050 | DEBUG    | __main__:trials:29 - Trial = 29756/30000 | Total reward = 12.75
2022-01-26 14:18:51.052 | DEBUG    | __main__:trials:26 - Trial = 29757/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.053 | DEBUG    | __main__:trials:29 - Trial = 29757/30000 | Total reward = 10.11
2022-01-26 14:18:51.055 | DEBUG    | __main__:trials:26 - Trial = 29758/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.057 | DEBUG    | __main__:trials:29 - Trial = 29758/30000 | Total reward = 10.11
2022-01-26 14:18:51.060 | DEBUG    | __main__:trials:24 - Trial = 29759/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.061 | DEBUG    | __main__:trials:29 - Trial = 29759/30000 | Total reward = 36.73
2022-01-26 14:18:51.064 | DEBUG    | __main__:trials:24 - Trial = 29760/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.065 | DEBUG    | __main__:trials:29 - Trial = 29760/30000 | Total reward = 53.54
2022-01-26 14:18:51.067 | DEBUG    | __main__:trials:26 - Trial = 29761/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.068 | DEBUG    | __main__:trials:29 - Trial = 29761/30000 | Total reward = 6.81
2022-01-26 14:18:51.070 | DEBUG    | __main__:trials:26 - Trial = 29762/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.071 | DEBUG    | __main__:trials:29 - Trial = 29762/30000 | Total reward = 10.97
2022-01-26 14:18:51.074 | DEBUG    | __main__:trials:24 - Trial = 29763/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.075 | DEBUG    | __main__:trials:29 - Trial = 29763/30000 | Total reward = 45.69
2022-01-26 14:18:51.079 | DEBUG    | __main__:trials:26 - Trial = 29764/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.080 | DEBUG    | __main__:trials:29 - Trial = 29764/30000 | Total reward = 37.91
2022-01-26 14:18:51.083 | DEBUG    | __main__:trials:26 - Trial = 29765/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.084 | DEBUG    | __main__:trials:29 - Trial = 29765/30000 | Total reward = 10.68
2022-01-26 14:18:51.086 | DEBUG    | __main__:trials:26 - Trial = 29766/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.086 | DEBUG    | __main__:trials:29 - Trial = 29766/30000 | Total reward = 12.64
2022-01-26 14:18:51.089 | DEBUG    | __main__:trials:26 - Trial = 29767/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.090 | DEBUG    | __main__:trials:29 - Trial = 29767/30000 | Total reward = 10.11
2022-01-26 14:18:51.093 | DEBUG    | __main__:trials:26 - Trial = 29768/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.094 | DEBUG    | __main__:trials:29 - Trial = 29768/30000 | Total reward = 23.20
2022-01-26 14:18:51.097 | DEBUG    | __main__:trials:26 - Trial = 29769/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.097 | DEBUG    | __main__:trials:29 - Trial = 29769/30000 | Total reward = 11.64
2022-01-26 14:18:51.099 | DEBUG    | __main__:trials:26 - Trial = 29770/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.100 | DEBUG    | __main__:trials:29 - Trial = 29770/30000 | Total reward = 7.96
2022-01-26 14:18:51.103 | DEBUG    | __main__:trials:26 - Trial = 29771/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.104 | DEBUG    | __main__:trials:29 - Trial = 29771/30000 | Total reward = 15.32
2022-01-26 14:18:51.107 | DEBUG    | __main__:trials:26 - Trial = 29772/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.108 | DEBUG    | __main__:trials:29 - Trial = 29772/30000 | Total reward = 23.64
2022-01-26 14:18:51.109 | DEBUG    | __main__:trials:26 - Trial = 29773/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.110 | DEBUG    | __main__:trials:29 - Trial = 29773/30000 | Total reward = 11.06
2022-01-26 14:18:51.113 | DEBUG    | __main__:trials:24 - Trial = 29774/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.114 | DEBUG    | __main__:trials:29 - Trial = 29774/30000 | Total reward = 13.12
2022-01-26 14:18:51.116 | DEBUG    | __main__:trials:26 - Trial = 29775/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.117 | DEBUG    | __main__:trials:29 - Trial = 29775/30000 | Total reward = 9.03
2022-01-26 14:18:51.119 | DEBUG    | __main__:trials:26 - Trial = 29776/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.120 | DEBUG    | __main__:trials:29 - Trial = 29776/30000 | Total reward = 10.11
2022-01-26 14:18:51.121 | DEBUG    | __main__:trials:26 - Trial = 29777/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.122 | DEBUG    | __main__:trials:29 - Trial = 29777/30000 | Total reward = 11.11
2022-01-26 14:18:51.124 | DEBUG    | __main__:trials:26 - Trial = 29778/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.125 | DEBUG    | __main__:trials:29 - Trial = 29778/30000 | Total reward = 9.19
2022-01-26 14:18:51.128 | DEBUG    | __main__:trials:24 - Trial = 29779/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.128 | DEBUG    | __main__:trials:29 - Trial = 29779/30000 | Total reward = 43.39
2022-01-26 14:18:51.131 | DEBUG    | __main__:trials:26 - Trial = 29780/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.132 | DEBUG    | __main__:trials:29 - Trial = 29780/30000 | Total reward = 12.14
2022-01-26 14:18:51.134 | DEBUG    | __main__:trials:26 - Trial = 29781/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.135 | DEBUG    | __main__:trials:29 - Trial = 29781/30000 | Total reward = 18.16
2022-01-26 14:18:51.137 | DEBUG    | __main__:trials:26 - Trial = 29782/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.137 | DEBUG    | __main__:trials:29 - Trial = 29782/30000 | Total reward = 10.11
2022-01-26 14:18:51.139 | DEBUG    | __main__:trials:26 - Trial = 29783/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.140 | DEBUG    | __main__:trials:29 - Trial = 29783/30000 | Total reward = 9.87
2022-01-26 14:18:51.142 | DEBUG    | __main__:trials:26 - Trial = 29784/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.143 | DEBUG    | __main__:trials:29 - Trial = 29784/30000 | Total reward = 17.48
2022-01-26 14:18:51.145 | DEBUG    | __main__:trials:26 - Trial = 29785/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.146 | DEBUG    | __main__:trials:29 - Trial = 29785/30000 | Total reward = 10.11
2022-01-26 14:18:51.150 | DEBUG    | __main__:trials:24 - Trial = 29786/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.150 | DEBUG    | __main__:trials:29 - Trial = 29786/30000 | Total reward = 33.26
2022-01-26 14:18:51.153 | DEBUG    | __main__:trials:26 - Trial = 29787/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.154 | DEBUG    | __main__:trials:29 - Trial = 29787/30000 | Total reward = 10.11
2022-01-26 14:18:51.156 | DEBUG    | __main__:trials:26 - Trial = 29788/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.158 | DEBUG    | __main__:trials:29 - Trial = 29788/30000 | Total reward = 10.11
2022-01-26 14:18:51.161 | DEBUG    | __main__:trials:26 - Trial = 29789/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.163 | DEBUG    | __main__:trials:29 - Trial = 29789/30000 | Total reward = 20.26
2022-01-26 14:18:51.166 | DEBUG    | __main__:trials:26 - Trial = 29790/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.167 | DEBUG    | __main__:trials:29 - Trial = 29790/30000 | Total reward = 20.26
2022-01-26 14:18:51.171 | DEBUG    | __main__:trials:24 - Trial = 29791/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.173 | DEBUG    | __main__:trials:29 - Trial = 29791/30000 | Total reward = 52.53
2022-01-26 14:18:51.175 | DEBUG    | __main__:trials:26 - Trial = 29792/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.176 | DEBUG    | __main__:trials:29 - Trial = 29792/30000 | Total reward = 8.43
2022-01-26 14:18:51.178 | DEBUG    | __main__:trials:26 - Trial = 29793/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.180 | DEBUG    | __main__:trials:29 - Trial = 29793/30000 | Total reward = 10.11
2022-01-26 14:18:51.183 | DEBUG    | __main__:trials:24 - Trial = 29794/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.185 | DEBUG    | __main__:trials:29 - Trial = 29794/30000 | Total reward = 44.61
2022-01-26 14:18:51.187 | DEBUG    | __main__:trials:26 - Trial = 29795/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.188 | DEBUG    | __main__:trials:29 - Trial = 29795/30000 | Total reward = 8.43
2022-01-26 14:18:51.192 | DEBUG    | __main__:trials:24 - Trial = 29796/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.193 | DEBUG    | __main__:trials:29 - Trial = 29796/30000 | Total reward = 43.40
2022-01-26 14:18:51.196 | DEBUG    | __main__:trials:26 - Trial = 29797/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.197 | DEBUG    | __main__:trials:29 - Trial = 29797/30000 | Total reward = 10.69
2022-01-26 14:18:51.199 | DEBUG    | __main__:trials:26 - Trial = 29798/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.200 | DEBUG    | __main__:trials:29 - Trial = 29798/30000 | Total reward = 11.18
2022-01-26 14:18:51.203 | DEBUG    | __main__:trials:26 - Trial = 29799/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.205 | DEBUG    | __main__:trials:29 - Trial = 29799/30000 | Total reward = 21.53
2022-01-26 14:18:51.208 | DEBUG    | __main__:trials:26 - Trial = 29800/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.209 | DEBUG    | __main__:trials:29 - Trial = 29800/30000 | Total reward = 18.71
2022-01-26 14:18:51.212 | DEBUG    | __main__:trials:26 - Trial = 29801/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.212 | DEBUG    | __main__:trials:29 - Trial = 29801/30000 | Total reward = 9.43
2022-01-26 14:18:51.215 | DEBUG    | __main__:trials:26 - Trial = 29802/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.216 | DEBUG    | __main__:trials:29 - Trial = 29802/30000 | Total reward = 13.14
2022-01-26 14:18:51.220 | DEBUG    | __main__:trials:24 - Trial = 29803/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.221 | DEBUG    | __main__:trials:29 - Trial = 29803/30000 | Total reward = 50.04
2022-01-26 14:18:51.223 | DEBUG    | __main__:trials:26 - Trial = 29804/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.225 | DEBUG    | __main__:trials:29 - Trial = 29804/30000 | Total reward = 9.11
2022-01-26 14:18:51.228 | DEBUG    | __main__:trials:26 - Trial = 29805/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.229 | DEBUG    | __main__:trials:29 - Trial = 29805/30000 | Total reward = 11.58
2022-01-26 14:18:51.231 | DEBUG    | __main__:trials:26 - Trial = 29806/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.232 | DEBUG    | __main__:trials:29 - Trial = 29806/30000 | Total reward = 10.11
2022-01-26 14:18:51.235 | DEBUG    | __main__:trials:26 - Trial = 29807/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.235 | DEBUG    | __main__:trials:29 - Trial = 29807/30000 | Total reward = 9.97
2022-01-26 14:18:51.239 | DEBUG    | __main__:trials:24 - Trial = 29808/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.241 | DEBUG    | __main__:trials:29 - Trial = 29808/30000 | Total reward = 33.83
2022-01-26 14:18:51.243 | DEBUG    | __main__:trials:26 - Trial = 29809/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.244 | DEBUG    | __main__:trials:29 - Trial = 29809/30000 | Total reward = 10.11
2022-01-26 14:18:51.248 | DEBUG    | __main__:trials:24 - Trial = 29810/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.249 | DEBUG    | __main__:trials:29 - Trial = 29810/30000 | Total reward = 38.90
2022-01-26 14:18:51.252 | DEBUG    | __main__:trials:26 - Trial = 29811/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.253 | DEBUG    | __main__:trials:29 - Trial = 29811/30000 | Total reward = 8.29
2022-01-26 14:18:51.256 | DEBUG    | __main__:trials:24 - Trial = 29812/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.258 | DEBUG    | __main__:trials:29 - Trial = 29812/30000 | Total reward = 26.70
2022-01-26 14:18:51.262 | DEBUG    | __main__:trials:24 - Trial = 29813/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.263 | DEBUG    | __main__:trials:29 - Trial = 29813/30000 | Total reward = 36.55
2022-01-26 14:18:51.267 | DEBUG    | __main__:trials:24 - Trial = 29814/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.268 | DEBUG    | __main__:trials:29 - Trial = 29814/30000 | Total reward = 39.45
2022-01-26 14:18:51.271 | DEBUG    | __main__:trials:26 - Trial = 29815/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.272 | DEBUG    | __main__:trials:29 - Trial = 29815/30000 | Total reward = 11.45
2022-01-26 14:18:51.276 | DEBUG    | __main__:trials:24 - Trial = 29816/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.277 | DEBUG    | __main__:trials:29 - Trial = 29816/30000 | Total reward = 38.93
2022-01-26 14:18:51.279 | DEBUG    | __main__:trials:26 - Trial = 29817/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.281 | DEBUG    | __main__:trials:29 - Trial = 29817/30000 | Total reward = 10.11
2022-01-26 14:18:51.284 | DEBUG    | __main__:trials:26 - Trial = 29818/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.285 | DEBUG    | __main__:trials:29 - Trial = 29818/30000 | Total reward = 15.73
2022-01-26 14:18:51.288 | DEBUG    | __main__:trials:26 - Trial = 29819/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.288 | DEBUG    | __main__:trials:29 - Trial = 29819/30000 | Total reward = 13.14
2022-01-26 14:18:51.291 | DEBUG    | __main__:trials:26 - Trial = 29820/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.293 | DEBUG    | __main__:trials:29 - Trial = 29820/30000 | Total reward = 11.45
2022-01-26 14:18:51.296 | DEBUG    | __main__:trials:24 - Trial = 29821/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.298 | DEBUG    | __main__:trials:29 - Trial = 29821/30000 | Total reward = 37.22
2022-01-26 14:18:51.302 | DEBUG    | __main__:trials:24 - Trial = 29822/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.303 | DEBUG    | __main__:trials:29 - Trial = 29822/30000 | Total reward = 35.62
2022-01-26 14:18:51.306 | DEBUG    | __main__:trials:26 - Trial = 29823/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.306 | DEBUG    | __main__:trials:29 - Trial = 29823/30000 | Total reward = 8.43
2022-01-26 14:18:51.311 | DEBUG    | __main__:trials:24 - Trial = 29824/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.313 | DEBUG    | __main__:trials:29 - Trial = 29824/30000 | Total reward = 35.40
2022-01-26 14:18:51.316 | DEBUG    | __main__:trials:24 - Trial = 29825/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.317 | DEBUG    | __main__:trials:29 - Trial = 29825/30000 | Total reward = 50.85
2022-01-26 14:18:51.320 | DEBUG    | __main__:trials:26 - Trial = 29826/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.321 | DEBUG    | __main__:trials:29 - Trial = 29826/30000 | Total reward = 10.11
2022-01-26 14:18:51.324 | DEBUG    | __main__:trials:26 - Trial = 29827/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.326 | DEBUG    | __main__:trials:29 - Trial = 29827/30000 | Total reward = 11.66
2022-01-26 14:18:51.328 | DEBUG    | __main__:trials:26 - Trial = 29828/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.330 | DEBUG    | __main__:trials:29 - Trial = 29828/30000 | Total reward = 12.35
2022-01-26 14:18:51.332 | DEBUG    | __main__:trials:26 - Trial = 29829/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.334 | DEBUG    | __main__:trials:29 - Trial = 29829/30000 | Total reward = 9.11
2022-01-26 14:18:51.336 | DEBUG    | __main__:trials:26 - Trial = 29830/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.338 | DEBUG    | __main__:trials:29 - Trial = 29830/30000 | Total reward = 15.45
2022-01-26 14:18:51.342 | DEBUG    | __main__:trials:24 - Trial = 29831/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.343 | DEBUG    | __main__:trials:29 - Trial = 29831/30000 | Total reward = 34.60
2022-01-26 14:18:51.345 | DEBUG    | __main__:trials:26 - Trial = 29832/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.347 | DEBUG    | __main__:trials:29 - Trial = 29832/30000 | Total reward = 10.11
2022-01-26 14:18:51.350 | DEBUG    | __main__:trials:24 - Trial = 29833/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.352 | DEBUG    | __main__:trials:29 - Trial = 29833/30000 | Total reward = 36.44
2022-01-26 14:18:51.355 | DEBUG    | __main__:trials:26 - Trial = 29834/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.357 | DEBUG    | __main__:trials:29 - Trial = 29834/30000 | Total reward = 24.54
2022-01-26 14:18:51.360 | DEBUG    | __main__:trials:24 - Trial = 29835/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.362 | DEBUG    | __main__:trials:29 - Trial = 29835/30000 | Total reward = 39.04
2022-01-26 14:18:51.365 | DEBUG    | __main__:trials:26 - Trial = 29836/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.367 | DEBUG    | __main__:trials:29 - Trial = 29836/30000 | Total reward = 20.81
2022-01-26 14:18:51.371 | DEBUG    | __main__:trials:24 - Trial = 29837/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.372 | DEBUG    | __main__:trials:29 - Trial = 29837/30000 | Total reward = 37.82
2022-01-26 14:18:51.375 | DEBUG    | __main__:trials:26 - Trial = 29838/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.376 | DEBUG    | __main__:trials:29 - Trial = 29838/30000 | Total reward = 14.41
2022-01-26 14:18:51.380 | DEBUG    | __main__:trials:24 - Trial = 29839/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.382 | DEBUG    | __main__:trials:29 - Trial = 29839/30000 | Total reward = 53.39
2022-01-26 14:18:51.385 | DEBUG    | __main__:trials:26 - Trial = 29840/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.385 | DEBUG    | __main__:trials:29 - Trial = 29840/30000 | Total reward = 10.11
2022-01-26 14:18:51.387 | DEBUG    | __main__:trials:26 - Trial = 29841/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.389 | DEBUG    | __main__:trials:29 - Trial = 29841/30000 | Total reward = 10.85
2022-01-26 14:18:51.392 | DEBUG    | __main__:trials:24 - Trial = 29842/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.393 | DEBUG    | __main__:trials:29 - Trial = 29842/30000 | Total reward = 45.53
2022-01-26 14:18:51.397 | DEBUG    | __main__:trials:24 - Trial = 29843/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.399 | DEBUG    | __main__:trials:29 - Trial = 29843/30000 | Total reward = 38.28
2022-01-26 14:18:51.401 | DEBUG    | __main__:trials:24 - Trial = 29844/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.403 | DEBUG    | __main__:trials:29 - Trial = 29844/30000 | Total reward = 29.19
2022-01-26 14:18:51.407 | DEBUG    | __main__:trials:24 - Trial = 29845/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.409 | DEBUG    | __main__:trials:29 - Trial = 29845/30000 | Total reward = 52.62
2022-01-26 14:18:51.411 | DEBUG    | __main__:trials:26 - Trial = 29846/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.413 | DEBUG    | __main__:trials:29 - Trial = 29846/30000 | Total reward = 11.11
2022-01-26 14:18:51.416 | DEBUG    | __main__:trials:24 - Trial = 29847/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.417 | DEBUG    | __main__:trials:29 - Trial = 29847/30000 | Total reward = 56.43
2022-01-26 14:18:51.421 | DEBUG    | __main__:trials:24 - Trial = 29848/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.423 | DEBUG    | __main__:trials:29 - Trial = 29848/30000 | Total reward = 42.86
2022-01-26 14:18:51.425 | DEBUG    | __main__:trials:26 - Trial = 29849/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.427 | DEBUG    | __main__:trials:29 - Trial = 29849/30000 | Total reward = 9.58
2022-01-26 14:18:51.428 | DEBUG    | __main__:trials:26 - Trial = 29850/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.430 | DEBUG    | __main__:trials:29 - Trial = 29850/30000 | Total reward = 10.11
2022-01-26 14:18:51.433 | DEBUG    | __main__:trials:26 - Trial = 29851/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.434 | DEBUG    | __main__:trials:29 - Trial = 29851/30000 | Total reward = 11.06
2022-01-26 14:18:51.437 | DEBUG    | __main__:trials:26 - Trial = 29852/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.438 | DEBUG    | __main__:trials:29 - Trial = 29852/30000 | Total reward = 10.63
2022-01-26 14:18:51.440 | DEBUG    | __main__:trials:26 - Trial = 29853/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.442 | DEBUG    | __main__:trials:29 - Trial = 29853/30000 | Total reward = 9.97
2022-01-26 14:18:51.445 | DEBUG    | __main__:trials:24 - Trial = 29854/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.447 | DEBUG    | __main__:trials:29 - Trial = 29854/30000 | Total reward = 39.20
2022-01-26 14:18:51.451 | DEBUG    | __main__:trials:24 - Trial = 29855/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.453 | DEBUG    | __main__:trials:29 - Trial = 29855/30000 | Total reward = 46.18
2022-01-26 14:18:51.456 | DEBUG    | __main__:trials:26 - Trial = 29856/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.457 | DEBUG    | __main__:trials:29 - Trial = 29856/30000 | Total reward = 11.35
2022-01-26 14:18:51.460 | DEBUG    | __main__:trials:26 - Trial = 29857/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.461 | DEBUG    | __main__:trials:29 - Trial = 29857/30000 | Total reward = 14.13
2022-01-26 14:18:51.464 | DEBUG    | __main__:trials:24 - Trial = 29858/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.466 | DEBUG    | __main__:trials:29 - Trial = 29858/30000 | Total reward = 44.76
2022-01-26 14:18:51.470 | DEBUG    | __main__:trials:24 - Trial = 29859/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.471 | DEBUG    | __main__:trials:29 - Trial = 29859/30000 | Total reward = 39.10
2022-01-26 14:18:51.475 | DEBUG    | __main__:trials:24 - Trial = 29860/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.476 | DEBUG    | __main__:trials:29 - Trial = 29860/30000 | Total reward = 53.71
2022-01-26 14:18:51.479 | DEBUG    | __main__:trials:26 - Trial = 29861/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.479 | DEBUG    | __main__:trials:29 - Trial = 29861/30000 | Total reward = 6.81
2022-01-26 14:18:51.483 | DEBUG    | __main__:trials:26 - Trial = 29862/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.484 | DEBUG    | __main__:trials:29 - Trial = 29862/30000 | Total reward = 15.71
2022-01-26 14:18:51.488 | DEBUG    | __main__:trials:24 - Trial = 29863/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.489 | DEBUG    | __main__:trials:29 - Trial = 29863/30000 | Total reward = 25.57
2022-01-26 14:18:51.492 | DEBUG    | __main__:trials:24 - Trial = 29864/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.494 | DEBUG    | __main__:trials:29 - Trial = 29864/30000 | Total reward = 38.82
2022-01-26 14:18:51.496 | DEBUG    | __main__:trials:26 - Trial = 29865/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.498 | DEBUG    | __main__:trials:29 - Trial = 29865/30000 | Total reward = 8.43
2022-01-26 14:18:51.500 | DEBUG    | __main__:trials:26 - Trial = 29866/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.502 | DEBUG    | __main__:trials:29 - Trial = 29866/30000 | Total reward = 11.11
2022-01-26 14:18:51.505 | DEBUG    | __main__:trials:24 - Trial = 29867/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.507 | DEBUG    | __main__:trials:29 - Trial = 29867/30000 | Total reward = 41.80
2022-01-26 14:18:51.510 | DEBUG    | __main__:trials:26 - Trial = 29868/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.511 | DEBUG    | __main__:trials:29 - Trial = 29868/30000 | Total reward = 9.43
2022-01-26 14:18:51.514 | DEBUG    | __main__:trials:26 - Trial = 29869/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.515 | DEBUG    | __main__:trials:29 - Trial = 29869/30000 | Total reward = 11.35
2022-01-26 14:18:51.518 | DEBUG    | __main__:trials:26 - Trial = 29870/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.519 | DEBUG    | __main__:trials:29 - Trial = 29870/30000 | Total reward = 9.43
2022-01-26 14:18:51.523 | DEBUG    | __main__:trials:26 - Trial = 29871/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.526 | DEBUG    | __main__:trials:29 - Trial = 29871/30000 | Total reward = 25.86
2022-01-26 14:18:51.528 | DEBUG    | __main__:trials:26 - Trial = 29872/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.529 | DEBUG    | __main__:trials:29 - Trial = 29872/30000 | Total reward = 10.11
2022-01-26 14:18:51.532 | DEBUG    | __main__:trials:26 - Trial = 29873/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.533 | DEBUG    | __main__:trials:29 - Trial = 29873/30000 | Total reward = 10.11
2022-01-26 14:18:51.537 | DEBUG    | __main__:trials:24 - Trial = 29874/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.539 | DEBUG    | __main__:trials:29 - Trial = 29874/30000 | Total reward = 32.35
2022-01-26 14:18:51.542 | DEBUG    | __main__:trials:24 - Trial = 29875/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.544 | DEBUG    | __main__:trials:29 - Trial = 29875/30000 | Total reward = 27.53
2022-01-26 14:18:51.546 | DEBUG    | __main__:trials:26 - Trial = 29876/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.547 | DEBUG    | __main__:trials:29 - Trial = 29876/30000 | Total reward = 7.81
2022-01-26 14:18:51.549 | DEBUG    | __main__:trials:26 - Trial = 29877/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.550 | DEBUG    | __main__:trials:29 - Trial = 29877/30000 | Total reward = 11.45
2022-01-26 14:18:51.552 | DEBUG    | __main__:trials:26 - Trial = 29878/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.554 | DEBUG    | __main__:trials:29 - Trial = 29878/30000 | Total reward = 11.78
2022-01-26 14:18:51.556 | DEBUG    | __main__:trials:26 - Trial = 29879/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.558 | DEBUG    | __main__:trials:29 - Trial = 29879/30000 | Total reward = 9.43
2022-01-26 14:18:51.560 | DEBUG    | __main__:trials:26 - Trial = 29880/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.562 | DEBUG    | __main__:trials:29 - Trial = 29880/30000 | Total reward = 11.14
2022-01-26 14:18:51.564 | DEBUG    | __main__:trials:26 - Trial = 29881/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.566 | DEBUG    | __main__:trials:29 - Trial = 29881/30000 | Total reward = 11.18
2022-01-26 14:18:51.570 | DEBUG    | __main__:trials:24 - Trial = 29882/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.571 | DEBUG    | __main__:trials:29 - Trial = 29882/30000 | Total reward = 39.18
2022-01-26 14:18:51.575 | DEBUG    | __main__:trials:24 - Trial = 29883/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.577 | DEBUG    | __main__:trials:29 - Trial = 29883/30000 | Total reward = 33.84
2022-01-26 14:18:51.579 | DEBUG    | __main__:trials:26 - Trial = 29884/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.580 | DEBUG    | __main__:trials:29 - Trial = 29884/30000 | Total reward = 10.11
2022-01-26 14:18:51.584 | DEBUG    | __main__:trials:24 - Trial = 29885/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.585 | DEBUG    | __main__:trials:29 - Trial = 29885/30000 | Total reward = 35.16
2022-01-26 14:18:51.588 | DEBUG    | __main__:trials:24 - Trial = 29886/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.590 | DEBUG    | __main__:trials:29 - Trial = 29886/30000 | Total reward = 41.00
2022-01-26 14:18:51.593 | DEBUG    | __main__:trials:26 - Trial = 29887/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.594 | DEBUG    | __main__:trials:29 - Trial = 29887/30000 | Total reward = 9.11
2022-01-26 14:18:51.596 | DEBUG    | __main__:trials:26 - Trial = 29888/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.598 | DEBUG    | __main__:trials:29 - Trial = 29888/30000 | Total reward = 11.35
2022-01-26 14:18:51.601 | DEBUG    | __main__:trials:26 - Trial = 29889/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.602 | DEBUG    | __main__:trials:29 - Trial = 29889/30000 | Total reward = 14.43
2022-01-26 14:18:51.604 | DEBUG    | __main__:trials:26 - Trial = 29890/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.606 | DEBUG    | __main__:trials:29 - Trial = 29890/30000 | Total reward = 10.11
2022-01-26 14:18:51.608 | DEBUG    | __main__:trials:26 - Trial = 29891/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.609 | DEBUG    | __main__:trials:29 - Trial = 29891/30000 | Total reward = 13.29
2022-01-26 14:18:51.612 | DEBUG    | __main__:trials:26 - Trial = 29892/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.614 | DEBUG    | __main__:trials:29 - Trial = 29892/30000 | Total reward = 9.64
2022-01-26 14:18:51.617 | DEBUG    | __main__:trials:24 - Trial = 29893/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.618 | DEBUG    | __main__:trials:29 - Trial = 29893/30000 | Total reward = 53.05
2022-01-26 14:18:51.620 | DEBUG    | __main__:trials:26 - Trial = 29894/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.621 | DEBUG    | __main__:trials:29 - Trial = 29894/30000 | Total reward = 10.11
2022-01-26 14:18:51.623 | DEBUG    | __main__:trials:26 - Trial = 29895/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.625 | DEBUG    | __main__:trials:29 - Trial = 29895/30000 | Total reward = 12.57
2022-01-26 14:18:51.628 | DEBUG    | __main__:trials:24 - Trial = 29896/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.629 | DEBUG    | __main__:trials:29 - Trial = 29896/30000 | Total reward = 25.66
2022-01-26 14:18:51.631 | DEBUG    | __main__:trials:26 - Trial = 29897/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.632 | DEBUG    | __main__:trials:29 - Trial = 29897/30000 | Total reward = 10.11
2022-01-26 14:18:51.634 | DEBUG    | __main__:trials:26 - Trial = 29898/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.636 | DEBUG    | __main__:trials:29 - Trial = 29898/30000 | Total reward = 10.52
2022-01-26 14:18:51.639 | DEBUG    | __main__:trials:24 - Trial = 29899/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.641 | DEBUG    | __main__:trials:29 - Trial = 29899/30000 | Total reward = 53.78
2022-01-26 14:18:51.644 | DEBUG    | __main__:trials:24 - Trial = 29900/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.646 | DEBUG    | __main__:trials:29 - Trial = 29900/30000 | Total reward = 61.02
2022-01-26 14:18:51.649 | DEBUG    | __main__:trials:24 - Trial = 29901/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.650 | DEBUG    | __main__:trials:29 - Trial = 29901/30000 | Total reward = 50.15
2022-01-26 14:18:51.653 | DEBUG    | __main__:trials:24 - Trial = 29902/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.655 | DEBUG    | __main__:trials:29 - Trial = 29902/30000 | Total reward = 38.78
2022-01-26 14:18:51.657 | DEBUG    | __main__:trials:26 - Trial = 29903/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.659 | DEBUG    | __main__:trials:29 - Trial = 29903/30000 | Total reward = 10.11
2022-01-26 14:18:51.662 | DEBUG    | __main__:trials:24 - Trial = 29904/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.664 | DEBUG    | __main__:trials:29 - Trial = 29904/30000 | Total reward = 42.18
2022-01-26 14:18:51.668 | DEBUG    | __main__:trials:26 - Trial = 29905/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.669 | DEBUG    | __main__:trials:29 - Trial = 29905/30000 | Total reward = 27.82
2022-01-26 14:18:51.672 | DEBUG    | __main__:trials:26 - Trial = 29906/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.673 | DEBUG    | __main__:trials:29 - Trial = 29906/30000 | Total reward = 7.43
2022-01-26 14:18:51.676 | DEBUG    | __main__:trials:26 - Trial = 29907/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.676 | DEBUG    | __main__:trials:29 - Trial = 29907/30000 | Total reward = 10.63
2022-01-26 14:18:51.680 | DEBUG    | __main__:trials:24 - Trial = 29908/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.682 | DEBUG    | __main__:trials:29 - Trial = 29908/30000 | Total reward = 38.70
2022-01-26 14:18:51.684 | DEBUG    | __main__:trials:26 - Trial = 29909/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.686 | DEBUG    | __main__:trials:29 - Trial = 29909/30000 | Total reward = 9.43
2022-01-26 14:18:51.689 | DEBUG    | __main__:trials:26 - Trial = 29910/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.690 | DEBUG    | __main__:trials:29 - Trial = 29910/30000 | Total reward = 10.11
2022-01-26 14:18:51.693 | DEBUG    | __main__:trials:26 - Trial = 29911/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.694 | DEBUG    | __main__:trials:29 - Trial = 29911/30000 | Total reward = 9.11
2022-01-26 14:18:51.697 | DEBUG    | __main__:trials:26 - Trial = 29912/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.698 | DEBUG    | __main__:trials:29 - Trial = 29912/30000 | Total reward = 10.11
2022-01-26 14:18:51.701 | DEBUG    | __main__:trials:26 - Trial = 29913/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.702 | DEBUG    | __main__:trials:29 - Trial = 29913/30000 | Total reward = 9.97
2022-01-26 14:18:51.706 | DEBUG    | __main__:trials:24 - Trial = 29914/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.707 | DEBUG    | __main__:trials:29 - Trial = 29914/30000 | Total reward = 28.14
2022-01-26 14:18:51.710 | DEBUG    | __main__:trials:24 - Trial = 29915/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.712 | DEBUG    | __main__:trials:29 - Trial = 29915/30000 | Total reward = 62.08
2022-01-26 14:18:51.716 | DEBUG    | __main__:trials:24 - Trial = 29916/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.718 | DEBUG    | __main__:trials:29 - Trial = 29916/30000 | Total reward = 50.76
2022-01-26 14:18:51.721 | DEBUG    | __main__:trials:24 - Trial = 29917/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.723 | DEBUG    | __main__:trials:29 - Trial = 29917/30000 | Total reward = 35.56
2022-01-26 14:18:51.727 | DEBUG    | __main__:trials:24 - Trial = 29918/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.729 | DEBUG    | __main__:trials:29 - Trial = 29918/30000 | Total reward = 38.54
2022-01-26 14:18:51.732 | DEBUG    | __main__:trials:24 - Trial = 29919/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.734 | DEBUG    | __main__:trials:29 - Trial = 29919/30000 | Total reward = 34.94
2022-01-26 14:18:51.738 | DEBUG    | __main__:trials:24 - Trial = 29920/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.740 | DEBUG    | __main__:trials:29 - Trial = 29920/30000 | Total reward = 37.48
2022-01-26 14:18:51.743 | DEBUG    | __main__:trials:24 - Trial = 29921/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.745 | DEBUG    | __main__:trials:29 - Trial = 29921/30000 | Total reward = 36.17
2022-01-26 14:18:51.747 | DEBUG    | __main__:trials:26 - Trial = 29922/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.748 | DEBUG    | __main__:trials:29 - Trial = 29922/30000 | Total reward = 11.78
2022-01-26 14:18:51.752 | DEBUG    | __main__:trials:24 - Trial = 29923/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.754 | DEBUG    | __main__:trials:29 - Trial = 29923/30000 | Total reward = 39.02
2022-01-26 14:18:51.758 | DEBUG    | __main__:trials:24 - Trial = 29924/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.759 | DEBUG    | __main__:trials:29 - Trial = 29924/30000 | Total reward = 54.40
2022-01-26 14:18:51.763 | DEBUG    | __main__:trials:24 - Trial = 29925/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.765 | DEBUG    | __main__:trials:29 - Trial = 29925/30000 | Total reward = 38.85
2022-01-26 14:18:51.769 | DEBUG    | __main__:trials:24 - Trial = 29926/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.770 | DEBUG    | __main__:trials:29 - Trial = 29926/30000 | Total reward = 37.06
2022-01-26 14:18:51.774 | DEBUG    | __main__:trials:24 - Trial = 29927/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.775 | DEBUG    | __main__:trials:29 - Trial = 29927/30000 | Total reward = 48.55
2022-01-26 14:18:51.779 | DEBUG    | __main__:trials:24 - Trial = 29928/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.781 | DEBUG    | __main__:trials:29 - Trial = 29928/30000 | Total reward = 31.59
2022-01-26 14:18:51.784 | DEBUG    | __main__:trials:24 - Trial = 29929/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.785 | DEBUG    | __main__:trials:29 - Trial = 29929/30000 | Total reward = 44.79
2022-01-26 14:18:51.789 | DEBUG    | __main__:trials:24 - Trial = 29930/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.791 | DEBUG    | __main__:trials:29 - Trial = 29930/30000 | Total reward = 42.83
2022-01-26 14:18:51.796 | DEBUG    | __main__:trials:24 - Trial = 29931/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.797 | DEBUG    | __main__:trials:29 - Trial = 29931/30000 | Total reward = 37.33
2022-01-26 14:18:51.801 | DEBUG    | __main__:trials:24 - Trial = 29932/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.803 | DEBUG    | __main__:trials:29 - Trial = 29932/30000 | Total reward = 23.93
2022-01-26 14:18:51.806 | DEBUG    | __main__:trials:24 - Trial = 29933/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.808 | DEBUG    | __main__:trials:29 - Trial = 29933/30000 | Total reward = 35.95
2022-01-26 14:18:51.811 | DEBUG    | __main__:trials:26 - Trial = 29934/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.813 | DEBUG    | __main__:trials:29 - Trial = 29934/30000 | Total reward = 24.62
2022-01-26 14:18:51.815 | DEBUG    | __main__:trials:26 - Trial = 29935/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.817 | DEBUG    | __main__:trials:29 - Trial = 29935/30000 | Total reward = 16.06
2022-01-26 14:18:51.821 | DEBUG    | __main__:trials:24 - Trial = 29936/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.822 | DEBUG    | __main__:trials:29 - Trial = 29936/30000 | Total reward = 38.52
2022-01-26 14:18:51.826 | DEBUG    | __main__:trials:24 - Trial = 29937/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.828 | DEBUG    | __main__:trials:29 - Trial = 29937/30000 | Total reward = 38.80
2022-01-26 14:18:51.830 | DEBUG    | __main__:trials:24 - Trial = 29938/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.833 | DEBUG    | __main__:trials:29 - Trial = 29938/30000 | Total reward = 37.82
2022-01-26 14:18:51.836 | DEBUG    | __main__:trials:24 - Trial = 29939/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.838 | DEBUG    | __main__:trials:29 - Trial = 29939/30000 | Total reward = 38.97
2022-01-26 14:18:51.842 | DEBUG    | __main__:trials:24 - Trial = 29940/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.843 | DEBUG    | __main__:trials:29 - Trial = 29940/30000 | Total reward = 38.90
2022-01-26 14:18:51.847 | DEBUG    | __main__:trials:24 - Trial = 29941/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.849 | DEBUG    | __main__:trials:29 - Trial = 29941/30000 | Total reward = 32.63
2022-01-26 14:18:51.853 | DEBUG    | __main__:trials:26 - Trial = 29942/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.854 | DEBUG    | __main__:trials:29 - Trial = 29942/30000 | Total reward = 21.92
2022-01-26 14:18:51.857 | DEBUG    | __main__:trials:24 - Trial = 29943/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.859 | DEBUG    | __main__:trials:29 - Trial = 29943/30000 | Total reward = 31.03
2022-01-26 14:18:51.862 | DEBUG    | __main__:trials:26 - Trial = 29944/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.863 | DEBUG    | __main__:trials:29 - Trial = 29944/30000 | Total reward = 9.43
2022-01-26 14:18:51.865 | DEBUG    | __main__:trials:26 - Trial = 29945/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.866 | DEBUG    | __main__:trials:29 - Trial = 29945/30000 | Total reward = 12.35
2022-01-26 14:18:51.868 | DEBUG    | __main__:trials:26 - Trial = 29946/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.870 | DEBUG    | __main__:trials:29 - Trial = 29946/30000 | Total reward = 17.61
2022-01-26 14:18:51.872 | DEBUG    | __main__:trials:26 - Trial = 29947/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.872 | DEBUG    | __main__:trials:29 - Trial = 29947/30000 | Total reward = 11.11
2022-01-26 14:18:51.876 | DEBUG    | __main__:trials:26 - Trial = 29948/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.876 | DEBUG    | __main__:trials:29 - Trial = 29948/30000 | Total reward = 22.89
2022-01-26 14:18:51.879 | DEBUG    | __main__:trials:26 - Trial = 29949/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.880 | DEBUG    | __main__:trials:29 - Trial = 29949/30000 | Total reward = 11.45
2022-01-26 14:18:51.883 | DEBUG    | __main__:trials:26 - Trial = 29950/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.885 | DEBUG    | __main__:trials:29 - Trial = 29950/30000 | Total reward = 14.34
2022-01-26 14:18:51.888 | DEBUG    | __main__:trials:24 - Trial = 29951/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.890 | DEBUG    | __main__:trials:29 - Trial = 29951/30000 | Total reward = 32.86
2022-01-26 14:18:51.893 | DEBUG    | __main__:trials:26 - Trial = 29952/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.894 | DEBUG    | __main__:trials:29 - Trial = 29952/30000 | Total reward = 10.11
2022-01-26 14:18:51.897 | DEBUG    | __main__:trials:26 - Trial = 29953/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.897 | DEBUG    | __main__:trials:29 - Trial = 29953/30000 | Total reward = 9.58
2022-01-26 14:18:51.900 | DEBUG    | __main__:trials:26 - Trial = 29954/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.901 | DEBUG    | __main__:trials:29 - Trial = 29954/30000 | Total reward = 10.11
2022-01-26 14:18:51.904 | DEBUG    | __main__:trials:26 - Trial = 29955/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.906 | DEBUG    | __main__:trials:29 - Trial = 29955/30000 | Total reward = 7.97
2022-01-26 14:18:51.908 | DEBUG    | __main__:trials:26 - Trial = 29956/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.910 | DEBUG    | __main__:trials:29 - Trial = 29956/30000 | Total reward = 8.58
2022-01-26 14:18:51.912 | DEBUG    | __main__:trials:26 - Trial = 29957/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.914 | DEBUG    | __main__:trials:29 - Trial = 29957/30000 | Total reward = 9.03
2022-01-26 14:18:51.916 | DEBUG    | __main__:trials:26 - Trial = 29958/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.917 | DEBUG    | __main__:trials:29 - Trial = 29958/30000 | Total reward = 10.11
2022-01-26 14:18:51.920 | DEBUG    | __main__:trials:26 - Trial = 29959/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.922 | DEBUG    | __main__:trials:29 - Trial = 29959/30000 | Total reward = 13.82
2022-01-26 14:18:51.924 | DEBUG    | __main__:trials:26 - Trial = 29960/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.926 | DEBUG    | __main__:trials:29 - Trial = 29960/30000 | Total reward = 13.40
2022-01-26 14:18:51.930 | DEBUG    | __main__:trials:24 - Trial = 29961/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.931 | DEBUG    | __main__:trials:29 - Trial = 29961/30000 | Total reward = 40.46
2022-01-26 14:18:51.935 | DEBUG    | __main__:trials:24 - Trial = 29962/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.937 | DEBUG    | __main__:trials:29 - Trial = 29962/30000 | Total reward = 27.40
2022-01-26 14:18:51.940 | DEBUG    | __main__:trials:26 - Trial = 29963/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.941 | DEBUG    | __main__:trials:29 - Trial = 29963/30000 | Total reward = 9.11
2022-01-26 14:18:51.943 | DEBUG    | __main__:trials:26 - Trial = 29964/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.945 | DEBUG    | __main__:trials:29 - Trial = 29964/30000 | Total reward = 11.06
2022-01-26 14:18:51.947 | DEBUG    | __main__:trials:26 - Trial = 29965/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.949 | DEBUG    | __main__:trials:29 - Trial = 29965/30000 | Total reward = 10.11
2022-01-26 14:18:51.952 | DEBUG    | __main__:trials:26 - Trial = 29966/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.953 | DEBUG    | __main__:trials:29 - Trial = 29966/30000 | Total reward = 22.18
2022-01-26 14:18:51.955 | DEBUG    | __main__:trials:26 - Trial = 29967/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.957 | DEBUG    | __main__:trials:29 - Trial = 29967/30000 | Total reward = 10.11
2022-01-26 14:18:51.960 | DEBUG    | __main__:trials:24 - Trial = 29968/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.961 | DEBUG    | __main__:trials:29 - Trial = 29968/30000 | Total reward = 43.24
2022-01-26 14:18:51.964 | DEBUG    | __main__:trials:26 - Trial = 29969/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.965 | DEBUG    | __main__:trials:29 - Trial = 29969/30000 | Total reward = 14.61
2022-01-26 14:18:51.967 | DEBUG    | __main__:trials:26 - Trial = 29970/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.967 | DEBUG    | __main__:trials:29 - Trial = 29970/30000 | Total reward = 8.43
2022-01-26 14:18:51.970 | DEBUG    | __main__:trials:26 - Trial = 29971/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.970 | DEBUG    | __main__:trials:29 - Trial = 29971/30000 | Total reward = 11.35
2022-01-26 14:18:51.974 | DEBUG    | __main__:trials:26 - Trial = 29972/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.976 | DEBUG    | __main__:trials:29 - Trial = 29972/30000 | Total reward = 15.19
2022-01-26 14:18:51.977 | DEBUG    | __main__:trials:26 - Trial = 29973/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.979 | DEBUG    | __main__:trials:29 - Trial = 29973/30000 | Total reward = 10.11
2022-01-26 14:18:51.982 | DEBUG    | __main__:trials:26 - Trial = 29974/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.984 | DEBUG    | __main__:trials:29 - Trial = 29974/30000 | Total reward = 10.11
2022-01-26 14:18:51.986 | DEBUG    | __main__:trials:26 - Trial = 29975/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:51.988 | DEBUG    | __main__:trials:29 - Trial = 29975/30000 | Total reward = 7.96
2022-01-26 14:18:51.992 | DEBUG    | __main__:trials:24 - Trial = 29976/30000 | Max number of steps (20) reached
2022-01-26 14:18:51.993 | DEBUG    | __main__:trials:29 - Trial = 29976/30000 | Total reward = 39.39
2022-01-26 14:18:51.998 | DEBUG    | __main__:trials:24 - Trial = 29977/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.000 | DEBUG    | __main__:trials:29 - Trial = 29977/30000 | Total reward = 27.81
2022-01-26 14:18:52.004 | DEBUG    | __main__:trials:24 - Trial = 29978/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.005 | DEBUG    | __main__:trials:29 - Trial = 29978/30000 | Total reward = 40.05
2022-01-26 14:18:52.009 | DEBUG    | __main__:trials:24 - Trial = 29979/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.010 | DEBUG    | __main__:trials:29 - Trial = 29979/30000 | Total reward = 36.87
2022-01-26 14:18:52.014 | DEBUG    | __main__:trials:24 - Trial = 29980/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.016 | DEBUG    | __main__:trials:29 - Trial = 29980/30000 | Total reward = 40.53
2022-01-26 14:18:52.019 | DEBUG    | __main__:trials:24 - Trial = 29981/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.021 | DEBUG    | __main__:trials:29 - Trial = 29981/30000 | Total reward = 38.98
2022-01-26 14:18:52.025 | DEBUG    | __main__:trials:24 - Trial = 29982/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.026 | DEBUG    | __main__:trials:29 - Trial = 29982/30000 | Total reward = 39.46
2022-01-26 14:18:52.029 | DEBUG    | __main__:trials:24 - Trial = 29983/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.031 | DEBUG    | __main__:trials:29 - Trial = 29983/30000 | Total reward = 38.07
2022-01-26 14:18:52.035 | DEBUG    | __main__:trials:24 - Trial = 29984/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.036 | DEBUG    | __main__:trials:29 - Trial = 29984/30000 | Total reward = 40.89
2022-01-26 14:18:52.040 | DEBUG    | __main__:trials:24 - Trial = 29985/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.041 | DEBUG    | __main__:trials:29 - Trial = 29985/30000 | Total reward = 60.29
2022-01-26 14:18:52.045 | DEBUG    | __main__:trials:26 - Trial = 29986/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:52.045 | DEBUG    | __main__:trials:29 - Trial = 29986/30000 | Total reward = 11.06
2022-01-26 14:18:52.049 | DEBUG    | __main__:trials:24 - Trial = 29987/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.050 | DEBUG    | __main__:trials:29 - Trial = 29987/30000 | Total reward = 38.77
2022-01-26 14:18:52.054 | DEBUG    | __main__:trials:24 - Trial = 29988/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.056 | DEBUG    | __main__:trials:29 - Trial = 29988/30000 | Total reward = 37.79
2022-01-26 14:18:52.059 | DEBUG    | __main__:trials:24 - Trial = 29989/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.061 | DEBUG    | __main__:trials:29 - Trial = 29989/30000 | Total reward = 38.45
2022-01-26 14:18:52.064 | DEBUG    | __main__:trials:26 - Trial = 29990/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:52.065 | DEBUG    | __main__:trials:29 - Trial = 29990/30000 | Total reward = 19.08
2022-01-26 14:18:52.069 | DEBUG    | __main__:trials:24 - Trial = 29991/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.071 | DEBUG    | __main__:trials:29 - Trial = 29991/30000 | Total reward = 48.41
2022-01-26 14:18:52.073 | DEBUG    | __main__:trials:26 - Trial = 29992/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:52.074 | DEBUG    | __main__:trials:29 - Trial = 29992/30000 | Total reward = 15.99
2022-01-26 14:18:52.077 | DEBUG    | __main__:trials:24 - Trial = 29993/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.078 | DEBUG    | __main__:trials:29 - Trial = 29993/30000 | Total reward = 29.14
2022-01-26 14:18:52.082 | DEBUG    | __main__:trials:24 - Trial = 29994/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.082 | DEBUG    | __main__:trials:29 - Trial = 29994/30000 | Total reward = 38.77
2022-01-26 14:18:52.086 | DEBUG    | __main__:trials:24 - Trial = 29995/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.088 | DEBUG    | __main__:trials:29 - Trial = 29995/30000 | Total reward = 38.90
2022-01-26 14:18:52.090 | DEBUG    | __main__:trials:26 - Trial = 29996/30000 | Agent went out of bounds, resetting
2022-01-26 14:18:52.092 | DEBUG    | __main__:trials:29 - Trial = 29996/30000 | Total reward = 18.57
2022-01-26 14:18:52.095 | DEBUG    | __main__:trials:24 - Trial = 29997/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.097 | DEBUG    | __main__:trials:29 - Trial = 29997/30000 | Total reward = 37.77
2022-01-26 14:18:52.100 | DEBUG    | __main__:trials:24 - Trial = 29998/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.101 | DEBUG    | __main__:trials:29 - Trial = 29998/30000 | Total reward = 34.02
2022-01-26 14:18:52.105 | DEBUG    | __main__:trials:24 - Trial = 29999/30000 | Max number of steps (20) reached
2022-01-26 14:18:52.106 | DEBUG    | __main__:trials:29 - Trial = 29999/30000 | Total reward = 53.66
2022-01-26 14:18:52.605 | INFO     | __main__:plot:30 - Number of steps: 20
2022-01-26 14:18:52.607 | INFO     | __main__:plot:31 - Number of trials: 30000
../_images/examples_Hex_Q-Learning_8_1.png